NotificationsYou must be signed in to change notification settings
Fork506
Star5.4k

Commit b4b4fea

authored

Add efficientdet models (#67)

* add effdet check
* Add effdet models and catalogs
* clean-up
* register effdet models
* Add generalized image type support for layout models
* Add effdet tests
* Update reqs

1 parent 9b73ff1 · commit b4b4fea · Copy full SHA for b4b4fea

File tree

12 files changed

+402

-24

lines changed

dev-requirements.txt
setup.py
src/layoutparser
- __init__.py
- file_utils.py
- models
  - __init__.py
  - base_layoutmodel.py
  - detectron2
    - layoutmodel.py
  - effdet
  - paddledetection
    - layoutmodel.py
tests
- test_model.py

12 files changed

+402

-24

lines changed

`‎dev-requirements.txt`

Lines changed: 3 additions & 1 deletion

Original file line number	Diff line number	Diff line change
`@@ -1,4 +1,5 @@`
`1`	`1`	`pytest`
	`2`	`+torch`
`2`	`3`	`numpy`
`3`	`4`	`opencv-python`
`4`	`5`	`pandas`
`@@ -11,4 +12,5 @@ google-cloud-vision==1`
`11`	`12`	`pytesseract`
`12`	`13`	`pycocotools`
`13`	`14`	`git+https://github.com/facebookresearch/detectron2.git@v0.4#egg=detectron2`
`14`		`-paddlepaddle`
	`15`	`+paddlepaddle`
	`16`	`+effdet`

`‎setup.py`

Lines changed: 4 additions & 1 deletion

Original file line number	Diff line number	Diff line change
`@@ -24,7 +24,6 @@`
`24`	`24`	`"pandas",`
`25`	`25`	`"pillow",`
`26`	`26`	`"pyyaml>=5.1",`
`27`		`-"torch",`
`28`	`27`	`"torchvision",`
`29`	`28`	`"iopath",`
`30`	`29`	`],`
`@@ -33,6 +32,10 @@`
`33`	`32`	`'google-cloud-vision==1',`
`34`	`33`	`'pytesseract'`
`35`	`34`	`],`
	`35`	`+"effdet": [`
	`36`	`+"torch",`
	`37`	`+"effdet"`
	`38`	`+ ]`
`36`	`39`	`},`
`37`	`40`	`include_package_data=True`
`38`	`41`	`)`

`‎src/layoutparser/__init__.py`

Lines changed: 4 additions & 0 deletions

Original file line number	Diff line number	Diff line change
`@@ -6,6 +6,7 @@`
`6`	`6`	`_LazyModule,`
`7`	`7`	`is_detectron2_available,`
`8`	`8`	`is_paddle_available,`
	`9`	`+is_effdet_available,`
`9`	`10`	`is_pytesseract_available,`
`10`	`11`	`is_gcv_available,`
`11`	`12`	`)`
`@@ -45,6 +46,9 @@`
`45`	`46`	`ifis_paddle_available():`
`46`	`47`	`_import_structure["models.paddledetection"]= ["PaddleDetectionLayoutModel"]`
`47`	`48`
	`49`	`+ifis_effdet_available():`
	`50`	`+_import_structure["models.effdet"]= ["EfficientDetLayoutModel"]`
	`51`	`+`
`48`	`52`	`ifis_pytesseract_available():`
`49`	`53`	`_import_structure["ocr.tesseract_agent"]= [`
`50`	`54`	`"TesseractAgent",`

`‎src/layoutparser/file_utils.py`

Lines changed: 22 additions & 5 deletions

Original file line number	Diff line number	Diff line change
`@@ -39,11 +39,18 @@`
`39`	`39`	`# The name of the paddlepaddle library:`
`40`	`40`	`# Install name: pip install paddlepaddle`
`41`	`41`	`# Import name: import paddle`
`42`		`-_paddle_version=importlib_metadata.version("paddlepaddle")`
	`42`	`+_paddle_version=importlib_metadata.version("paddlepaddle")`
`43`	`43`	`logger.debug(f"Paddle version{_paddle_version} available.")`
`44`	`44`	`exceptimportlib_metadata.PackageNotFoundError:`
`45`	`45`	`_paddle_available=False`
`46`	`46`
	`47`	`+_effdet_available=importlib.util.find_spec("effdet")isnotNone`
	`48`	`+try:`
	`49`	`+_effdet_version=importlib_metadata.version("effdet")`
	`50`	`+logger.debug(f"Effdet version{_effdet_version} available.")`
	`51`	`+exceptimportlib_metadata.PackageNotFoundError:`
	`52`	`+_effdet_version=False`
	`53`	`+`
`47`	`54`	`###########################################`
`48`	`55`	`############## OCR Tool Deps ##############`
`49`	`56`	`###########################################`
`@@ -78,12 +85,16 @@ def is_torch_cuda_available():`
`78`	`85`	`returnFalse`
`79`	`86`
`80`	`87`
	`88`	`+defis_detectron2_available():`
	`89`	`+return_detectron2_available`
	`90`	`+`
	`91`	`+`
`81`	`92`	`defis_paddle_available():`
`82`	`93`	`return_paddle_available`
`83`	`94`
`84`	`95`
`85`		`-defis_detectron2_available():`
`86`		`-return_detectron2_available`
	`96`	`+defis_effdet_available():`
	`97`	`+return_effdet_available`
`87`	`98`
`88`	`99`
`89`	`100`	`defis_pytesseract_available():`
`@@ -111,6 +122,11 @@ def is_gcv_available():`
`111`	`122`	`installation page: https://github.com/PaddlePaddle/Paddle and follow the ones that match your environment.`
`112`	`123`	`"""`
`113`	`124`
	`125`	`+EFFDET_IMPORT_ERROR="""`
	`126`	`+{0} requires the effdet library but it was not found in your environment. You can install it with pip:`
	`127`	+`pip install effdet`
	`128`	`+"""`
	`129`	`+`
`114`	`130`	`PYTESSERACT_IMPORT_ERROR="""`
`115`	`131`	`{0} requires the PyTesseract library but it was not found in your environment. You can install it with pip:`
`116`	`132`	`pip install pytesseract`
`@@ -126,6 +142,7 @@ def is_gcv_available():`
`126`	`142`	`("torch", (is_torch_available,PYTORCH_IMPORT_ERROR)),`
`127`	`143`	`("detectron2", (is_detectron2_available,DETECTRON2_IMPORT_ERROR)),`
`128`	`144`	`("paddle", (is_paddle_available,PADDLE_IMPORT_ERROR)),`
	`145`	`+ ("effdet", (is_effdet_available, )),`
`129`	`146`	`("pytesseract", (is_pytesseract_available,PYTESSERACT_IMPORT_ERROR)),`
`130`	`147`	`("google-cloud-vision", (is_gcv_available,GCV_IMPORT_ERROR)),`
`131`	`148`	`]`
`@@ -172,7 +189,7 @@ def __init__(`
`172`	`189`	`self._import_structure=import_structure`
`173`	`190`
`174`	`191`	`# Following [PEP 366](https://www.python.org/dev/peps/pep-0366/)`
`175`		`-# The __package__ variable should be set`
	`192`	`+# The __package__ variable should be set`
`176`	`193`	`# https://docs.python.org/3/reference/import.html#__package__`
`177`	`194`	`self.__package__=self.__name__`
`178`	`195`
`@@ -198,4 +215,4 @@ def _get_module(self, module_name: str):`
`198`	`215`	`returnimportlib.import_module("."+module_name,self.__name__)`
`199`	`216`
`200`	`217`	`def__reduce__(self):`
`201`		`-return (self.__class__, (self._name,self.__file__,self._import_structure))`
	`218`	`+return (self.__class__, (self._name,self.__file__,self._import_structure))`

`‎src/layoutparser/models/__init__.py`

Lines changed: 2 additions & 1 deletion

Original file line number	Diff line number	Diff line change
`@@ -1,2 +1,3 @@`
`1`	`1`	`from .detectron2.layoutmodelimportDetectron2LayoutModel`
`2`		`-from .paddledetection.layoutmodelimportPaddleDetectionLayoutModel`
	`2`	`+from .paddledetection.layoutmodelimportPaddleDetectionLayoutModel`
	`3`	`+from .effdet.layoutmodelimportEfficientDetLayoutModel`

`‎src/layoutparser/models/base_layoutmodel.py`

Lines changed: 9 additions & 3 deletions

Original file line number	Diff line number	Diff line change
`@@ -1,17 +1,23 @@`
	`1`	`+fromtypingimportUnion`
`1`	`2`	`fromabcimportABC,abstractmethod`
`2`	`3`
`3`	`4`	`from ..file_utilsimportrequires_backends`
`4`	`5`
`5`	`6`
`6`	`7`	`classBaseLayoutModel(ABC):`
`7`		`-`
`8`	`8`	`@property`
`9`	`9`	`@abstractmethod`
`10`	`10`	`defDETECTOR_NAME(self):`
`11`	`11`	`pass`
`12`		`-`
	`12`	`+`
	`13`	`+@abstractmethod`
	`14`	`+defdetect(self,image):`
	`15`	`+pass`
	`16`	`+`
`13`	`17`	`@abstractmethod`
`14`		`-defdetect(self):`
	`18`	`+defimage_loader(self,image:Union["ndarray","Image"]):`
	`19`	`+"""It will process the input images appropriately to the target format.`
	`20`	`+ """`
`15`	`21`	`pass`
`16`	`22`
`17`	`23`	`# Add lazy loading mechanisms for layout models, refer to`

`‎src/layoutparser/models/detectron2/layoutmodel.py`

Lines changed: 10 additions & 5 deletions

Original file line number	Diff line number	Diff line change
`@@ -1,3 +1,4 @@`
	`1`	`+fromtypingimportUnion`
`1`	`2`	`fromPILimportImage`
`2`	`3`	`importnumpyasnp`
`3`	`4`
`@@ -41,7 +42,7 @@ class Detectron2LayoutModel(BaseLayoutModel):`
`41`	`42`
`42`	`43`	`Examples::`
`43`	`44`	`>>> import layoutparser as lp`
`44`		`- >>> model = lp.models.Detectron2LayoutModel('lp://HJDataset/faster_rcnn_R_50_FPN_3x/config')`
	`45`	`+ >>> model = lp.Detectron2LayoutModel('lp://HJDataset/faster_rcnn_R_50_FPN_3x/config')`
`45`	`46`	`>>> model.detect(image)`
`46`	`47`
`47`	`48`	`"""`
`@@ -108,7 +109,7 @@ def _reconstruct_path_with_detector_name(self, path: str) -> str:`
`108`	`109`	`model_name_segments=model_name.split("/")`
`109`	`110`	`if (`
`110`	`111`	`len(model_name_segments)==3`
`111`		`-and"detectron2"notinmodel_name_segments`
	`112`	`+andself.DETECTOR_NAMEnotinmodel_name_segments`
`112`	`113`	`):`
`113`	`114`	`return"lp://"+self.DETECTOR_NAME+"/"+path[len("lp://") :]`
`114`	`115`	`returnpath`
`@@ -148,12 +149,16 @@ def detect(self, image):`
`148`	`149`	:obj:`~layoutparser.Layout`: The detected layout of the input image
`149`	`150`	`"""`
`150`	`151`
	`152`	`+image=self.image_loader(image)`
	`153`	`+outputs=self.model(image)`
	`154`	`+layout=self.gather_output(outputs)`
	`155`	`+returnlayout`
	`156`	`+`
	`157`	`+defimage_loader(self,image:Union["np.ndarray","Image.Image"]):`
`151`	`158`	`# Convert PIL Image Input`
`152`	`159`	`ifisinstance(image,Image.Image):`
`153`	`160`	`ifimage.mode!="RGB":`
`154`	`161`	`image=image.convert("RGB")`
`155`	`162`	`image=np.array(image)`
`156`	`163`
`157`		`-outputs=self.model(image)`
`158`		`-layout=self.gather_output(outputs)`
`159`		`-returnlayout`
	`164`	`+returnimage`

`‎src/layoutparser/models/effdet/__init__.py`

Lines changed: 2 additions & 0 deletions

Original file line number	Diff line number	Diff line change
`@@ -0,0 +1,2 @@`
	`1`	`+from .importcatalogas_UNUSED`
	`2`	`+from .layoutmodelimportEfficientDetLayoutModel`

`‎src/layoutparser/models/effdet/catalog.py`

Lines changed: 53 additions & 0 deletions

Original file line number	Diff line number	Diff line change
`@@ -0,0 +1,53 @@`
	`1`	`+fromiopath.common.file_ioimportPathHandler`
	`2`	`+`
	`3`	`+from ..base_catalogimportPathManager`
	`4`	`+`
	`5`	`+MODEL_CATALOG= {`
	`6`	`+"PubLayNet": {`
	`7`	`+"tf_efficientdet_d0":"https://www.dropbox.com/s/ukbw5s673633hsw/publaynet-tf_efficientdet_d0.pth.tar?dl=1",`
	`8`	`+"tf_efficientdet_d1":"https://www.dropbox.com/s/gxy11xkkiwnpgog/publaynet-tf_efficientdet_d1.pth.tar?dl=1"`
	`9`	`+ },`
	`10`	`+"MFD": {`
	`11`	`+"tf_efficientdet_d0":"https://www.dropbox.com/s/dkr22iux7thlhel/mfd-tf_efficientdet_d0.pth.tar?dl=1",`
	`12`	`+"tf_efficientdet_d1":"https://www.dropbox.com/s/icmbiaqr5s9bz1x/mfd-tf_efficientdet_d1.pth.tar?dl=1"`
	`13`	`+ }`
	`14`	`+}`
	`15`	`+`
	`16`	`+# In effdet training scripts, it requires the label_map starting`
	`17`	`+# from 1 instead of 0`
	`18`	`+LABEL_MAP_CATALOG= {`
	`19`	`+"PubLayNet": {`
	`20`	`+1:"Text",`
	`21`	`+2:"Title",`
	`22`	`+3:"List",`
	`23`	`+4:"Table",`
	`24`	`+5:"Figure"`
	`25`	`+ }`
	`26`	`+}`
	`27`	`+`
	`28`	`+classLayoutParserEfficientDetModelHandler(PathHandler):`
	`29`	`+"""`
	`30`	`+ Resolve anything that's in LayoutParser model zoo.`
	`31`	`+ """`
	`32`	`+`
	`33`	`+PREFIX="lp://efficientdet/"`
	`34`	`+`
	`35`	`+def_get_supported_prefixes(self):`
	`36`	`+return [self.PREFIX]`
	`37`	`+`
	`38`	`+def_get_local_path(self,path,**kwargs):`
	`39`	`+model_name=path[len(self.PREFIX) :]`
	`40`	`+`
	`41`	`+dataset_name,*model_name,data_type=model_name.split("/")`
	`42`	`+`
	`43`	`+ifdata_type=="weight":`
	`44`	`+model_url=MODEL_CATALOG[dataset_name]["/".join(model_name)]`
	`45`	`+else:`
	`46`	`+raiseValueError(f"Unknown data_type{data_type}")`
	`47`	`+returnPathManager.get_local_path(model_url,**kwargs)`
	`48`	`+`
	`49`	`+def_open(self,path,mode="r",**kwargs):`
	`50`	`+returnPathManager.open(self._get_local_path(path),mode,**kwargs)`
	`51`	`+`
	`52`	`+`
	`53`	`+PathManager.register_handler(LayoutParserEfficientDetModelHandler())`

0 commit comments

Comments

(0)

Movatterモバイル変換

Navigation Menu

Search code, repositories, users, issues, pull requests...

Provide feedback

Saved searches

Use saved searches to filter your results more quickly

Uh oh!

Commit b4b4fea

File tree

12 files changed

12 files changed

`‎dev-requirements.txt`

`‎setup.py`

`‎src/layoutparser/__init__.py`

`‎src/layoutparser/file_utils.py`

`‎src/layoutparser/models/__init__.py`

`‎src/layoutparser/models/base_layoutmodel.py`

`‎src/layoutparser/models/detectron2/layoutmodel.py`

`‎src/layoutparser/models/effdet/__init__.py`

`‎src/layoutparser/models/effdet/catalog.py`

0 commit comments