Add the model for the NewspaperNavigator Dataset

lolipopshock · lolipopshock · commit ff6bdff612d2 · 2020-11-29T12:54:26.000-05:00
diff --git a/docs/notes/modelzoo.md b/docs/notes/modelzoo.md
@@ -25,6 +25,7 @@ model.detect(image)
 | [PubLayNet](https://github.com/ibm-aur-nlp/PubLayNet)        | [mask_rcnn_R_50_FPN_3x](https://www.dropbox.com/s/u9wbsfwz4y0ziki/config.yml?dl=1) | lp://PubLayNet/mask_rcnn_R_50_FPN_3x/config   |                                                              |
 | [PubLayNet](https://github.com/ibm-aur-nlp/PubLayNet)        | [mask_rcnn_X_101_32x8d_FPN_3x](https://www.dropbox.com/s/nau5ut6zgthunil/config.yaml?dl=1) | lp://PubLayNet/mask_rcnn_X_101_32x8d_FPN_3x/config | 88.98 [eval.csv](https://www.dropbox.com/s/15ytg3fzmc6l59x/eval.csv?dl=0) |
 | [PrimaLayout](https://www.primaresearch.org/dataset/)        | [mask_rcnn_R_50_FPN_3x](https://www.dropbox.com/s/yc92x97k50abynt/config.yaml?dl=1) | lp://PrimaLayout/mask_rcnn_R_50_FPN_3x/config | 69.35 [eval.csv](https://www.dropbox.com/s/9uuql57uedvb9mo/eval.csv?dl=0) |
+| [NewspaperNavigator](https://news-navigator.labs.loc.gov/)       | [faster_rcnn_R_50_FPN_3x](https://www.dropbox.com/s/wnido8pk4oubyzr/config.yml?dl=1) | lp://NewspaperNavigator/faster_rcnn_R_50_FPN_3x/config |                                                              |
 
 * For PubLayNet models, we suggest using the `mask_rcnn_X_101_32x8d_FPN_3x` model, as it is trained on the whole training set, while the others are trained only on the validation set (which is only around 1/50 the size of the training set). You can expect a 15% AP improvement when using the `mask_rcnn_X_101_32x8d_FPN_3x` model.
 
@@ -34,4 +35,5 @@ model.detect(image)
 | ------------------------------------------------------------ | ------------------------------------------------------------ |
 | [HJDataset](https://dell-research-harvard.github.io/HJDataset/) | `{1:"Page Frame", 2:"Row", 3:"Title Region", 4:"Text Region", 5:"Title", 6:"Subtitle", 7:"Other"}` |
 | [PubLayNet](https://github.com/ibm-aur-nlp/PubLayNet)        | `{0: "Text", 1: "Title", 2: "List", 3:"Table", 4:"Figure"}`     |
-| [PrimaLayout](https://www.primaresearch.org/dataset/)        | `{1:"TextRegion", 2:"ImageRegion", 3:"TableRegion", 4:"MathsRegion", 5:"SeparatorRegion", 6:"OtherRegion"}` |
+| [PrimaLayout](https://www.primaresearch.org/dataset/)        | `{1:"TextRegion", 2:"ImageRegion", 3:"TableRegion", 4:"MathsRegion", 5:"SeparatorRegion", 6:"OtherRegion"}` |
+| [NewspaperNavigator](https://news-navigator.labs.loc.gov/)        | `{0: "Photograph", 1: "Illustration", 2: "Map", 3: "Comics/Cartoon", 4: "Editorial Cartoon", 5: "Headline", 6: "Advertisement"}` |
diff --git a/src/layoutparser/models/catalog.py b/src/layoutparser/models/catalog.py
@@ -13,6 +13,9 @@
     },
     "PrimaLayout": {
         "mask_rcnn_R_50_FPN_3x": "https://www.dropbox.com/s/h7th27jfv19rxiy/model_final.pth?dl=1"
+    },
+    "NewspaperNavigator": {
+        'faster_rcnn_R_50_FPN_3x': 'https://www.dropbox.com/s/6ewh6g8rqt2ev3a/model_final.pth?dl=1',
     }
 }
 
@@ -29,6 +32,9 @@
     },
     "PrimaLayout": {
         "mask_rcnn_R_50_FPN_3x": "https://www.dropbox.com/s/yc92x97k50abynt/config.yaml?dl=1"
+    },
+    "NewspaperNavigator": {
+        'faster_rcnn_R_50_FPN_3x': 'https://www.dropbox.com/s/wnido8pk4oubyzr/config.yml?dl=1',
     }
 }
 
diff --git a/tests/test_model.py b/tests/test_model.py
@@ -9,6 +9,7 @@
         'lp://PubLayNet/faster_rcnn_R_50_FPN_3x/config',
         'lp://PubLayNet/mask_rcnn_R_50_FPN_3x/config',
         'lp://PubLayNet/mask_rcnn_X_101_32x8d_FPN_3x/config',
+        'lp://NewspaperNavigator/faster_rcnn_R_50_FPN_3x/config',
     ]
 
 

Original file line number	Diff line number	Diff line change
`@@ -13,6 +13,9 @@`
`13`	`13`	`},`
`14`	`14`	`"PrimaLayout": {`
`15`	`15`	`"mask_rcnn_R_50_FPN_3x": "https://www.dropbox.com/s/h7th27jfv19rxiy/model_final.pth?dl=1"`
	`16`	`+ },`
	`17`	`+ "NewspaperNavigator": {`
	`18`	`+ 'faster_rcnn_R_50_FPN_3x': 'https://www.dropbox.com/s/6ewh6g8rqt2ev3a/model_final.pth?dl=1',`
`16`	`19`	`}`
`17`	`20`	`}`
`18`	`21`
`@@ -29,6 +32,9 @@`
`29`	`32`	`},`
`30`	`33`	`"PrimaLayout": {`
`31`	`34`	`"mask_rcnn_R_50_FPN_3x": "https://www.dropbox.com/s/yc92x97k50abynt/config.yaml?dl=1"`
	`35`	`+ },`
	`36`	`+ "NewspaperNavigator": {`
	`37`	`+ 'faster_rcnn_R_50_FPN_3x': 'https://www.dropbox.com/s/wnido8pk4oubyzr/config.yml?dl=1',`
`32`	`38`	`}`
`33`	`39`	`}`
`34`	`40`
Original file line number	Diff line number	Diff line change
`@@ -9,6 +9,7 @@`
`9`	`9`	`'lp://PubLayNet/faster_rcnn_R_50_FPN_3x/config',`
`10`	`10`	`'lp://PubLayNet/mask_rcnn_R_50_FPN_3x/config',`
`11`	`11`	`'lp://PubLayNet/mask_rcnn_X_101_32x8d_FPN_3x/config',`
	`12`	`+ 'lp://NewspaperNavigator/faster_rcnn_R_50_FPN_3x/config',`
`12`	`13`	`]`
`13`	`14`
`14`	`15`