feat: add rotation in demo

mindee · charlesmindee · Mar 22, 2022 · Mar 16, 2022 · Mar 16, 2022 · Mar 16, 2022
commit bbdcce3916f241d39487b65b5ee3682a758cdc7d
diff --git a/demo/app.py b/demo/app.py
@@ -73,7 +73,10 @@ def main():
 
         else:
             with st.spinner('Loading model...'):
-                predictor = ocr_predictor(det_arch, reco_arch, pretrained=True)
+                predictor = ocr_predictor(
+                    det_arch, reco_arch, pretrained=True,
+                    assume_straight_pages=(det_arch != "linknet_resnet18_rotation")
+                )
 
             with st.spinner('Analyzing...'):
 
@@ -97,8 +100,9 @@ def main():
 
                 # Page reconsitution under input page
                 page_export = out.pages[0].export()
-                img = out.pages[0].synthesize()
-                cols[3].image(img, clamp=True)
+                if det_arch != "linknet_resnet18_rotation":
+                    img = out.pages[0].synthesize()
+                    cols[3].image(img, clamp=True)
 
                 # Display JSON
                 st.markdown("\nHere are your analysis results in JSON format:")

diff --git a/doctr/utils/visualization.py b/doctr/utils/visualization.py
@@ -219,13 +219,16 @@ def visualize_page(
                             int(page['dimensions'][1] * word['geometry'][0][0]),
                             int(page['dimensions'][0] * word['geometry'][0][1])
                         )
-                    ax.text(
-                        *text_loc,
-                        word['value'],
-                        size=10,
-                        alpha=0.5,
-                        color=(0, 0, 1),
-                    )
+
+                    if len(word['geometry']) == 2:
+                        # Only draw the word text for straight boxes (2-point geometry)
+                        ax.text(
+                            *text_loc,
+                            word['value'],
+                            size=10,
+                            alpha=0.5,
+                            color=(0, 0, 1),
+                        )
 
         if display_artefacts:
             for artefact in block['artefacts']:
@@ -252,7 +255,6 @@ def visualize_page(
 def synthesize_page(
     page: Dict[str, Any],
     draw_proba: bool = False,
-    font_size: int = 13,
     font_family: Optional[str] = None,
 ) -> np.ndarray:
     """Draw a the content of the element page (OCR response) on a blank page.