Fix the mypy errors; draw cell text directly on the base image instead of an overlay

Signed-off-by: Peter Staar <[email protected]>
DS4SD · PeterStaar-IBM · Dec 7, 2024 · Nov 13, 2024 · Nov 14, 2024 · Nov 14, 2024
commit 1df160632eb73b531f4cf08ebcc781564a6912f3
diff --git a/docling_parse/utils.py b/docling_parse/utils.py
@@ -1,18 +1,19 @@
 import json
 import logging
-from typing import Dict, List, Optional, Tuple
+from typing import Dict, List, Optional, Tuple, Union
 
 from PIL import Image, ImageColor, ImageDraw, ImageFont
+from PIL.ImageFont import FreeTypeFont
 
 
 def _draw_text_in_bounding_bbox(
-    img,
-    draw: ImageDraw.Draw,
+    img: Image.Image,
+    draw: ImageDraw.ImageDraw,
     bbox: Tuple[float, float, float, float],
     text: str,
-    font: Optional[ImageFont.ImageFont] = None,
+    font: Optional[Union[FreeTypeFont, ImageFont.ImageFont]] = None,
     fill: str = "black",
-):
+) -> ImageDraw.ImageDraw:
     """
     Draws text inside a bounding box by creating a temporary image,
     resizing it, and pasting it into the original image at bbox.
@@ -75,7 +76,7 @@ def _draw_text_in_bounding_bbox(
 
     # Paste the resized text image onto the original image
     # draw.bitmap((paste_x, paste_y), resized_img)#, fill=None)
-    img.paste((paste_x, paste_y), "black", resized_img)  # , fill=None)
+    img.paste((paste_x, paste_y), resized_img)  # , "black")  # , fill=None)
 
     # draw.text((50, 50), text, font=font, fill=(0,0,0,255))
 
@@ -340,30 +341,18 @@ def _draw_annotations(
     """
     # Create a blank white image with RGBA mode
     img = Image.new("RGBA", (round(W), round(H)), (255, 255, 255, 255))
+    draw = ImageDraw.Draw(img)
+    """
     overlay = Image.new(
         "RGBA", (round(W), round(H)), (255, 255, 255, 0)
     )  # Transparent overlay
     draw = ImageDraw.Draw(overlay)
+    """
 
     # Draw each rectangle by connecting its four points
     if draw_images:
         for row in images:
 
-            """
-            x0 = row[images_header.index("x0")]
-            y0 = row[images_header.index("y0")]
-            x1 = row[images_header.index("x1")]
-            y1 = row[images_header.index("y1")]
-
-            # Define the four corners of the rectangle
-            bl = (x0, H - y0)
-            br = (x1, H - y0)
-            tr = (x1, H - y1)
-            tl = (x0, H - y1)
-
-            # Draw the rectangle as a polygon
-            draw.polygon([bl, br, tr, tl], outline="green", fill="yellow")
-            """
             bbox = [
                 row[images_header.index("x0")],
                 row[images_header.index("y0")],
@@ -409,19 +398,14 @@ def _draw_annotations(
                     alpha=cell_alpha,
                 )
 
-            """
-            if "glyph" in row[cells_header.index("text")]:
-                logging.info(f" skip cell -> {row}")
-                continue
-            """
-
             # Fixme: the _draw_text_in_bounding_bbox is not yet working
             text = row[cells_header.index(f"text")]
-            if False and draw_cells_text and len(text) > 0:
+            if draw_cells_text and len(text) > 0:
                 draw = _draw_text_in_bounding_bbox(
-                    overlay,
+                    # overlay,
+                    img,
                     draw,
-                    bbox=[rect[0][0], rect[0][1], rect[2][0], rect[2][1]],
+                    bbox=(rect[0][0], rect[0][1], rect[2][0], rect[2][1]),
                     text=text,
                 )
 
@@ -532,6 +516,6 @@ def _draw_annotations(
         draw.polygon([bl, br, tr, tl], outline=outl_color, width=cropbox_width)
 
     # Composite the overlay with the base image
-    img = Image.alpha_composite(img, overlay)
+    # img = Image.alpha_composite(img, overlay)
 
     return img
diff --git a/docling_parse/visualize.py b/docling_parse/visualize.py
@@ -4,7 +4,7 @@
 import os
 from typing import Dict, Optional
 
-from docling_parse.pdf_parsers import (  # type: ignore[attr-defined]
+from docling_parse.pdf_parsers import (  # type: ignore[import]
     pdf_parser_v1,
     pdf_parser_v2,
 )
@@ -333,14 +333,17 @@ def visualise_v2(
 
         for category in categories:
 
-            img_orig = create_pil_image_of_page_v2(page, category=category)
+            img = create_pil_image_of_page_v2(
+                page, category=category, draw_cells_text=display_text
+            )
 
             if interactive:
-                img_orig.show()
+                img.show()
 
             if output_dir is not None and page_num == -1:
                 oname = os.path.join(
-                    output_dir, f"{os.path.basename(pdf_path)}_page={pi}.v2.{_}.png"
+                    output_dir,
+                    f"{os.path.basename(pdf_path)}_page={pi}.v2.{category}.png",
                 )
                 logging.info(f"output: {oname}")
 
@@ -349,7 +352,7 @@ def visualise_v2(
             elif output_dir is not None and page_num != -1:
                 oname = os.path.join(
                     output_dir,
-                    f"{os.path.basename(pdf_path)}_page={page_num}.v2.{_}.png",
+                    f"{os.path.basename(pdf_path)}_page={pi}.v2.{category}.png",
                 )
                 logging.info(f"output: {oname}")
 

diff --git a/pyproject.toml b/pyproject.toml
@@ -109,6 +109,9 @@ show_error_codes = true
 python_version = "3.9"
 # plugins = ["pydantic.mypy"]
 
+#[mypy-docling_parse.*]
+#ignore_missing_imports = True
+
 [[tool.mypy.overrides]]
 module = [
     "tabulate.*",

diff --git a/tests/test_parse_v1.py b/tests/test_parse_v1.py
@@ -12,7 +12,7 @@
 import json
 import os
 
-from docling_parse.pdf_parsers import pdf_parser_v1  # type: ignore[attr-defined]
+from docling_parse.pdf_parsers import pdf_parser_v1  # type: ignore[import]
 
 
 def verify_reference_output(true_doc, pred_doc):

diff --git a/tests/test_parse_v2.py b/tests/test_parse_v2.py
@@ -13,7 +13,7 @@
 import json
 import os
 
-from docling_parse.pdf_parsers import pdf_parser_v2  # type: ignore[attr-defined]
+from docling_parse.pdf_parsers import pdf_parser_v2  # type: ignore[import]
 from docling_parse.utils import create_pil_image_of_page_v2