Ashwin V. Mohanan committed
Commit 97ba84c · 1 Parent(s): 9714711

Digitize and visualize

app/assets/jinja-templates/image.j2 ADDED
@@ -0,0 +1,9 @@
+<svg viewBox="0 0 {{ page.width }} {{ page.height }}" xmlns="http://www.w3.org/2000/svg">
+    <image height="{{ page.height }}" width="{{ page.width }}" href="/gradio_api/file={{ page.path }}" />
+    {%- for line in page.cells -%}
+    <a class="cellline line{{loop.index}} highlighted" onmouseover="document.querySelectorAll('.line{{loop.index}}').forEach(element => {element.classList.remove('highlighted')});" onmouseout="document.querySelectorAll('.line{{loop.index}}').forEach(element => {element.classList.add('highlighted')});">
+        <polygon id="{{ loop.index }}" points="{% for point in line.polygon %}{{ point|join(',') }}{% if not loop.last %} {% endif %}{% endfor %}"/>
+        <text class="celltext" x="{{ line.text_x }}" y="{{ line.text_y }}">{{ line.text }}</text>
+    </a>
+    {% endfor %}
+</svg>
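A note on how this template is consumed: render_image in app/tabs/visualizer.py (added further down in this commit) renders it with a Page whose cells carry closed polygons and label positions. Below is a minimal sketch, not part of the commit, using stand-in objects instead of the app's real Page/TableCell types; it assumes it is run from the repository root so the template path resolves. The /gradio_api/file= href on the embedded image appears to be why main.py below adds allowed_paths to demo.launch.

# Minimal sketch (not part of the commit): render image.j2 with stand-in objects.
from types import SimpleNamespace

from jinja2 import Environment, FileSystemLoader

env = Environment(loader=FileSystemLoader("app/assets/jinja-templates"))
template = env.get_template("image.j2")

cell = SimpleNamespace(
    polygon=[(10, 10), (110, 10), (110, 60), (10, 60), (10, 10)],  # closed ring
    text_x=10,
    text_y=10,
    text="12.3",
)
page = SimpleNamespace(width=1000, height=800, cells=[cell], path="pages/0.webp")

# Produces an <svg> string with one <polygon> + <text> pair per cell,
# which the app hands to a gr.HTML component.
print(template.render(page=page))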
app/gradio_config.py CHANGED
@@ -34,17 +34,29 @@ css = """
     overflow: visible;
 }
 
-/* style of textline svg elements */
-.textline {
+/* style of table cell svg elements */
+.cellline {
     fill: transparent;
     stroke: blue;
     stroke-width: 10;
     stroke-opacity: 0.2;
 }
 
+svg > a > text {
+    fill: transparent;
+    stroke: transparent;
+}
+
+svg > a.highlighted > text {
+    fill: white;
+    stroke: transparent;
+    font-size: large;
+}
+
 .highlighted polygon {
     fill:blue;
-    fill-opacity: 0.2;
+    fill-opacity: 0.7;
+    stroke: black;
 }
 
 span.highlighted {
app/main.py CHANGED
@@ -2,6 +2,7 @@ import logging
 import os
 
 import gradio as gr
+
 # from htrflow.models.huggingface.trocr import TrOCR
 
 from app.gradio_config import css, theme
@@ -10,8 +11,8 @@ from app.gradio_config import css, theme
 # from app.tabs.export import export
 from app.tabs.submit import collection_submit_state, submit
 
-# from app.tabs.visualizer import collection as collection_viz_state
-# from app.tabs.visualizer import visualizer
+from app.tabs.visualizer import collection as collection_viz_state
+from app.tabs.visualizer import visualizer
 
 # Suppress transformers logging
 logging.getLogger("transformers").setLevel(logging.ERROR)
@@ -54,8 +55,8 @@ with gr.Blocks(title="Dawsonia Demo", theme=theme, css=css, head=html_header) as
         with gr.Tab(label="Upload") as tab_submit:
             submit.render()
 
-        # with gr.Tab(label="Result", interactive=False, id="result") as tab_visualizer:
-        #     visualizer.render()
+        with gr.Tab(label="Result", interactive=False, id="result") as tab_visualizer:
+            visualizer.render()
         #
         # with gr.Tab(label="Export", interactive=False) as tab_export:
         #     export.render()
@@ -69,17 +70,17 @@ with gr.Blocks(title="Dawsonia Demo", theme=theme, css=css, head=html_header) as
             state_value = input_value
         return state_value if state_value is not None else gr.skip()
 
-    # collection_submit_state.change(
-    #     activate_tab, collection_submit_state, tab_visualizer
-    # )
+    collection_submit_state.change(
+        activate_tab, collection_submit_state, tab_visualizer
+    )
     # collection_submit_state.change(activate_tab, collection_submit_state, tab_export)
     collection_submit_state.change(lambda: gr.Tabs(selected="result"), outputs=navbar)
 
-    # tab_visualizer.select(
-    #     inputs=[collection_submit_state, collection_viz_state],
-    #     outputs=[collection_viz_state],
-    #     fn=sync_gradio_object_state,
-    # )
+    tab_visualizer.select(
+        inputs=[collection_submit_state, collection_viz_state],
+        outputs=[collection_viz_state],
+        fn=sync_gradio_object_state,
+    )
     #
     # tab_export.select(
    #     inputs=[collection_submit_state, collection_export_state],
@@ -91,5 +92,9 @@ demo.queue()
 
 if __name__ == "__main__":
     demo.launch(
-        server_name="0.0.0.0", server_port=7860, enable_monitoring=True, show_api=False
+        server_name="0.0.0.0",
+        server_port=7860,
+        enable_monitoring=True,
+        show_api=False,
+        allowed_paths=[".gradio_cache/output"],
     )
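The re-enabled wiring follows the usual Gradio pattern of unlocking a disabled Tab once a State receives data. Below is a self-contained sketch of that pattern only; the component names and the activate_tab body are illustrative, not copied from the app.

# Sketch of the tab-activation pattern used above (illustrative names,
# not the app's actual main.py): a disabled Tab becomes interactive
# once a State holds a result.
import gradio as gr


def activate_tab(value):
    # Enable the tab only when the state carries data
    return gr.Tab(interactive=value is not None)


with gr.Blocks() as demo:
    result_state = gr.State()

    with gr.Tabs():
        with gr.Tab(label="Upload"):
            run = gr.Button("Pretend a run finished")
        with gr.Tab(label="Result", interactive=False) as tab_result:
            gr.Markdown("Results appear here once something is digitized.")

    run.click(lambda: {"pages": 1}, outputs=result_state)
    result_state.change(activate_tab, result_state, tab_result)

if __name__ == "__main__":
    demo.launch()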
app/tabs/submit.py CHANGED
@@ -3,6 +3,7 @@ import logging
 import os
 from pathlib import Path
 import time
+import warnings
 
 from PIL import Image
 from dawsonia import io
@@ -26,7 +27,7 @@ MAX_IMAGES = int(os.environ.get("MAX_IMAGES", 5))
 # Setup the cache directory to point to the directory where the example images
 # are located. The images must lay in the cache directory because otherwise they
 # have to be reuploaded when drag-and-dropped to the input image widget.
-GRADIO_CACHE = ".gradio_cache"
+GRADIO_CACHE = os.getenv("GRADIO_CACHE_DIR", ".gradio_cache")
 DATA_CACHE = os.path.join(GRADIO_CACHE, "data")
 EXAMPLES_DIRECTORY = os.path.join(os.getcwd(), "examples")
 
@@ -38,17 +39,13 @@ PIPELINES: dict[str, dict[str, str]] = {
     )
 }
 
-if os.environ.get("GRADIO_CACHE_DIR", GRADIO_CACHE) != GRADIO_CACHE:
-    os.environ["GRADIO_CACHE_DIR"] = GRADIO_CACHE
-    logger.warning("Setting GRADIO_CACHE_DIR to '%s' (overriding a previous value).")
-
 
 def run_dawsonia(
-    table_fmt_config_override, first_page, last_page, book, progress=gr.Progress()
+    table_fmt_config_override, first_page, last_page, book, gallery, progress=gr.Progress()
 ):
     if book is None:
         raise ValueError("You need to select / upload the pages to digitize")
-
+
     progress(0, desc="Dawsonia: starting")
 
     model_path = Path("data/models/dawsonia/2024-07-02")
@@ -70,59 +67,70 @@ def run_dawsonia(
     ]
 
     collection = []
+    images = []
+
+    with warnings.catch_warnings():
+        warnings.simplefilter("ignore", FutureWarning)
+        for page_number, im_from_gallery in zip(range(first_page, last_page), gallery):
+            output_path_page = output_path_book / str(page_number)
+            gr.Info(f"Digitizing {page_number = }")
+
+            if not (output_path_book / str(page_number)).with_suffix(".parquet").exists():
+                digitize.digitize_page_and_write_output(
+                    book,
+                    init_data,
+                    page_number=page_number,
+                    date_str=f"0000-page-{page_number}",
+                    model_path=model_path,
+                    model_predict=ml.model_predict,
+                    prob_thresh=0.5,
+                    output_path_page=output_path_page,
+                    output_text_fmt=False,
+                    debug=False,
+                )
+            progress_value = (page_number - first_page) / max(1, last_page - first_page)
 
-    for page_number in range(first_page, last_page):
-        output_path_page = output_path_book / str(page_number)
-        gr.Info(f"Digitizing {page_number = }")
-
-        *_, stats = digitize.digitize_page_and_write_output(
-            book,
-            init_data,
-            page_number=page_number,
-            date_str=f"0000-page-{page_number}",
-            model_path=model_path,
-            model_predict=ml.model_predict,
-            prob_thresh=0.5,
-            output_path_page=output_path_page,
-            output_text_fmt=False,
-            debug=False,
-        )
-        progress_value = (page_number - first_page) / max(1, last_page - first_page)
-        progress(progress_value, desc=f"Dawsonia: {stats!s:.50}")
+            page, im = read_page(output_path_book, str(page_number), progress, progress_value)  # , im_from_gallery[0])
+            collection.append(page)
+            images.append(im)
 
-        collection.append(read_page(stats, output_path_book, str(page_number)))
 
     gr.Info("Pages were succesfully digitized ✨")
 
+    # yield collection, images
     yield collection, gr.skip()
 
 
-def read_page(stats: digitize.Statistics, output_path_book: Path, prefix: str):
+def read_page(output_path_book: Path, prefix: str, progress, progress_value, im_path_from_gallery: str = ""):
+    stats = digitize.Statistics.from_json((output_path_book / "statistics" / prefix).with_suffix(".json"))
+    print(stats)
+    progress(progress_value, desc=f"Dawsonia: {stats!s:.50}")
     if stats.tables_detected > 0:
         values_df = pd.read_parquet((output_path_book / prefix).with_suffix(".parquet"))
        table_meta = json.loads(
            (output_path_book / "table_meta" / prefix).with_suffix(".json").read_text()
        )
        with Image.open(
-            (output_path_book / "pages" / prefix).with_suffix(".webp")
+            image_path:=(output_path_book / "pages" / prefix).with_suffix(".webp")
        ) as im:
            width = im.width
            height = im.height
 
        values_array = values_df.values.flatten()
-        bbox_array = np.array(table_meta["table_positions"]).reshape(
-            values_array.size, 4
+        bbox_array = np.hstack(table_meta["table_positions"]).reshape(
+            -1, 4
        )
        cells = [
            make_cell(value, bbox) for value, bbox in zip(values_array, bbox_array)
        ]
-        return Page(width, height, cells)
+        return Page(width, height, cells, im_path_from_gallery or str(image_path)), im
 
 
 def make_cell(value: str, bbox: NDArray[np.int64]):
-    x, y, w, h = bbox
-    xmax, ymax = x+w, y+h
-    polygon = (x,y), (xmax, y), (xmax, ymax), (x, ymax), (x,y)
+    y, x, h, w = bbox
+    xmin, ymin = x-w//2, y-h//2
+    xmax, ymax = x+w//2, y+h//2
+    polygon = (xmin,ymin), (xmax, ymin), (xmax, ymax), (xmin, ymax), (xmin,ymin)
     return TableCell(polygon, text_x=x, text_y=y, text=value)
@@ -229,11 +237,12 @@ with gr.Blocks() as submit:
         if len(images) > MAX_IMAGES:
             gr.Warning(f"Maximum images you can upload is set to: {MAX_IMAGES}")
             return gr.update(value=None)
+
         return images
-
+
     run_button.click(
         fn=run_dawsonia,
-        inputs=(table_fmt_config_override, first_page, last_page, batch_book_state),
+        inputs=(table_fmt_config_override, first_page, last_page, batch_book_state, batch_image_gallery),
         outputs=(collection_submit_state, batch_image_gallery),
     )
     edit_table_fmt_button.click(lambda: Modal(visible=True), None, edit_table_fmt_modal)
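The rewritten make_cell reads the bounding box as a centre-based (y, x, h, w) tuple instead of the previous corner-based (x, y, w, h), and closes the polygon ring that image.j2 expects. The following standalone sketch of that geometry uses illustrative values (not data from the commit); integer division keeps the SVG coordinates integral.

# Sketch of the new bbox -> polygon conversion in make_cell: the box is
# interpreted as centre-based (y, x, h, w) and turned into a closed
# five-point ring, as the SVG template expects.
def bbox_to_polygon(bbox):
    y, x, h, w = bbox
    xmin, ymin = x - w // 2, y - h // 2
    xmax, ymax = x + w // 2, y + h // 2
    return (xmin, ymin), (xmax, ymin), (xmax, ymax), (xmin, ymax), (xmin, ymin)


# A cell centred at x=400, y=120 that is 80 wide and 40 tall:
print(bbox_to_polygon((120, 400, 40, 80)))
# ((360, 100), (440, 100), (440, 140), (360, 140), (360, 100))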
app/tabs/visualizer.py ADDED
@@ -0,0 +1,67 @@
+import gradio as gr
+from jinja2 import Environment, FileSystemLoader
+
+_ENV = Environment(loader=FileSystemLoader("app/assets/jinja-templates"))
+_IMAGE_TEMPLATE = _ENV.get_template("image.j2")
+
+from typing import NamedTuple
+from dawsonia.typing import BBoxTuple
+
+
+class TableCell(NamedTuple):
+    polygon: tuple[tuple[int, int], ...]
+    text_x: int
+    text_y: int
+    text: str
+
+
+class Page(NamedTuple):
+    width: int
+    height: int
+    cells: list[TableCell]
+    path: str
+
+
+def render_image(collection: list[Page], current_page_index: int) -> str:
+    return _IMAGE_TEMPLATE.render(
+        page=collection[current_page_index],
+    )
+
+
+with gr.Blocks() as visualizer:
+    gr.Markdown("# Result")
+    gr.Markdown(
+        "The image to the below shows where Dawsonia found text in the image."
+    )
+
+    with gr.Row():
+        # Annotated image panel
+        with gr.Column(scale=2):
+            image = gr.HTML(
+                label="Annotated image",
+                padding=False,
+                elem_classes="svg-image",
+                container=True,
+                max_height="65vh",
+                min_height="65vh",
+                show_label=True,
+            )
+
+            image_caption = gr.Markdown(elem_classes="button-group-viz")
+            with gr.Row(elem_classes="button-group-viz"):
+                left = gr.Button(
+                    "← Previous", visible=False, interactive=False, scale=0
+                )
+                right = gr.Button("Next →", visible=False, scale=0)
+
+    collection = gr.State()
+    current_page_index = gr.State(0)
+
+    # Updates on collection change:
+    # - update the view
+    # - reset the page index (always start on page 0)
+    # - toggle visibility of navigation buttons (don't show them for single pages)
+    # - update the image caption
+    collection.change(
+        render_image, inputs=[collection, current_page_index], outputs=image
+    )
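The left/right buttons are created but not wired in this commit; the sketch below is a hedged suggestion (not part of the change) of how current_page_index could drive them, reusing render_image above. The change_page helper is hypothetical.

# Hedged sketch, not part of this commit: clamped paging for the
# Previous/Next buttons defined above.
def change_page(collection, index, step):
    """Move the page index by `step`, clamped to the collection bounds."""
    if not collection:
        return 0
    return max(0, min(index + step, len(collection) - 1))

# The wiring would live inside the `with gr.Blocks() as visualizer:` block, e.g.:
#   left.click(lambda col, i: change_page(col, i, -1),
#              inputs=[collection, current_page_index], outputs=current_page_index)
#   right.click(lambda col, i: change_page(col, i, +1),
#               inputs=[collection, current_page_index], outputs=current_page_index)
#   current_page_index.change(render_image,
#                             inputs=[collection, current_page_index], outputs=image)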
examples/bjuröklubb.png ADDED