Spaces:

Riksarkivet
/

htr_demo

Running on T4

viklofg committed 7 days ago

Commit

c369c5b

1 Parent(s): 5a98ee7

Update result visualization

The result viewer renders the polygons as SVG elements instead of drawing
them onto the page. Each line's polygon and text are highlighted on hover.

Files changed (5) hide show

app/assets/jinja-templates/image +7 -0
app/assets/jinja-templates/transcription +10 -0
app/gradio_config.py +27 -0
app/main.py +4 -3
app/tabs/visualizer.py +23 -179

app/assets/jinja-templates/image ADDED Viewed

	@@ -0,0 +1,7 @@

+<svg viewBox="0 0 {{ page.width }} {{ page.height }}" xmlns="http://www.w3.org/2000/svg">
+    <image height="{{ page.height }}" width="{{ page.width }}" href="/gradio_api/file={{ page.path }}" />
+    {%- for line in lines -%}
+        <a class="textline line{{loop.index}}" onmouseover="document.querySelectorAll('.line{{loop.index}}').forEach(element => {element.classList.add('highlighted')});" onmouseout="document.querySelectorAll('*').forEach(element => {element.classList.remove('highlighted')});">
+        <polygon id="{{ loop.index }}" points="{% for point in line.polygon %}{{ point|join(',') }}{% if not loop.last %} {% endif %}{% endfor %}"/></a>
+    {% endfor %}
+</svg>

app/assets/jinja-templates/transcription ADDED Viewed

	@@ -0,0 +1,10 @@

+{%- for line in lines -%}
+<span
+    class="textline line{{loop.index}}"
+    onmouseover="document.querySelectorAll('.line{{loop.index}}').forEach(element => {element.classList.add('highlighted')});"
+    onmouseout="document.querySelectorAll('*').forEach(element => {element.classList.remove('highlighted')});"
+>
+    {{line.text}}
+</span>
+<br>
+{% endfor %}

app/gradio_config.py CHANGED Viewed

@@ -13,5 +13,32 @@ theme = gr.themes.Default(
 )
 css = """
 """

 )
 css = """
+.svg-image {
+  height: auto;
+  width: 100%;
+  margin: auto;
+}
+.transcription {
+  font-size: large;
+}
+/* style of textline svg elements */
+.textline {
+  fill: transparent;
+  stroke: blue;
+  stroke-width: 10;
+  stroke-opacity: 0.2;
+}
+.highlighted polygon {
+  fill:blue;
+  fill-opacity: 0.2;
+}
+span.highlighted {
+  background-color: rgba(0%, 0%, 100%, 0.2);
+  font-size: large;
+}
 """

app/main.py CHANGED Viewed

@@ -7,7 +7,8 @@ from app.tabs.submit import (
     custom_template_yaml,
     collection_submit_state,
 )
-from app.tabs.visualizer import visualizer, collection_viz_state, viz_image_gallery
 from app.tabs.templating import (
     templating_block,
     TEMPLATE_IMAGE_FOLDER,
@@ -75,7 +76,7 @@ with gr.Blocks(title="HTRflow", theme=theme, css=css, head=matomo) as demo:
         with gr.Tab(label="Submit Job") as tab_submit:
             submit.render()
-        with gr.Tab(label="Visualize Result") as tab_visualizer:
             visualizer.render()
     @demo.load()
@@ -129,7 +130,7 @@ demo.queue()
 if __name__ == "__main__":
     demo.launch(
         server_name="0.0.0.0",
-        server_port=7860,
         enable_monitoring=True,
         # show_error=True,
     )

     custom_template_yaml,
     collection_submit_state,
 )
+from app.tabs.visualizer import visualizer, collection_viz_state
 from app.tabs.templating import (
     templating_block,
     TEMPLATE_IMAGE_FOLDER,
         with gr.Tab(label="Submit Job") as tab_submit:
             submit.render()
+        with gr.Tab(label="Result") as tab_visualizer:
             visualizer.render()
     @demo.load()
 if __name__ == "__main__":
     demo.launch(
         server_name="0.0.0.0",
+        server_port=7862,
         enable_monitoring=True,
         # show_error=True,
     )

app/tabs/visualizer.py CHANGED Viewed

@@ -1,193 +1,37 @@
 import gradio as gr
-import pandas as pd
-import numpy as np
-import time
-from collections import defaultdict
-from typing import List, Dict, Any
-from htrflow.volume.volume import Collection, ImageNode, PageNode
-from htrflow.utils.draw import draw_polygons
-from htrflow.utils import imgproc
-from htrflow.results import Segment
-def load_visualize_state_from_submit(col: Collection, progress):
-    results = []
-    total_steps = len(col.pages)
-    for page_idx, page_node in enumerate(col):
-        page_node.to_original_size()
-        page_image = page_node.image.copy()
-        progress((page_idx + 1) / total_steps, desc="Running Visualizer")
-        line_polygons = []
-        line_crops = []
-        recog_conf_values = {}
-        for i, node in enumerate(page_node.traverse(filter=lambda n: n.is_line())):
-            if node.polygon:
-                line_polygons.append(node.polygon)
-            try:
-                cropped_line_img = imgproc.crop(page_image, node.bbox)
-                cropped_line_img = np.clip(cropped_line_img, 0, 255).astype(np.uint8)
-                line_crops.append(cropped_line_img)
-            except Exception:
-                continue
-            if node.text_result:
-                recog_conf_values[i] = list(
-                    zip(node.text_result.texts, node.text_result.scores)
-                )
-        annotated_image = draw_polygons(image=page_image, polygons=line_polygons)
-        annotated_page_node = np.clip(annotated_image, 0, 255).astype(np.uint8)
-        results.append(
-            {
-                "page_image": page_node,
-                "annotated_page_node": annotated_page_node,
-                "line_crops": line_crops,
-                "recog_conf_values": _convert_conf_values_to_df(recog_conf_values),
-            }
-        )
-    return results
-def _convert_conf_values_to_df(
-    conf_values: Dict[int, List[tuple[str, float]]]
-) -> pd.DataFrame:
-    """Convert recognition confidence values to a pandas DataFrame."""
-    return pd.DataFrame(
-        [
-            {"Transcription": text, "Confidence Score": f"{score:.4f}"}
-            for values in conf_values.values()
-            for text, score in values
-        ]
-    )
 with gr.Blocks() as visualizer:
-    with gr.Column(variant="panel"):
-        with gr.Row():
-            collection_viz_state = gr.State()
-            result_collection_viz_state = gr.State()
-            with gr.Column():
-                viz_image_gallery = gr.Gallery(
-                    file_types=["image"],
-                    label="Visualized Images from HTRflow",
-                    interactive=False,
-                    height=600,
-                    object_fit="cover",
-                    columns=5,
-                    preview=True,
-                )
-                visualize_button = gr.Button(
-                    "Visualize", scale=0, min_width=200, variant="primary"
-                )
-                progress_bar = gr.Textbox(visible=False, show_label=False)
-            with gr.Column():
-                cropped_image_gallery = gr.Gallery(
-                    interactive=False,
-                    preview=True,
-                    label="Cropped Polygons",
-                    height=200,
-                )
-                df_for_cropped_images = gr.Dataframe(
-                    label="Cropped Transcriptions",
-                    headers=["Transcription", "Confidence Score"],
-                    interactive=False,
-                )
-    def on_visualize_button_clicked(collection_viz, progress=gr.Progress()):
-        """
-        This function:
-        - Receives the collection (collection_viz).
-        - Processes it into 'results' (list of dicts with annotated_page_node, line_crops, dataframe).
-        - Returns:
-            1) 'results' as state
-            2) List of annotated_page_node images (one per page) to populate viz_image_gallery
-        """
-        if not collection_viz:
-            return None, []
-        results = load_visualize_state_from_submit(collection_viz, progress)
-        annotated_images = [r["annotated_page_node"] for r in results]
-        return results, annotated_images, gr.skip()
-    visualize_button.click(lambda: gr.update(visible=True), outputs=progress_bar).then(
-        fn=on_visualize_button_clicked,
-        inputs=collection_viz_state,
-        outputs=[result_collection_viz_state, viz_image_gallery, progress_bar],
-    ).then(lambda: gr.update(visible=False), outputs=progress_bar)
-    @viz_image_gallery.change(
-        inputs=result_collection_viz_state,
-        outputs=[cropped_image_gallery, df_for_cropped_images],
-    )
-    def update_c_gallery_and_dataframe(results):
-        selected = results[0]
-        return selected["line_crops"], selected["recog_conf_values"]
-    @viz_image_gallery.select(
-        inputs=result_collection_viz_state,
-        outputs=[cropped_image_gallery, df_for_cropped_images],
-    )
-    def on_dataframe_select(evt: gr.SelectData, results):
-        """
-        evt.index => the index of the selected image in the gallery
-        results => the state object from result_collection_viz_state
-        Return the line crops and the recognized text for that index.
-        """
-        if results is None or evt.index is None:
-            return [], pd.DataFrame(columns=["Transcription", "Confidence Score"])
-        idx = evt.index
-        selected = results[idx]
-        return selected["line_crops"], selected["recog_conf_values"]
-    @df_for_cropped_images.select(
-        outputs=[cropped_image_gallery],
-    )
-    def on_dataframe_select(evt: gr.SelectData):
-        return gr.update(selected_index=evt.index[0])
-    @cropped_image_gallery.select(
-        inputs=df_for_cropped_images, outputs=df_for_cropped_images
-    )
-    def return_image_from_gallery(df, evt: gr.SelectData):
-        selected_index = evt.index
-        def highlight_row(row):
-            return [
-                (
-                    "border: 1px solid blue; font-weight: bold"
-                    if row.name == selected_index
-                    else ""
-                )
-                for _ in row
-            ]
-        styler = df.style.apply(highlight_row, axis=1)
-        return styler
-# TODO: if state is empty from submit? dont show visualize button...
-# TODO: Add reading order in dataframe
-# TODO: Add reading order in visualization to the left
-# TODO: be able to click on mask on the left?
-# TODO: Show how to clone and setup pylaia? Which would probably be a seperate docker container!
-# TODO: fix api! and client... Notebook for api?

 import gradio as gr
+from jinja2 import Environment, FileSystemLoader
+_ENV = Environment(loader=FileSystemLoader("app/assets/jinja-templates"))
+_IMAGE_TEMPLATE = _ENV.get_template("image")
+_TRANSCRIPTION_TEMPLATE = _ENV.get_template("transcription")
+def render_image(state):
+    return _IMAGE_TEMPLATE.render(page=state[0], lines=state[0].traverse(lambda node: node.is_line()))
+def render_transcription(state):
+    return _TRANSCRIPTION_TEMPLATE.render(lines=state[0].traverse(lambda node: node.is_line()))
 with gr.Blocks() as visualizer:
+    with gr.Row():
+        # Columns are needed here to get the scale right. The documentation
+        # claims all components have the `scale` argument but it doesn't
+        # seem to work for HTML components.
+        # Transcription panel
+        with gr.Column(scale=1):
+            gr.Markdown("## Transcription")
+            transcription = gr.HTML(elem_classes="transcription", container=True, max_height="60vh")
+        # Annotated image panel
+        with gr.Column(scale=2):
+            gr.Markdown("## Annotated image")
+            image = gr.HTML(padding=False, elem_classes="svg-image", container=True)
+    collection_viz_state = gr.State()
+    collection_viz_state.change(render_image, inputs=collection_viz_state, outputs=image)
+    collection_viz_state.change(render_transcription, inputs=collection_viz_state, outputs=transcription)