Spaces:

UniquePratham
/

DualTextOCRFusion

Running

UniquePratham committed on Sep 29

Commit

99c8074

•

1 Parent(s): 6cd9e3d

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -80,10 +80,14 @@ def polish_text_with_ai(cleaned_text):
     return polished_text
 # Extract text using GOT
 def extract_text_got(image_file, model, tokenizer):
     """Extract text from ``image_file`` by delegating to ``model.chat``.

     Calls ``model.chat(tokenizer, image_file, ocr_type='ocr')`` and returns
     whatever that call returns, unchanged. No error handling is done here,
     so any exception raised by ``model.chat`` propagates to the caller.
     """
     return model.chat(tokenizer, image_file, ocr_type='ocr')
 # Extract text using Qwen
 def extract_text_qwen(image_file, model, processor):
     try:
         image = Image.open(image_file).convert('RGB')
@@ -103,14 +107,14 @@ def extract_text_qwen(image_file, model, processor):
 # Function to highlight the keyword in the text
-def highlight_text(cleaned_text,start,end):
-    result = text_highlighter(
-    text=cleaned_text,
-    labels=[("KEYWORD", "#0000FF")],
-    annotations=[
-        {"start": start, "end": end, "tag": "KEYWORD"},
-    ],
-)
 # Title and UI
@@ -129,7 +133,8 @@ uploaded_file = st.sidebar.file_uploader(
 # Input from clipboard
 # Paste image button
-image_data = st.sidebar.paste(label="Paste From Clipboard", key="image_clipboard")
 if image_data is not None:
     clipboard_use = True
     header, encoded = image_data.split(",", 1)
@@ -217,6 +222,6 @@ if uploaded_file:
             len = search_query.length
             end = index + len
             if index != -1:
-                highlight_text(cleaned_text,start,end)
             else:
                 st.write("No Search Found.")

     return polished_text
 # Extract text using GOT
 def extract_text_got(image_file, model, tokenizer):
     """Extract text from ``image_file`` by delegating to ``model.chat``.

     Calls ``model.chat(tokenizer, image_file, ocr_type='ocr')`` and returns
     whatever that call returns, unchanged. No error handling is done here,
     so any exception raised by ``model.chat`` propagates to the caller.
     """
     return model.chat(tokenizer, image_file, ocr_type='ocr')
 # Extract text using Qwen
 def extract_text_qwen(image_file, model, processor):
     try:
         image = Image.open(image_file).convert('RGB')
 # Function to highlight the keyword in the text
+def highlight_text(cleaned_text, start, end):
+    """Pass ``cleaned_text`` to ``text_highlighter`` with one KEYWORD span.
+
+    A single label, ``"KEYWORD"`` with colour ``"#0000FF"``, is registered
+    and one annotation covering ``start``..``end`` is supplied with that tag.
+    The value returned by ``text_highlighter`` is discarded, so this function
+    implicitly returns ``None``.
+
+    NOTE(review): whether ``end`` is inclusive or exclusive is decided by
+    ``text_highlighter`` and is not visible here; confirm against its docs.
+    """
+    text_highlighter(
+        text=cleaned_text,
+        labels=[("KEYWORD", "#0000FF")],
+        annotations=[
+            {"start": start, "end": end, "tag": "KEYWORD"},
+        ],
+    )
 # Title and UI
 # Input from clipboard
 # Paste image button
+image_data = paste(
+    label="Paste From Clipboard", key="image_clipboard")
 if image_data is not None:
     clipboard_use = True
     header, encoded = image_data.split(",", 1)
             len = search_query.length
             end = index + len
             if index != -1:
+                highlight_text(cleaned_text, start, end)
             else:
                 st.write("No Search Found.")