Spaces:

PDAson
/

SGG-relation-annotator

Sleeping

App Files Files Community

PDAson committed 19 days ago

Commit

aac1fab

verified ·

1 Parent(s): a203f9e

Upload 3 files

Browse files

Files changed (3) hide show

annotator_v3_3.py +378 -0
requirements.txt +80 -0
sample_six_grid_split_4_new.json +0 -0

annotator_v3_3.py ADDED Viewed

	@@ -0,0 +1,378 @@

+import gradio as gr
+import json
+import os
+import re
+from collections import defaultdict
def load_main_data(json_file_path):
    """Read the annotation source file and return its parsed JSON content.

    The file is assumed to hold a list whose elements look like:
    {
      'image_path': 'some_path',
      'subject': 'xxx',
      'object': 'yyy',
      'options': { 'state': [...], 'action': [...], 'spatial': [...] }
    }
    No validation of that shape is performed here; whatever the JSON
    document decodes to is returned unchanged.
    """
    with open(json_file_path, mode='r', encoding='utf-8') as handle:
        raw_text = handle.read()
    return json.loads(raw_text)
def load_output_dict(output_file):
    """Load previously saved annotations.

    Returns the decoded dictionary stored in ``output_file``. An empty
    dictionary is returned instead when the file does not exist, when it
    does not contain valid JSON, or when the decoded value is not a dict.
    """
    if not os.path.exists(output_file):
        return {}
    try:
        with open(output_file, 'r', encoding='utf-8') as handle:
            parsed = json.load(handle)
    except json.JSONDecodeError:
        # Unreadable results are treated the same as "nothing labelled yet".
        return {}
    return parsed if isinstance(parsed, dict) else {}
def save_output_dict(output_file, data):
    """Persist the annotation results to ``output_file`` as UTF-8 JSON.

    The JSON is first written to a sibling ``<output_file>.tmp`` file and
    then moved over the destination with ``os.replace``. If serialisation
    or writing fails part-way, the previous results file is therefore left
    untouched instead of being truncated.

    Args:
        output_file: Destination path of the results file.
        data: JSON-serialisable object (the annotations dictionary).

    Raises:
        TypeError / ValueError: if ``data`` cannot be serialised to JSON.
        OSError: if the temporary file cannot be written or moved.
    """
    tmp_path = f"{output_file}.tmp"
    try:
        with open(tmp_path, 'w', encoding='utf-8') as handle:
            json.dump(data, handle, indent=2, ensure_ascii=False)
        os.replace(tmp_path, output_file)
    finally:
        # After a successful replace the temp file is gone; after a failure
        # this removes the partial file so no stray artefact is left behind.
        if os.path.exists(tmp_path):
            os.remove(tmp_path)
def extract_image_id_from_path(full_path):
    """
    Return the 'image_<digits>' part of the file name in ``full_path``.

    When the file name contains no such part, the bare file name (directory
    stripped) is returned instead.
    Example:
      annotated_image_folder\\split_4\\output_images_1592503\\image_1592503_pair_2_black bus_parked on.jpg
      -> 'image_1592503'
    """
    # Normalise Windows separators so basename works the same everywhere.
    normalized = full_path.replace("\\", "/")
    file_name = os.path.basename(normalized)
    # Look for "image_" followed by one or more digits inside the file name.
    found = re.search(r"(image_\d+)", file_name)
    # Falling back to the file name is a last resort; it is not expected to
    # happen for many files.
    return found.group(1) if found else file_name
def gradio_interface(json_file_path='sample_six_grid_split_4_new.json'):
    """Build the Gradio annotation app for subject/object relation pairs.

    Every record of the input JSON list is shown with its image and three
    groups of candidate relations ("state", "action", "spatial"). In each
    group the first five candidates are offered as a Radio and the rest as
    a Dropdown. Records are grouped by the image id extracted from their
    "image_path", so the status line can show both the global position and
    "Pair x/y for this image". Results are stored in 'output.json', keyed
    by the record index as a string.

    Args:
        json_file_path: Path of the JSON file holding the list of records
            (keys read here: "image_path", "subject", "object", "options").

    Returns:
        The assembled ``gr.Blocks`` app; the caller is responsible for
        launching it.

    Raises:
        ValueError: if the JSON file contains no records.
    """
    data = load_main_data(json_file_path)  # expected to be a list of records
    if not data:
        # Without this guard the failure is an opaque IndexError below, or a
        # ZeroDivisionError on the first navigation click.
        raise ValueError(f"No annotation items found in {json_file_path!r}")
    output_file = 'output.json'
    # NOTE(review): this dict lives in the closure, so it appears to be shared
    # by every browser session of the app -- confirm that is intended.
    labeled_data = load_output_dict(output_file)
    categories = ("state", "action", "spatial")

    # ---------------------------------------------------
    # 1) Pre-processing: group record indices by image id
    # ---------------------------------------------------
    image_to_indices = defaultdict(list)
    for idx, item in enumerate(data):
        image_id = extract_image_id_from_path(item.get("image_path") or "")
        image_to_indices[image_id].append(idx)
    local_index_map = {}
    local_count_map = {}
    for idx_list in image_to_indices.values():
        # Order of first appearance is preserved.
        for local_i, real_idx in enumerate(idx_list):
            local_index_map[real_idx] = local_i
            local_count_map[real_idx] = len(idx_list)

    # ---------------------------------------------------
    # 2) Helper functions
    # ---------------------------------------------------
    def resolve_image(raw_path):
        """Return an existing image file for raw_path, or None.

        Tries the path as written, then with backslashes turned into
        slashes (the data may carry Windows-style paths), then the
        placeholder image. None leaves the image widget empty instead of
        handing Gradio a file that does not exist.
        """
        for candidate in (raw_path, raw_path.replace("\\", "/"), "placeholder.jpg"):
            if candidate and os.path.isfile(candidate):
                return candidate
        return None

    def get_item_info(idx):
        """Return (image_path, subject, object, options) for record idx."""
        item = data[idx]
        image_path = resolve_image(item.get("image_path") or "")
        subject = item.get("subject", "")
        obj = item.get("object", "")
        opts = item.get("options") or {}
        return image_path, subject, obj, opts

    def split_options(options_list):
        """First five options go to the Radio, the rest to the Dropdown."""
        return options_list[:5], options_list[5:]

    def restore_choice(saved, radio_opts, dd_opts):
        """Map a saved label onto (radio value, dropdown value, final value).

        The widget that offers the saved label gets it as its value, so the
        hidden final box and the visible widgets always agree; a label that
        is no longer offered by either widget is dropped.
        """
        radio_val = saved if saved in radio_opts else None
        dd_val = saved if radio_val is None and saved in dd_opts else None
        return radio_val, dd_val, radio_val or dd_val

    def update_final_selection(radio_val, dropdown_val):
        """The Radio wins; otherwise the Dropdown value (or None)."""
        if radio_val:
            return radio_val
        return dropdown_val or None

    def update_skip_value(checked):
        """Mirror the skip checkbox (bool) into the hidden textbox (str)."""
        return str(checked)

    def build_view(idx):
        """Collect everything needed to display record idx.

        Returns (image_path, status, info, header, skip flag, choices),
        where choices holds one (radio options, dropdown options,
        radio value, dropdown value, final value) tuple per category.
        """
        image_path, sub, obj, opts = get_item_info(idx)
        status = (
            f"Currently showing: {idx+1}/{len(data)}. "
            f"(Pair {local_index_map[idx]+1}/{local_count_map[idx]} for this image.)"
        )
        info = f"Subject: {sub}, Object: {obj}"
        header = f"**{sub} → {obj}**"
        rec = labeled_data.get(str(idx), {})
        skip_val = rec.get("skip", False) is True
        choices = []
        for category in categories:
            radio_opts, dd_opts = split_options(opts.get(category, []))
            # A skipped pair carries no labels.
            saved = None if skip_val else rec.get(category)
            choices.append(
                (radio_opts, dd_opts) + restore_choice(saved, radio_opts, dd_opts)
            )
        return image_path, status, info, header, skip_val, choices

    # ---------------------------------------------------
    # 3) Initial view: record 0, including anything already saved for it
    # ---------------------------------------------------
    init_idx = 0
    (init_image, init_status, init_info, init_header,
     init_skip_val, init_choices) = build_view(init_idx)

    # ---------------------------------------------------
    # 4) Build the Gradio UI
    # ---------------------------------------------------
    with gr.Blocks() as demo:
        cur_idx_state = gr.State(init_idx)
        with gr.Row():
            # Left: image, status, details and the paging buttons.
            with gr.Column(scale=1):
                img_view = gr.Image(value=init_image, label="Image")
                # Shows the global progress plus the progress within the image.
                status_box = gr.Textbox(
                    value=init_status,
                    label="Status",
                    interactive=False
                )
                info_box = gr.Textbox(
                    value=init_info,
                    label="Details",
                    interactive=False
                )
                with gr.Row():
                    btn_prev = gr.Button("← Previous", variant="secondary")
                    btn_next = gr.Button("Next →", variant="primary")
            # Right: the labelling controls.
            with gr.Column(scale=1):
                # (Subject -> Object) header and the skip checkbox share a row.
                with gr.Row():
                    subject_object_md = gr.Markdown(
                        init_header,
                        elem_id="subject_object_header"
                    )
                    skip_checkbox = gr.Checkbox(
                        value=init_skip_val,
                        label="No relation (skip this pair)"
                    )
                skip_final = gr.Textbox(value=str(init_skip_val), visible=False)
                skip_checkbox.change(
                    fn=update_skip_value,
                    inputs=[skip_checkbox],
                    outputs=[skip_final]
                )
                # One identical section per category: heading, Radio,
                # Dropdown and a hidden textbox holding the effective choice.
                category_widgets = []
                for category, choice in zip(categories, init_choices):
                    radio_opts, dd_opts, radio_val, dd_val, final_val = choice
                    title = category.capitalize()
                    gr.Markdown(f"### {title}")
                    radio = gr.Radio(choices=radio_opts, value=radio_val, label="Top 5")
                    dropdown = gr.Dropdown(choices=dd_opts, value=dd_val, label="More Options")
                    final = gr.Textbox(value=final_val, visible=False, label=f"Final {title}")
                    for widget in (radio, dropdown):
                        widget.change(
                            fn=update_final_selection,
                            inputs=[radio, dropdown],
                            outputs=final
                        )
                    category_widgets.append((radio, dropdown, final))
        # Save button at the bottom.
        with gr.Row():
            btn_save = gr.Button("Save", variant="primary")

        # ---------------------------------------------------
        # 5) Paging
        # ---------------------------------------------------
        def _jump_to_index(new_idx):
            """Return the new values for every component in nav_outputs."""
            image_path, status, info, header, skip_val, choices = build_view(new_idx)
            values = [new_idx, image_path, status, info, header, skip_val, str(skip_val)]
            for radio_opts, dd_opts, radio_val, dd_val, final_val in choices:
                values.extend([
                    gr.update(choices=radio_opts, value=radio_val),
                    gr.update(choices=dd_opts, value=dd_val),
                    final_val,
                ])
            return tuple(values)

        def go_next(cur_idx):
            # Wraps around from the last record to the first.
            return _jump_to_index((cur_idx + 1) % len(data))

        def go_prev(cur_idx):
            # Wraps around from the first record to the last.
            return _jump_to_index((cur_idx - 1) % len(data))

        # Must stay in the same order as the values built by _jump_to_index.
        nav_outputs = [
            cur_idx_state,
            img_view,
            status_box,
            info_box,
            subject_object_md,
            skip_checkbox,
            skip_final,
        ]
        for radio, dropdown, final in category_widgets:
            nav_outputs.extend([radio, dropdown, final])

        btn_next.click(fn=go_next, inputs=[cur_idx_state], outputs=nav_outputs)
        btn_prev.click(fn=go_prev, inputs=[cur_idx_state], outputs=nav_outputs)

        # ---------------------------------------------------
        # 6) Saving
        # ---------------------------------------------------
        def handle_save(st_val, ac_val, sp_val, cur_idx, skip_val):
            """Store the current record's labels and return a status message."""
            # The skip flag arrives as text from the hidden textbox.
            skip_flag = (skip_val == "True")
            _, sub, obj, _ = get_item_info(cur_idx)
            if skip_flag:
                labeled_data[str(cur_idx)] = {
                    "subject": sub,
                    "object": obj,
                    "skip": True
                }
                save_output_dict(output_file, labeled_data)
                return f"Skipped pair: {sub} - {obj}."
            if not st_val or not ac_val or not sp_val:
                # The message names the checkbox by its actual label.
                return "Please select all 3 categories or check 'No relation (skip this pair)'!"
            labeled_data[str(cur_idx)] = {
                "subject": sub,
                "object": obj,
                "skip": False,
                "state": st_val,
                "action": ac_val,
                "spatial": sp_val
            }
            save_output_dict(output_file, labeled_data)
            return f"Saved: {sub}, {obj}, state={st_val}, action={ac_val}, spatial={sp_val}"

        btn_save.click(
            fn=handle_save,
            inputs=[final for _, _, final in category_widgets] + [cur_idx_state, skip_final],
            outputs=status_box
        )
    return demo
if __name__ == '__main__':
    # Build the annotation UI, then serve it; share=True additionally asks
    # Gradio for a public share link.
    annotator_app = gradio_interface()
    annotator_app.launch(share=True)

requirements.txt ADDED Viewed

	@@ -0,0 +1,80 @@

+aiofiles==23.2.1
+aiohappyeyeballs==2.4.4
+aiohttp==3.10.11
+aiosignal==1.3.1
+altair==5.4.1
+annotated-types==0.7.0
+anyio==4.5.2
+async-timeout==5.0.1
+attrs==24.2.0
+certifi==2024.8.30
+charset-normalizer==3.4.0
+click==8.1.7
+colorama==0.4.6
+contourpy==1.1.1
+cycler==0.12.1
+exceptiongroup==1.2.2
+fastapi==0.115.5
+ffmpy==0.4.0
+filelock==3.16.1
+fonttools==4.55.0
+frozenlist==1.5.0
+fsspec==2024.10.0
+gradio==3.48.0
+gradio_client==0.6.1
+h11==0.14.0
+httpcore==1.0.7
+httpx==0.27.2
+huggingface-hub==0.26.2
+idna==3.10
+importlib_resources==6.4.5
+Jinja2==3.1.4
+jsonschema==4.23.0
+jsonschema-specifications==2023.12.1
+kiwisolver==1.4.7
+linkify-it-py==2.0.3
+markdown-it-py==2.2.0
+MarkupSafe==2.1.5
+matplotlib==3.7.5
+mdit-py-plugins==0.3.3
+mdurl==0.1.2
+multidict==6.1.0
+narwhals==1.15.1
+numpy==1.24.4
+opencv-python==4.10.0.84
+orjson==3.10.12
+packaging==24.2
+pandas==2.0.3
+pillow==10.4.0
+pkgutil_resolve_name==1.3.10
+propcache==0.2.0
+pydantic==2.10.2
+pydantic_core==2.27.1
+pydub==0.25.1
+Pygments==2.18.0
+pyparsing==3.1.4
+python-dateutil==2.9.0.post0
+python-multipart==0.0.17
+pytz==2024.2
+PyYAML==6.0.2
+referencing==0.35.1
+requests==2.32.3
+rich==13.9.4
+rpds-py==0.20.1
+ruff==0.8.0
+semantic-version==2.10.0
+shellingham==1.5.4
+six==1.16.0
+sniffio==1.3.1
+starlette==0.41.3
+tomlkit==0.12.0
+tqdm==4.67.1
+typer==0.13.1
+typing_extensions==4.12.2
+tzdata==2024.2
+uc-micro-py==1.0.3
+urllib3==2.2.3
+uvicorn==0.32.1
+websockets==11.0.3
+yarl==1.15.2
+zipp==3.20.2

sample_six_grid_split_4_new.json ADDED Viewed

The diff for this file is too large to render. See raw diff