Spaces:

ASLP-lab
/

OSUM

Running on Zero

App Files Community

tomxxie committed 7 days ago

Commit

dd9bb13

1 Parent(s): d9ae2cb

新增链接

Browse files

Files changed (2) hide show

app.py +58 -26
app_old.py +58 -26

app.py CHANGED Viewed

@@ -158,11 +158,35 @@ def download_audio(input_wav_path):
     else:
         return None
 # 创建 Gradio 界面
-with gr.Blocks() as demo:
     # 添加标题
     gr.Markdown(
-        f"""
         <div style="display: flex; align-items: center; justify-content: center; text-align: center;">
             <h1 style="font-family: 'Arial', sans-serif; color: #014377; font-size: 32px; margin-bottom: 0; display: inline-block; vertical-align: middle;">
                 OSUM Speech Understanding Model Test
@@ -175,17 +199,17 @@ with gr.Blocks() as demo:
     with gr.Row():
         with gr.Column(scale=1):
             audio_input = gr.Audio(label="Record", type="filepath")
-        with gr.Column(scale=1, min_width=300):  # 给输出框设置最小宽度，确保等高对齐
             output_text = gr.Textbox(label="Output", lines=8, placeholder="The generated result will be displayed here...", interactive=False)
     # 添加任务选择和自定义输入框
     with gr.Row():
         task_dropdown = gr.Dropdown(
             label="Task",
-            choices=list(TASK_PROMPT_MAPPING.keys()) + ["Custom Task Prompt"],  # 新增选项
             value="ASR (Automatic Speech Recognition)"
         )
-        custom_prompt_input = gr.Textbox(label="Custom Task Prompt", placeholder="Please enter a custom task prompt...", visible=False)  # 新增文本输入框
     # 添加按钮（下载按钮在左边，开始处理按钮在右边）
     with gr.Row():
@@ -205,20 +229,24 @@ with gr.Blocks() as demo:
         save_button = gr.Button("Submit Feedback", variant="secondary")
     # 添加底部内容
-    with gr.Row():
-        # 底部内容容器
-        with gr.Column(scale=1, min_width=800):  # 设置最小宽度以确保内容居中
-            gr.Markdown(
-                f"""
-                <div style="position: fixed; bottom: 20px; left: 50%; transform: translateX(-50%); display: flex; align-items: center; justify-content: center; gap: 20px;">
-                    <div style="text-align: center;">
-                        <p style="margin: 0;"><strong>Audio, Speech and Language Processing Group (ASLP@NPU),</strong></p>
-                        <p style="margin: 0;"><strong>Northwestern Polytechnical University</strong></p>
-                    </div>
-                    <img src="data:image/png;base64,{encoded_string}" alt="OSUM Logo" style="height: 80px; width: auto;">
-                </div>
-                """
-            )
     # 绑定事件
     def show_confirmation(output_res, input_wav_path, input_prompt):
@@ -229,12 +257,16 @@ with gr.Blocks() as demo:
         return gr.update(visible=False)
     def handle_submit(input_wav_path, task_choice, custom_prompt):
-        if task_choice == "Custom Task Prompt":
-            input_prompt = custom_prompt  # 使用用户输入的自定义文本
-        else:
-            input_prompt = TASK_PROMPT_MAPPING.get(task_choice, "未知任务类型")  # 使用预定义的提示
-        output_res = do_decode(input_wav_path, input_prompt)
-        return output_res
     # 当任务选择框的值发生变化时，更新自定义输入框的可见性
     task_dropdown.change(
@@ -256,7 +288,7 @@ with gr.Blocks() as demo:
     download_button.click(
         fn=download_audio,
         inputs=[audio_input],
-        outputs=[download_button]  # 输出到 download_button
     )
     save_button.click(

     else:
         return None
+# 自定义 CSS 样式
+CSS = """
+.custom-footer {
+    position: fixed;
+    bottom: 20px;  /* 距离页面底部的距离 */
+    left: 50%;
+    transform: translateX(-50%);
+    display: flex;
+    align-items: center;
+    justify-content: center;
+    gap: 20px;
+    text-align: center;
+    font-weight: bold;
+    padding-bottom: 20px;  /* 在底部添加额外的间距 */
+}
+.custom-footer p {
+    margin: 0;
+}
+.custom-footer img {
+    height: 80px;
+    width: auto;
+}
+"""
 # 创建 Gradio 界面
+with gr.Blocks(css=CSS) as demo:
     # 添加标题
     gr.Markdown(
+        """
         <div style="display: flex; align-items: center; justify-content: center; text-align: center;">
             <h1 style="font-family: 'Arial', sans-serif; color: #014377; font-size: 32px; margin-bottom: 0; display: inline-block; vertical-align: middle;">
                 OSUM Speech Understanding Model Test
     with gr.Row():
         with gr.Column(scale=1):
             audio_input = gr.Audio(label="Record", type="filepath")
+        with gr.Column(scale=1, min_width=300):
             output_text = gr.Textbox(label="Output", lines=8, placeholder="The generated result will be displayed here...", interactive=False)
     # 添加任务选择和自定义输入框
     with gr.Row():
         task_dropdown = gr.Dropdown(
             label="Task",
+            choices=list(TASK_PROMPT_MAPPING.keys()) + ["Custom Task Prompt"],
             value="ASR (Automatic Speech Recognition)"
         )
+        custom_prompt_input = gr.Textbox(label="Custom Task Prompt", placeholder="Please enter a custom task prompt...", visible=False)
     # 添加按钮（下载按钮在左边，开始处理按钮在右边）
     with gr.Row():
         save_button = gr.Button("Submit Feedback", variant="secondary")
     # 添加底部内容
+    gr.HTML(
+        f"""
+        <div class="custom-footer">
+            <div>
+                <p>
+                    <a href="http://www.nwpu-aslp.org/" target="_blank">Audio, Speech and Language Processing Group (ASLP@NPU)</a>,
+                </p>
+                <p>
+                    Northwestern Polytechnical University
+                </p>
+                <p>
+                    <a href="https://github.com/ASLP-lab/OSUM" target="_blank">GitHub</a>
+                </p>
+            </div>
+            <img src="data:image/png;base64,{encoded_string}" alt="OSUM Logo">
+        </div>
+        """
+    )
     # 绑定事件
     def show_confirmation(output_res, input_wav_path, input_prompt):
         return gr.update(visible=False)
     def handle_submit(input_wav_path, task_choice, custom_prompt):
+        try:
+            if task_choice == "Custom Task Prompt":
+                input_prompt = custom_prompt
+            else:
+                input_prompt = TASK_PROMPT_MAPPING.get(task_choice, "未知任务类型")
+            output_res = do_decode(input_wav_path, input_prompt)
+            return output_res
+        except Exception as e:
+            print(f"Error in handle_submit: {e}")
+            return "Error occurred. Please check the input."
     # 当任务选择框的值发生变化时，更新自定义输入框的可见性
     task_dropdown.change(
     download_button.click(
         fn=download_audio,
         inputs=[audio_input],
+        outputs=[download_button]
     )
     save_button.click(

app_old.py CHANGED Viewed

@@ -158,11 +158,35 @@ def download_audio(input_wav_path):
     else:
         return None
 # 创建 Gradio 界面
-with gr.Blocks() as demo:
     # 添加标题
     gr.Markdown(
-        f"""
         <div style="display: flex; align-items: center; justify-content: center; text-align: center;">
             <h1 style="font-family: 'Arial', sans-serif; color: #014377; font-size: 32px; margin-bottom: 0; display: inline-block; vertical-align: middle;">
                 OSUM Speech Understanding Model Test
@@ -175,17 +199,17 @@ with gr.Blocks() as demo:
     with gr.Row():
         with gr.Column(scale=1):
             audio_input = gr.Audio(label="Record", type="filepath")
-        with gr.Column(scale=1, min_width=300):  # 给输出框设置最小宽度，确保等高对齐
             output_text = gr.Textbox(label="Output", lines=8, placeholder="The generated result will be displayed here...", interactive=False)
     # 添加任务选择和自定义输入框
     with gr.Row():
         task_dropdown = gr.Dropdown(
             label="Task",
-            choices=list(TASK_PROMPT_MAPPING.keys()) + ["Custom Task Prompt"],  # 新增选项
             value="ASR (Automatic Speech Recognition)"
         )
-        custom_prompt_input = gr.Textbox(label="Custom Task Prompt", placeholder="Please enter a custom task prompt...", visible=False)  # 新增文本输入框
     # 添加按钮（下载按钮在左边，开始处理按钮在右边）
     with gr.Row():
@@ -205,20 +229,24 @@ with gr.Blocks() as demo:
         save_button = gr.Button("Submit Feedback", variant="secondary")
     # 添加底部内容
-    with gr.Row():
-        # 底部内容容器
-        with gr.Column(scale=1, min_width=800):  # 设置最小宽度以确保内容居中
-            gr.Markdown(
-                f"""
-                <div style="position: fixed; bottom: 20px; left: 50%; transform: translateX(-50%); display: flex; align-items: center; justify-content: center; gap: 20px;">
-                    <div style="text-align: center;">
-                        <p style="margin: 0;"><strong>Audio, Speech and Language Processing Group (ASLP@NPU),</strong></p>
-                        <p style="margin: 0;"><strong>Northwestern Polytechnical University</strong></p>
-                    </div>
-                    <img src="data:image/png;base64,{encoded_string}" alt="OSUM Logo" style="height: 80px; width: auto;">
-                </div>
-                """
-            )
     # 绑定事件
     def show_confirmation(output_res, input_wav_path, input_prompt):
@@ -229,12 +257,16 @@ with gr.Blocks() as demo:
         return gr.update(visible=False)
     def handle_submit(input_wav_path, task_choice, custom_prompt):
-        if task_choice == "Custom Task Prompt":
-            input_prompt = custom_prompt  # 使用用户输入的自定义文本
-        else:
-            input_prompt = TASK_PROMPT_MAPPING.get(task_choice, "未知任务类型")  # 使用预定义的提示
-        output_res = do_decode(input_wav_path, input_prompt)
-        return output_res
     # 当任务选择框的值发生变化时，更新自定义输入框的可见性
     task_dropdown.change(
@@ -256,7 +288,7 @@ with gr.Blocks() as demo:
     download_button.click(
         fn=download_audio,
         inputs=[audio_input],
-        outputs=[download_button]  # 输出到 download_button
     )
     save_button.click(

     else:
         return None
+# 自定义 CSS 样式
+CSS = """
+.custom-footer {
+    position: fixed;
+    bottom: 20px;  /* 距离页面底部的距离 */
+    left: 50%;
+    transform: translateX(-50%);
+    display: flex;
+    align-items: center;
+    justify-content: center;
+    gap: 20px;
+    text-align: center;
+    font-weight: bold;
+    padding-bottom: 20px;  /* 在底部添加额外的间距 */
+}
+.custom-footer p {
+    margin: 0;
+}
+.custom-footer img {
+    height: 80px;
+    width: auto;
+}
+"""
 # 创建 Gradio 界面
+with gr.Blocks(css=CSS) as demo:
     # 添加标题
     gr.Markdown(
+        """
         <div style="display: flex; align-items: center; justify-content: center; text-align: center;">
             <h1 style="font-family: 'Arial', sans-serif; color: #014377; font-size: 32px; margin-bottom: 0; display: inline-block; vertical-align: middle;">
                 OSUM Speech Understanding Model Test
     with gr.Row():
         with gr.Column(scale=1):
             audio_input = gr.Audio(label="Record", type="filepath")
+        with gr.Column(scale=1, min_width=300):
             output_text = gr.Textbox(label="Output", lines=8, placeholder="The generated result will be displayed here...", interactive=False)
     # 添加任务选择和自定义输入框
     with gr.Row():
         task_dropdown = gr.Dropdown(
             label="Task",
+            choices=list(TASK_PROMPT_MAPPING.keys()) + ["Custom Task Prompt"],
             value="ASR (Automatic Speech Recognition)"
         )
+        custom_prompt_input = gr.Textbox(label="Custom Task Prompt", placeholder="Please enter a custom task prompt...", visible=False)
     # 添加按钮（下载按钮在左边，开始处理按钮在右边）
     with gr.Row():
         save_button = gr.Button("Submit Feedback", variant="secondary")
     # 添加底部内容
+    gr.HTML(
+        f"""
+        <div class="custom-footer">
+            <div>
+                <p>
+                    <a href="http://www.nwpu-aslp.org/" target="_blank">Audio, Speech and Language Processing Group (ASLP@NPU)</a>,
+                </p>
+                <p>
+                    Northwestern Polytechnical University
+                </p>
+                <p>
+                    <a href="https://github.com/ASLP-lab/OSUM" target="_blank">GitHub</a>
+                </p>
+            </div>
+            <img src="data:image/png;base64,{encoded_string}" alt="OSUM Logo">
+        </div>
+        """
+    )
     # 绑定事件
     def show_confirmation(output_res, input_wav_path, input_prompt):
         return gr.update(visible=False)
     def handle_submit(input_wav_path, task_choice, custom_prompt):
+        try:
+            if task_choice == "Custom Task Prompt":
+                input_prompt = custom_prompt
+            else:
+                input_prompt = TASK_PROMPT_MAPPING.get(task_choice, "未知任务类型")
+            output_res = do_decode(input_wav_path, input_prompt)
+            return output_res
+        except Exception as e:
+            print(f"Error in handle_submit: {e}")
+            return "Error occurred. Please check the input."
     # 当任务选择框的值发生变化时，更新自定义输入框的可见性
     task_dropdown.change(
     download_button.click(
         fn=download_audio,
         inputs=[audio_input],
+        outputs=[download_button]
     )
     save_button.click(