LLM_PLAYGROUND

Running

App Files Community

Kims12 committed 9 days ago

Commit

44cf963

verified ·

1 Parent(s): 0089bb1

Update app.py

Browse files

Files changed (1) hide show

app.py +1 -117

app.py CHANGED Viewed

@@ -4,8 +4,6 @@ import openai
 import anthropic
 import os
 from typing import Optional
-import transformers
-import torch
 #############################
 # [기본코드] - 수정/삭제 불가
@@ -172,62 +170,6 @@ def respond_claude_qna(
     except Exception as e:
         return f"예상치 못한 오류가 발생했습니다: {str(e)}"
-#############################
-# [추가코드] - Llama-3.3-70B-Instruct / Llama-3.2-3B-Instruct 적용 (transformers.pipeline 방식)
-#############################
-def get_llama_client(model_choice: str):
-    """
-    선택된 Llama 모델에 맞춰 transformers의 text-generation 파이프라인을 생성.
-    """
-    if model_choice == "Llama-3.3-70B-Instruct":
-        model_id = "meta-llama/Llama-3.3-70B-Instruct"
-    elif model_choice == "Llama-3.2-3B-Instruct":
-        model_id = "meta-llama/Llama-3.2-3B-Instruct"
-    else:
-        raise ValueError("유효하지 않은 모델 선택입니다.")
-    pipeline_llama = transformers.pipeline(
-        "text-generation",
-        model=model_id,
-        model_kwargs={"torch_dtype": torch.bfloat16},
-        device_map="auto",
-    )
-    return pipeline_llama
-def respond_llama_qna(
-    question: str,
-    system_message: str,
-    max_tokens: int,
-    temperature: float,
-    top_p: float,
-    model_choice: str
-):
-    """
-    선택된 Llama 모델을 이용해 한 번의 질문(question)에 대한 답변을 transformers 파이프라인으로 반환하는 함수.
-    system_message와 question을 하나의 프롬프트로 결합하여 생성합니다.
-    """
-    try:
-        pipeline_llama = get_llama_client(model_choice)
-    except ValueError as e:
-        return f"오류: {str(e)}"
-    # system_message와 question을 연결하여 프롬프트 생성
-    prompt = system_message.strip() + "\n" + question.strip()
-    try:
-        outputs = pipeline_llama(
-            prompt,
-            max_new_tokens=max_tokens,
-            temperature=temperature,
-            top_p=top_p,
-        )
-        # 생성된 텍스트를 추출 (전체 프롬프트 이후의 텍스트만 반환할 수도 있음)
-        generated_text = outputs[0]["generated_text"]
-        return generated_text
-    except Exception as e:
-        return f"오류가 발생했습니다: {str(e)}"
 #############################
 # [기본코드] UI 부분 - 수정/삭제 불가
 #############################
@@ -463,66 +405,8 @@ with gr.Blocks() as demo:
             outputs=deepseek_answer_output
         )
-    #################
-    # Llama 탭 (추가)
-    #################
-    with gr.Tab("Llama"):
-        # 라디오 버튼 추가: Llama-3.3-70B-Instruct (기본) / Llama-3.2-3B-Instruct
-        llama_model_radio = gr.Radio(
-            choices=["Llama-3.3-70B-Instruct", "Llama-3.2-3B-Instruct"],
-            label="모델 선택",
-            value="Llama-3.3-70B-Instruct"
-        )
-        llama_input1 = gr.Textbox(label="입력1", lines=1)
-        llama_input2 = gr.Textbox(label="입력2", lines=1)
-        llama_input3 = gr.Textbox(label="입력3", lines=1)
-        llama_input4 = gr.Textbox(label="입력4", lines=1)
-        llama_input5 = gr.Textbox(label="입력5", lines=1)
-        llama_answer_output = gr.Textbox(label="결과", lines=5, interactive=False)
-        with gr.Accordion("고급 설정 (Llama)", open=False):
-            llama_system_message = gr.Textbox(
-                value="""반드시 한글로 답변할 것.
-너는 최고의 비서이다.
-내가 요구하는 것을 최대한 자세하고 정확하게 답변하라.
-""",
-                label="System Message",
-                lines=3
-            )
-            llama_max_tokens = gr.Slider(minimum=100, maximum=10000, value=4000, step=100, label="Max Tokens")
-            llama_temperature = gr.Slider(minimum=0.1, maximum=2.0, value=0.7, step=0.1, label="Temperature")
-            llama_top_p = gr.Slider(minimum=0.1, maximum=1.0, value=0.95, step=0.05, label="Top-P")
-        llama_submit_button = gr.Button("전송")
-        def merge_and_call_llama(i1, i2, i3, i4, i5, sys_msg, mt, temp, top_p_, model_choice):
-            question = " ".join([i1, i2, i3, i4, i5])
-            return respond_llama_qna(
-                question=question,
-                system_message=sys_msg,
-                max_tokens=mt,
-                temperature=temp,
-                top_p=top_p_,
-                model_choice=model_choice
-            )
-        llama_submit_button.click(
-            fn=merge_and_call_llama,
-            inputs=[
-                llama_input1, llama_input2, llama_input3, llama_input4, llama_input5,
-                llama_system_message,
-                llama_max_tokens,
-                llama_temperature,
-                llama_top_p,
-                llama_model_radio  # 라디오 버튼 입력 추가
-            ],
-            outputs=llama_answer_output
-        )
 #############################
 # 메인 실행부
 #############################
 if __name__ == "__main__":
-    demo.launch()

 import anthropic
 import os
 from typing import Optional
 #############################
 # [기본코드] - 수정/삭제 불가
     except Exception as e:
         return f"예상치 못한 오류가 발생했습니다: {str(e)}"
 #############################
 # [기본코드] UI 부분 - 수정/삭제 불가
 #############################
             outputs=deepseek_answer_output
         )
 #############################
 # 메인 실행부
 #############################
 if __name__ == "__main__":
+    demo.launch()