Spaces:

GSridhar1982
/

QA_Llama31_Quantized_GGUF

Sleeping

GSridhar1982 committed on Sep 14

Commit

64be64c

•

1 Parent(s): 1062cdf

Updated the model

Files changed (1) hide show

app.py CHANGED Viewed

@@ -5,7 +5,7 @@ import subprocess
 def predict(text):
     # Call llama.cpp with the input text
     result = subprocess.run(
-        ["./llama.cpp/main", "-m", "path/to/your/model", "-p", text],
         capture_output=True,
         text=True
     )
@@ -14,8 +14,8 @@ def predict(text):
 # Create a Gradio interface
 iface = gr.Interface(
     fn=predict,
-    inputs=gr.Textbox(lines=2, placeholder="Enter text here..."),
-    outputs="text",
     title="LLaMA Model Inference",
     description="Enter text to generate using the LLaMA model."
 )

 def predict(text):
     # Call llama.cpp with the input text
     result = subprocess.run(
+        ["./llama.cpp/main", "-m", "GSridhar1982/QA_Llama31_Quantized_GGUF", "-p", text],
         capture_output=True,
         text=True
     )
 # Create a Gradio interface
 iface = gr.Interface(
     fn=predict,
+    inputs=gr.Textbox(lines=2, placeholder="Enter question here..."),
+    outputs="Answer",
     title="LLaMA Model Inference",
     description="Enter text to generate using the LLaMA model."
 )