Update app.py
app.py CHANGED
@@ -25,9 +25,7 @@ model = PeftModel.from_pretrained(model, model_id)
 def greet(text):
     with torch.no_grad():
         # Include EOS token for better context
-        input_text = "<s>###
-            f"### Input:\n{text}\n\n" +
-            "### Response:\n"
+        input_text = f"<s>### User:\n{text}\n\n### Assistant:\n"
 
         batch = tokenizer(input_text, return_tensors='pt', add_special_tokens=True).to(device)
 
@@ -42,8 +40,8 @@ def greet(text):
         # Decode only the generated tokens
         response = tokenizer.decode(output_tokens[0][len(batch['input_ids'][0]):], skip_special_tokens=True)
 
-        # Additional stopping condition at next "
-        response_parts = response.split("
+        # Additional stopping condition at the next "### Assistant:" marker
+        response_parts = response.split("### Assistant:")
         return response_parts[0]  # Return only the first part
 
 iface = gr.Interface(fn=greet, inputs="text", outputs="text", title="PEFT Model for Big Brain")
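For context, a minimal standalone sketch of the two pieces of string handling this commit touches: the f-string prompt template and the split-based stopping condition. The helper names build_prompt and truncate_response are illustrative only; the model, tokenizer, and generation call from the rest of app.py are assumed and not shown here.

def build_prompt(text: str) -> str:
    # f-string so the user input is interpolated into the template;
    # without the f prefix, the literal "{text}" would reach the model.
    return f"<s>### User:\n{text}\n\n### Assistant:\n"

def truncate_response(response: str) -> str:
    # Cut the decoded output at the next "### Assistant:" marker, in case
    # the model keeps generating extra turns after its first answer.
    return response.split("### Assistant:")[0]

if __name__ == "__main__":
    print(build_prompt("What does this Space do?"))
    raw = "It serves a PEFT model.\n\n### Assistant:\nAnd it also..."
    print(truncate_response(raw))  # -> "It serves a PEFT model.\n\n"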