Spaces:

Tonic
/

Salamandra-2B-Instruct

Runtime error

App Files Community

Tonic committed on Oct 3, 2024

Commit

51ce0b9

unverified ·

1 Parent(s): 1223061

add demo

Browse files

Files changed (1) hide show

app.py +9 -9

app.py CHANGED Viewed

@@ -13,10 +13,8 @@ model = AutoModelForCausalLM.from_pretrained(
     device_map="auto",
     torch_dtype=torch.bfloat16
 )
-# Set pad_token_id to eos_token_id if it's not set
-if tokenizer.pad_token_id is None:
-    tokenizer.pad_token_id = tokenizer.eos_token_id
 description = """
 Salamandra-2b-instruct is a Transformer-based decoder-only language model that has been pre-trained on 7.8 trillion tokens of highly curated data.
@@ -47,7 +45,7 @@ def generate_text(system_prompt, user_prompt, temperature, max_new_tokens, top_p
     )
     inputs = tokenizer(chat_prompt, return_tensors="pt", padding=True, truncation=True)
-    inputs = {k: v.to(model.device) for k, v in inputs.items()}
     outputs = model.generate(
         **inputs,
@@ -71,23 +69,25 @@ with gr.Blocks() as demo:
     with gr.Row():
         with gr.Column(scale=1):
-            gr.Markdown(description)
         with gr.Column(scale=1):
-            gr.Markdown(join_us)
     with gr.Row():
         with gr.Column(scale=1):
             system_prompt = gr.Textbox(
                 lines=3,
                 label="🖥️ System Prompt",
-                value="You are a helpful, respectful and honest assistant. Always answer as helpfully as possible, while being safe. Your answers should not include any harmful, unethical, racist, sexist, toxic, dangerous, or illegal content. Please ensure that your responses are socially unbiased and positive in nature. If a question does not make any sense, or is not factually coherent, explain why instead of answering something not correct. If you don't know the answer to a question, please don't share false information."
             )
             user_prompt = gr.Textbox(lines=5, label="🙋‍♂️ User Prompt")
             generate_button = gr.Button("Generate with 🦎 Salamandra-2b-instruct")
             with gr.Accordion("🧪 Parameters", open=False):
                 temperature = gr.Slider(0.0, 1.0, value=0.7, label="🌡️ Temperature")
-                max_new_tokens = gr.Slider(1, 1000, value=200, step=1, label="🔢 Max New Tokens")
                 top_p = gr.Slider(0.0, 1.0, value=0.95, label="⚛️ Top P")
                 repetition_penalty = gr.Slider(1.0, 2.0, value=1.2, label="🔁 Repetition Penalty")

     device_map="auto",
     torch_dtype=torch.bfloat16
 )
+# if tokenizer.pad_token_id is None:
+#     tokenizer.pad_token_id = tokenizer.eos_token_id
 description = """
 Salamandra-2b-instruct is a Transformer-based decoder-only language model that has been pre-trained on 7.8 trillion tokens of highly curated data.
     )
     inputs = tokenizer(chat_prompt, return_tensors="pt", padding=True, truncation=True)
+    # inputs = {k: v.to(model.device) for k, v in inputs.items()}
     outputs = model.generate(
         **inputs,
     with gr.Row():
         with gr.Column(scale=1):
+            with gr.Group():
+                gr.Markdown(description)
         with gr.Column(scale=1):
+            with gr.Group():
+                gr.Markdown(join_us)
     with gr.Row():
         with gr.Column(scale=1):
             system_prompt = gr.Textbox(
                 lines=3,
                 label="🖥️ System Prompt",
+                value="You are Tonic-ai a senior expert assistant known for their abilities to explain and answer questions."
             )
             user_prompt = gr.Textbox(lines=5, label="🙋‍♂️ User Prompt")
             generate_button = gr.Button("Generate with 🦎 Salamandra-2b-instruct")
             with gr.Accordion("🧪 Parameters", open=False):
                 temperature = gr.Slider(0.0, 1.0, value=0.7, label="🌡️ Temperature")
+                max_new_tokens = gr.Slider(1, 2046, value=450, step=1, label="🔢 Max New Tokens")
                 top_p = gr.Slider(0.0, 1.0, value=0.95, label="⚛️ Top P")
                 repetition_penalty = gr.Slider(1.0, 2.0, value=1.2, label="🔁 Repetition Penalty")