Spaces:
Sleeping
Sleeping
Elijahbodden
committed on
Update app.py
Browse files
app.py
CHANGED
@@ -10,12 +10,12 @@ from huggingface_hub import upload_file
|
|
10 |
import json
|
11 |
from uuid import uuid4
|
12 |
|
13 |
-
model_id = "Elijahbodden/eliGPTv1.
|
14 |
|
15 |
# MODEL
|
16 |
model = Llama.from_pretrained(
|
17 |
repo_id=model_id,
|
18 |
-
filename="
|
19 |
verbose=True,
|
20 |
n_threads = 2,
|
21 |
n_threads_batch = 2,
|
@@ -73,7 +73,7 @@ def respond(
|
|
73 |
stop=["<|im_end|>"],
|
74 |
min_p=min_p,
|
75 |
max_tokens=max_tokens,
|
76 |
-
# Disable top-
|
77 |
top_k=100000000,
|
78 |
frequency_penalty=frequency_penalty,
|
79 |
presence_penalty=presence_penalty,
|
@@ -90,7 +90,7 @@ demo = gr.ChatInterface(
|
|
90 |
additional_inputs_accordion=gr.Accordion(label="Options", open=True),
|
91 |
css=".bubble-gap {gap: 6px !important}",
|
92 |
theme="shivi/calm_seafoam",
|
93 |
-
description="The model may
|
94 |
title="EliGPT v1.3",
|
95 |
additional_inputs=[
|
96 |
gr.Radio(presets.keys(), label="Personality preset", info="VERY SLIGHTLY influence the model's personality [WARNING, IF YOU CHANGE THIS WHILE THERE ARE MESSAGES IN THE CHAT, THE MODEL WILL BECOME VERY SLOW]", value="Default"),
|
|
|
10 |
import json
|
11 |
from uuid import uuid4
|
12 |
|
13 |
+
model_id = "Elijahbodden/eliGPTv1.3"
|
14 |
|
15 |
# MODEL
|
16 |
model = Llama.from_pretrained(
|
17 |
repo_id=model_id,
|
18 |
+
filename="model.gguf",
|
19 |
verbose=True,
|
20 |
n_threads = 2,
|
21 |
n_threads_batch = 2,
|
|
|
73 |
stop=["<|im_end|>"],
|
74 |
min_p=min_p,
|
75 |
max_tokens=max_tokens,
|
76 |
+
# Disable top-k pruning
|
77 |
top_k=100000000,
|
78 |
frequency_penalty=frequency_penalty,
|
79 |
presence_penalty=presence_penalty,
|
|
|
90 |
additional_inputs_accordion=gr.Accordion(label="Options", open=True),
|
91 |
css=".bubble-gap {gap: 6px !important}",
|
92 |
theme="shivi/calm_seafoam",
|
93 |
+
description="The model may be slow if it hasn't run recently or a lot of people are using it",
|
94 |
title="EliGPT v1.3",
|
95 |
additional_inputs=[
|
96 |
gr.Radio(presets.keys(), label="Personality preset", info="VERY SLIGHTLY influence the model's personality [WARNING, IF YOU CHANGE THIS WHILE THERE ARE MESSAGES IN THE CHAT, THE MODEL WILL BECOME VERY SLOW]", value="Default"),
|