herMaster committed on
Commit
31c311c
1 Parent(s): c315a78

Added repetition penalty (repetition_penalty = 1.5) to the LLM config and removed commented-out options.

Browse files
Files changed (1) hide show
  1. app.py +1 -4
app.py CHANGED
@@ -36,11 +36,8 @@ print("loading the LLM......................................")
36
  llm = AutoModelForCausalLM.from_pretrained("TheBloke/Llama-2-7B-Chat-GGUF",
37
  model_file="llama-2-7b-chat.Q3_K_L.gguf",
38
  model_type="llama",
39
- # config = ctransformers.hub.AutoConfig,
40
- # hf = True
41
  temperature = 0.2,
42
- # max_new_tokens = 1024,
43
- # stop = ['\n']
44
  )
45
 
46
 
 
36
  llm = AutoModelForCausalLM.from_pretrained("TheBloke/Llama-2-7B-Chat-GGUF",
37
  model_file="llama-2-7b-chat.Q3_K_L.gguf",
38
  model_type="llama",
 
 
39
  temperature = 0.2,
40
+ repetition_penalty = 1.5
 
41
  )
42
 
43