mobicham committed on
Commit
16f6691
·
verified ·
1 Parent(s): dc380b4

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +1 -1
README.md CHANGED
@@ -118,7 +118,7 @@ prepare_for_inference(model, backend=backend, verbose=False)
118
  ############################################################
119
  #Generate (streaming)
120
  from hqq.utils.generation_hf import HFGenerator
121
- gen = HFGenerator(model, tokenizer, max_new_tokens=8192, do_sample=True, compile='partial').warmup()
122
 
123
  prompt = "If A equals B, and C equals B - A, what would be the value of C?"
124
  out = gen.generate(prompt, print_tokens=True)
 
118
  ############################################################
119
  #Generate (streaming)
120
  from hqq.utils.generation_hf import HFGenerator
121
+ gen = HFGenerator(model, tokenizer, max_new_tokens=4096, do_sample=True, compile='partial').warmup()
122
 
123
  prompt = "If A equals B, and C equals B - A, what would be the value of C?"
124
  out = gen.generate(prompt, print_tokens=True)