Update README.md
Browse files
README.md
CHANGED
@@ -118,7 +118,7 @@ prepare_for_inference(model, backend=backend, verbose=False)
|
|
118 |
############################################################
|
119 |
#Generate (streaming)
|
120 |
from hqq.utils.generation_hf import HFGenerator
|
121 |
-
gen = HFGenerator(model, tokenizer, max_new_tokens=
|
122 |
|
123 |
prompt = "If A equals B, and C equals B - A, what would be the value of C?"
|
124 |
out = gen.generate(prompt, print_tokens=True)
|
|
|
118 |
############################################################
|
119 |
#Generate (streaming)
|
120 |
from hqq.utils.generation_hf import HFGenerator
|
121 |
+
gen = HFGenerator(model, tokenizer, max_new_tokens=4096, do_sample=True, compile='partial').warmup()
|
122 |
|
123 |
prompt = "If A equals B, and C equals B - A, what would be the value of C?"
|
124 |
out = gen.generate(prompt, print_tokens=True)
|