Update README.md
Browse files
README.md
CHANGED
|
@@ -118,7 +118,7 @@ prepare_for_inference(model, backend=backend, verbose=False)
|
|
| 118 |
############################################################
|
| 119 |
#Generate (streaming)
|
| 120 |
from hqq.utils.generation_hf import HFGenerator
|
| 121 |
-
gen = HFGenerator(model, tokenizer, max_new_tokens=
|
| 122 |
|
| 123 |
prompt = "If A equals B, and C equals B - A, what would be the value of C?"
|
| 124 |
out = gen.generate(prompt, print_tokens=True)
|
|
|
|
| 118 |
############################################################
|
| 119 |
#Generate (streaming)
|
| 120 |
from hqq.utils.generation_hf import HFGenerator
|
| 121 |
+
gen = HFGenerator(model, tokenizer, max_new_tokens=4096, do_sample=True, compile='partial').warmup()
|
| 122 |
|
| 123 |
prompt = "If A equals B, and C equals B - A, what would be the value of C?"
|
| 124 |
out = gen.generate(prompt, print_tokens=True)
|