Update README.md
Browse files
README.md
CHANGED
|
@@ -112,7 +112,7 @@ prepare_for_inference(model, backend=backend, verbose=False)
|
|
| 112 |
############################################################
|
| 113 |
#Generate (streaming)
|
| 114 |
from hqq.utils.generation_hf import HFGenerator
|
| 115 |
-
gen = HFGenerator(model, tokenizer, max_new_tokens=… [remainder of the removed line is truncated in this diff view]
|
| 116 |
|
| 117 |
prompt = "If A equals B, and C equals B - A, what would be the value of C?"
|
| 118 |
out = gen.generate(prompt, print_tokens=True)
|
|
|
|
| 112 |
############################################################
|
| 113 |
#Generate (streaming)
|
| 114 |
from hqq.utils.generation_hf import HFGenerator
|
| 115 |
+
gen = HFGenerator(model, tokenizer, max_new_tokens=4096, do_sample=True, compile='partial').warmup()
|
| 116 |
|
| 117 |
prompt = "If A equals B, and C equals B - A, what would be the value of C?"
|
| 118 |
out = gen.generate(prompt, print_tokens=True)
|