Update README.md
Browse files
README.md
CHANGED
@@ -112,7 +112,7 @@ prepare_for_inference(model, backend=backend, verbose=False)
|
|
112 |
############################################################
|
113 |
#Generate (streaming)
|
114 |
from hqq.utils.generation_hf import HFGenerator
|
115 |
-
gen = HFGenerator(model, tokenizer, max_new_tokens=...  # [remainder of the removed line was truncated in this diff view]
|
116 |
|
117 |
prompt = "If A equals B, and C equals B - A, what would be the value of C?"
|
118 |
out = gen.generate(prompt, print_tokens=True)
|
|
|
112 |
############################################################
|
113 |
#Generate (streaming)
|
114 |
from hqq.utils.generation_hf import HFGenerator
|
115 |
+
gen = HFGenerator(model, tokenizer, max_new_tokens=4096, do_sample=True, compile='partial').warmup()
|
116 |
|
117 |
prompt = "If A equals B, and C equals B - A, what would be the value of C?"
|
118 |
out = gen.generate(prompt, print_tokens=True)
|