mobicham committed on
Commit
40f505b
·
verified ·
1 Parent(s): 47daab5

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +1 -1
README.md CHANGED
@@ -112,7 +112,7 @@ prepare_for_inference(model, backend=backend, verbose=False)
112
  ############################################################
113
  #Generate (streaming)
114
  from hqq.utils.generation_hf import HFGenerator
115
- gen = HFGenerator(model, tokenizer, max_new_tokens=8192, do_sample=True, compile='partial').warmup()
116
 
117
  prompt = "If A equals B, and C equals B - A, what would be the value of C?"
118
  out = gen.generate(prompt, print_tokens=True)
 
112
  ############################################################
113
  #Generate (streaming)
114
  from hqq.utils.generation_hf import HFGenerator
115
+ gen = HFGenerator(model, tokenizer, max_new_tokens=4096, do_sample=True, compile='partial').warmup()
116
 
117
  prompt = "If A equals B, and C equals B - A, what would be the value of C?"
118
  out = gen.generate(prompt, print_tokens=True)