updated max_new_tokens in handler.py
Browse files
- handler.py +1 -1
handler.py
CHANGED
@@ -54,7 +54,7 @@ class EndpointHandler:
|
|
54 |
outputs = self.model.generate(
|
55 |
tokenizer_output["input_ids"],
|
56 |
attention_mask=tokenizer_output["attention_mask"],
|
57 |
-
|
58 |
pad_token_id=self.tokenizer.pad_token_id,
|
59 |
do_sample=True,
|
60 |
temperature=0.7,
|
|
|
54 |
outputs = self.model.generate(
|
55 |
tokenizer_output["input_ids"],
|
56 |
attention_mask=tokenizer_output["attention_mask"],
|
57 |
+
max_new_tokens=1024,
|
58 |
pad_token_id=self.tokenizer.pad_token_id,
|
59 |
do_sample=True,
|
60 |
temperature=0.7,
|