Artix

Runtime error

Vitrous committed on Feb 17, 2024

Commit

e0a385c

verified ·

1 Parent(s): c9cc0e9

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -62,11 +62,8 @@ def generate_response(prompt: str) -> dict:
         repetition_penalty=1.1
     )
     # Generate the response
-    #generated_response = pipe(prompt_template)[0]['generated_text']
-    input_ids = tokenizer(prompt_template, return_tensors='pt').input_ids.cuda()
-    output = model.generate(inputs=input_ids, temperature=0.7, do_sample=True, top_p=0.95, top_k=40, max_new_tokens=512)
-    generated_response = (tokenizer.decode(output[0]))
     # Extract the assistant's reply
     assistant_reply = generated_response.split('\n')[1]

         repetition_penalty=1.1
     )
     # Generate the response
+    generated_response = pipe(prompt_template)[0]['generated_text']
     # Extract the assistant's reply
     assistant_reply = generated_response.split('\n')[1]