Update app.py
app.py CHANGED
@@ -42,6 +42,8 @@ base_model = AutoModelForCausalLM.from_pretrained(
 )
 
 model = PeftModel.from_pretrained(base_model, "lakshyaag/llama38binstruct_summarize")
+model.merge_and_unload()
+
 
 # Move model to GPU if available
 if torch.cuda.is_available():
@@ -95,9 +97,7 @@ async def main(message: cl.Message):
     )
 
     # decode output from tokenized output to str output
-    decoded_output = tokenizer.batch_decode(generated_ids
-
-    print(decoded_output)
+    decoded_output = tokenizer.batch_decode(generated_ids)
 
     # return only the generated response (not the prompt) as output
     response = decoded_output[0].split("<|end_header_id|>")[-1]
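For context, below is a minimal, self-contained sketch of the pattern this commit lands on: load the base model, attach the LoRA adapter, fold the adapter weights in with merge_and_unload(), then generate and decode. The base checkpoint name, dtype, prompt, and generation settings are illustrative assumptions and do not come from app.py; only the adapter id and the decode/split logic are taken from the diff.

# Sketch only: names marked "assumed" are not from app.py.
import torch
from transformers import AutoModelForCausalLM, AutoTokenizer
from peft import PeftModel

BASE_MODEL = "meta-llama/Meta-Llama-3-8B-Instruct"  # assumed base checkpoint (not shown in this hunk)
ADAPTER = "lakshyaag/llama38binstruct_summarize"     # adapter id from the diff

tokenizer = AutoTokenizer.from_pretrained(BASE_MODEL)
base_model = AutoModelForCausalLM.from_pretrained(BASE_MODEL, torch_dtype=torch.float16)

# Wrap the base model with the fine-tuned LoRA adapter, then merge the
# adapter weights into the base weights so inference runs on a plain model.
model = PeftModel.from_pretrained(base_model, ADAPTER)
model = model.merge_and_unload()

# Move model to GPU if available
if torch.cuda.is_available():
    model = model.to("cuda")

messages = [{"role": "user", "content": "Summarize the following meeting notes: ..."}]  # placeholder prompt
input_ids = tokenizer.apply_chat_template(
    messages, add_generation_prompt=True, return_tensors="pt"
).to(model.device)

generated_ids = model.generate(input_ids, max_new_tokens=256)

# Decode token ids back to text, then keep only the generated reply
# (everything after the last <|end_header_id|> marker), as app.py does.
decoded_output = tokenizer.batch_decode(generated_ids)
response = decoded_output[0].split("<|end_header_id|>")[-1]
print(response)

Note that merge_and_unload() returns the merged base model; assigning its return value, as in the sketch, is the usual pattern, whereas the commit calls it in place on the PeftModel.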