LSX-UniWue
/

LLaMmlein_1B_chat_selected

Generated from Trainer

Inference Endpoints

Model card | Files and versions | Community

JanPf committed on Nov 22, 2024

Commit

15c3ec6

·

verified ·

1 Parent(s): 515d480

Update README.md

Files changed (1) hide show

README.md +1 -2

README.md CHANGED Viewed

@@ -33,7 +33,7 @@ torch.manual_seed(42)
 # script config
 base_model_name = "LSX-UniWue/LLaMmlein_1B"
 chat_adapter_name = "LSX-UniWue/LLaMmlein_1B_chat_selected"
-device = "mps"  # or cuda
 # chat history
 messages = [
@@ -47,7 +47,6 @@ messages = [
 config = PeftConfig.from_pretrained(chat_adapter_name)
 base_model = model = AutoModelForCausalLM.from_pretrained(
     base_model_name,
-    attn_implementation="flash_attention_2" if device == "cuda" else None,
     torch_dtype=torch.bfloat16,
     device_map=device,
 )

 # script config
 base_model_name = "LSX-UniWue/LLaMmlein_1B"
 chat_adapter_name = "LSX-UniWue/LLaMmlein_1B_chat_selected"
+device = "cuda"  # or mps
 # chat history
 messages = [
 config = PeftConfig.from_pretrained(chat_adapter_name)
 base_model = model = AutoModelForCausalLM.from_pretrained(
     base_model_name,
     torch_dtype=torch.bfloat16,
     device_map=device,
 )