PEFT
Safetensors
GGUF
German
trl
sft
Generated from Trainer
Inference Endpoints
conversational
JanPf committed on
Commit
15c3ec6
·
verified ·
1 Parent(s): 515d480

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +1 -2
README.md CHANGED
@@ -33,7 +33,7 @@ torch.manual_seed(42)
33
  # script config
34
  base_model_name = "LSX-UniWue/LLaMmlein_1B"
35
  chat_adapter_name = "LSX-UniWue/LLaMmlein_1B_chat_selected"
36
- device = "mps" # or cuda
37
 
38
  # chat history
39
  messages = [
@@ -47,7 +47,6 @@ messages = [
47
  config = PeftConfig.from_pretrained(chat_adapter_name)
48
  base_model = model = AutoModelForCausalLM.from_pretrained(
49
  base_model_name,
50
- attn_implementation="flash_attention_2" if device == "cuda" else None,
51
  torch_dtype=torch.bfloat16,
52
  device_map=device,
53
  )
 
33
  # script config
34
  base_model_name = "LSX-UniWue/LLaMmlein_1B"
35
  chat_adapter_name = "LSX-UniWue/LLaMmlein_1B_chat_selected"
36
+ device = "cuda" # or mps
37
 
38
  # chat history
39
  messages = [
 
47
  config = PeftConfig.from_pretrained(chat_adapter_name)
48
  base_model = model = AutoModelForCausalLM.from_pretrained(
49
  base_model_name,
 
50
  torch_dtype=torch.bfloat16,
51
  device_map=device,
52
  )