secretmoon committed
Commit c88a22d
1 Parent(s): 882b03a

Upload lora.yml


axolotl LoRA training config
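For reference, axolotl consumes a YAML config like this one directly; per the axolotl README, a run of this kind is typically launched with `accelerate launch -m axolotl.cli.train lora.yml` (assuming axolotl and accelerate are installed).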

Files changed (1)
  1. lora.yml +74 -0
lora.yml ADDED
@@ -0,0 +1,74 @@
+ base_model: /mnt/WD/AI/text-generation-webui/models/L3-8B-Stheno-v3.1/
+ model_type: AutoModelForCausalLM
+ tokenizer_type: AutoTokenizer
+
+ load_in_8bit: true
+ load_in_4bit: false
+ strict: false
+
+ datasets:
+   - path: 94_stories.jsonl
+     type: completion
+   - path: Luna_personality_instruct.json
+     type: alpaca
+   - path: alpaca_wiki_6144.json
+     type: alpaca
+   - path: alpaca_Luna.json
+     type: alpaca
+ dataset_prepared_path: last_run_prepared
+ val_set_size: 0
+ output_dir: ./lora-out
+ lora_on_cpu: true
+
+ adapter: lora
+ lora_model_dir:
+
+ sequence_len: 6144
+ sample_packing: true
+ pad_to_sequence_len: true
+
+ lora_r: 256
+ lora_alpha: 64
+ lora_dropout: 0.04
+ lora_target_modules:
+ lora_target_linear: true
+ lora_fan_in_fan_out:
+
+ wandb_project:
+ wandb_entity:
+ wandb_watch:
+ wandb_name:
+ wandb_log_model:
+
+ gradient_accumulation_steps: 1
+ micro_batch_size: 2
+ num_epochs: 3
+ optimizer: adamw_bnb_8bit
+ lr_scheduler: cosine
+ learning_rate: 0.00033
+
+ train_on_inputs: false
+ group_by_length: false
+ bf16: true
+ fp16:
+ tf32: true
+
+ gradient_checkpointing: true
+ early_stopping_patience:
+ resume_from_checkpoint:
+ local_rank:
+ logging_steps: 1
+ xformers_attention:
+ flash_attention: true
+
+ warmup_steps: 50
+ evals_per_epoch: 4
+ eval_table_size:
+ saves_per_epoch: 1
+ debug:
+ deepspeed:
+ weight_decay: 0.0
+ fsdp:
+ fsdp_config:
+ special_tokens:
+   pad_token: "<|end_of_text|>"
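For anyone reproducing the run: axolotl writes the trained adapter to output_dir (./lora-out above). What follows is a minimal sketch of loading that adapter for inference with transformers + peft; the paths are copied from the config, while library versions and hardware are assumptions.

# A minimal sketch (not part of this repo) of loading the finished adapter.
# Assumptions: transformers, peft and bitsandbytes are installed, and the
# paths below match base_model and output_dir in the config above.
from peft import PeftModel
from transformers import AutoModelForCausalLM, AutoTokenizer, BitsAndBytesConfig

base_path = "/mnt/WD/AI/text-generation-webui/models/L3-8B-Stheno-v3.1/"

# Mirror load_in_8bit: true from the training config.
base = AutoModelForCausalLM.from_pretrained(
    base_path,
    quantization_config=BitsAndBytesConfig(load_in_8bit=True),
    device_map="auto",
)
tokenizer = AutoTokenizer.from_pretrained(base_path)

# Attach the LoRA weights that axolotl saved to output_dir (./lora-out).
# The adapter's effective scale is lora_alpha / lora_r = 64 / 256 = 0.25.
model = PeftModel.from_pretrained(base, "./lora-out")
model.eval()

If a standalone merged model is needed, peft's merge_and_unload() can fold the adapter into the base weights, though that is usually done on an unquantized (fp16/bf16) load rather than the 8-bit one shown here.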