jpfearnworks
committed on
Commit
•
ac85c0e
1
Parent(s):
f1fbf66
Add Readme, Clean up comments
Browse files
examples/qlora-openllama-3b/README.md
ADDED
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
# qlora-openllama-3b
|
2 |
+
|
3 |
+
```shell
|
4 |
+
accelerate launch scripts/finetune.py examples/qlora-openllama-3b/config.yml
|
5 |
+
|
6 |
+
```
|
examples/{qlora-openllama-3b.yml → qlora-openllama-3b}/config.yml
RENAMED
@@ -26,15 +26,15 @@ wandb_watch:
|
|
26 |
wandb_run_id:
|
27 |
wandb_log_model:
|
28 |
output_dir: ./qlora-out
|
29 |
-
batch_size:
|
30 |
-
micro_batch_size: 4
|
31 |
-
num_epochs: 2
|
32 |
optimizer: paged_adamw_32bit
|
33 |
torchdistx_path:
|
34 |
lr_scheduler: cosine
|
35 |
learning_rate: 0.0002
|
36 |
train_on_inputs: false
|
37 |
-
group_by_length: true
|
38 |
bf16: true
|
39 |
fp16: false
|
40 |
tf32: true
|
|
|
26 |
wandb_run_id:
|
27 |
wandb_log_model:
|
28 |
output_dir: ./qlora-out
|
29 |
+
batch_size: 4
|
30 |
+
micro_batch_size: 4
|
31 |
+
num_epochs: 2
|
32 |
optimizer: paged_adamw_32bit
|
33 |
torchdistx_path:
|
34 |
lr_scheduler: cosine
|
35 |
learning_rate: 0.0002
|
36 |
train_on_inputs: false
|
37 |
+
group_by_length: true
|
38 |
bf16: true
|
39 |
fp16: false
|
40 |
tf32: true
|