Update README.md
Browse files
README.md
CHANGED
@@ -98,7 +98,7 @@ lora_layers: 32
|
|
98 |
batch_size: 1
|
99 |
|
100 |
# Iterations to train for.
|
101 |
-
iters:
|
102 |
|
103 |
# Number of validation batches, -1 uses the entire validation set.
|
104 |
val_batches: 25
|
@@ -144,9 +144,9 @@ lora_parameters:
|
|
144 |
dropout: 0.05
|
145 |
|
146 |
# Schedule can only be specified in a config file, uncomment to use.
|
147 |
-
lr_schedule:
|
148 |
-
name: cosine_decay
|
149 |
-
warmup: 100 # 0 for no warmup
|
150 |
-
warmup_init: 1e-7 # 0 if not specified
|
151 |
-
arguments: [1e-6, 1000, 1e-7] # passed to scheduler
|
152 |
```
|
|
|
98 |
batch_size: 1
|
99 |
|
100 |
# Iterations to train for.
|
101 |
+
iters: 6000
|
102 |
|
103 |
# Number of validation batches, -1 uses the entire validation set.
|
104 |
val_batches: 25
|
|
|
144 |
dropout: 0.05
|
145 |
|
146 |
# Schedule can only be specified in a config file, uncomment to use.
|
147 |
+
#lr_schedule:
|
148 |
+
# name: cosine_decay
|
149 |
+
# warmup: 100 # 0 for no warmup
|
150 |
+
# warmup_init: 1e-7 # 0 if not specified
|
151 |
+
# arguments: [1e-6, 1000, 1e-7] # passed to scheduler
|
152 |
```
|