winglian committed on
Commit
3b18c96
·
unverified ·
1 Parent(s): 3fbde76

Set "auto" for the other params that the HF Trainer sets for DeepSpeed; include the ZeRO stage 1 JSON config (#570)

Browse files
deepspeed/zero1.json ADDED
@@ -0,0 +1,39 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "zero_optimization": {
3
+ "stage": 1,
4
+ "overlap_comm": true
5
+ },
6
+ "bf16": {
7
+ "enabled": "auto"
8
+ },
9
+ "fp16": {
10
+ "enabled": "auto",
11
+ "auto_cast": false,
12
+ "loss_scale": 0,
13
+ "initial_scale_power": 32,
14
+ "loss_scale_window": 1000,
15
+ "hysteresis": 2,
16
+ "min_loss_scale": 1
17
+ },
18
+ "optimizer": {
19
+ "type": "AdamW",
20
+ "params": {
21
+ "lr": "auto",
22
+ "betas": "auto",
23
+ "eps": "auto",
24
+ "weight_decay": "auto"
25
+ }
26
+ },
27
+ "scheduler": {
28
+ "type": "WarmupDecayLR",
29
+ "params": {
30
+ "warmup_min_lr": "auto",
31
+ "warmup_max_lr": "auto",
32
+ "warmup_num_steps": "auto",
33
+ "total_num_steps": "auto"
34
+ }
35
+ },
36
+ "train_batch_size": "auto",
37
+ "train_micro_batch_size_per_gpu": "auto",
38
+ "wall_clock_breakdown": false
39
+ }
deepspeed/zero2.json CHANGED
@@ -23,11 +23,8 @@
23
  "type": "AdamW",
24
  "params": {
25
  "lr": "auto",
26
- "betas": [
27
- 0.9,
28
- 0.999
29
- ],
30
- "eps": 1e-8,
31
  "weight_decay": "auto"
32
  }
33
  },
 
23
  "type": "AdamW",
24
  "params": {
25
  "lr": "auto",
26
+ "betas": "auto",
27
+ "eps": "auto",
 
 
 
28
  "weight_decay": "auto"
29
  }
30
  },
deepspeed/zero3.json CHANGED
@@ -36,7 +36,7 @@
36
  "params": {
37
  "lr": "auto",
38
  "betas": "auto",
39
- "eps": 1e-8,
40
  "weight_decay": "auto"
41
  }
42
  },
 
36
  "params": {
37
  "lr": "auto",
38
  "betas": "auto",
39
+ "eps": "auto",
40
  "weight_decay": "auto"
41
  }
42
  },