kooff11 committed on
Commit
ca6dc1e
·
verified ·
1 Parent(s): 84ec487

Training in progress, step 14, checkpoint

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:332cf6808556d7a494ce2f0aa34b22d4c16c9bc4e8c4834a3f8870bf2f34c47b
3
  size 82460660
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f9bafac06c2c177b6873285cba9faa63a0aad0c7fde76726cc9c9ef561423470
3
  size 82460660
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4ecefe9cb2134c36ac32f344736764510c8f969de1bcd9fdaedb31d523c78438
3
  size 14512
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:297e7ddbc295a07cecddf760a69f80e7807fb90e55e9ae40a8c01ff1aacc7519
3
  size 14512
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:373892a68dd4fdd748ed14777df992f68b324bb9261684875ca84ff9c7bd0fb1
3
  size 14512
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b3fa8e33d36e4355c9c88316639a14b52060c5a44fe868e2fd61ab111f6ed180
3
  size 14512
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e096882cd5f2725064920833a5d82c69883609bddf4126e13e653e290fdb396a
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f1660560e734c40e5470cca2d00d4f738c021882bc0c1304da944a20144bee2
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.25925925925925924,
5
  "eval_steps": 7,
6
- "global_step": 7,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -72,6 +72,63 @@
72
  "eval_samples_per_second": 10.063,
73
  "eval_steps_per_second": 2.543,
74
  "step": 7
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
75
  }
76
  ],
77
  "logging_steps": 1,
@@ -91,7 +148,7 @@
91
  "attributes": {}
92
  }
93
  },
94
- "total_flos": 1.5658466354711757e+17,
95
  "train_batch_size": 2,
96
  "trial_name": null,
97
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.5185185185185185,
5
  "eval_steps": 7,
6
+ "global_step": 14,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
72
  "eval_samples_per_second": 10.063,
73
  "eval_steps_per_second": 2.543,
74
  "step": 7
75
+ },
76
+ {
77
+ "epoch": 0.2962962962962963,
78
+ "grad_norm": NaN,
79
+ "learning_rate": 8.644843137107059e-05,
80
+ "loss": 0.0,
81
+ "step": 8
82
+ },
83
+ {
84
+ "epoch": 0.3333333333333333,
85
+ "grad_norm": NaN,
86
+ "learning_rate": 8.18711994874345e-05,
87
+ "loss": 0.0,
88
+ "step": 9
89
+ },
90
+ {
91
+ "epoch": 0.37037037037037035,
92
+ "grad_norm": NaN,
93
+ "learning_rate": 7.679133974894983e-05,
94
+ "loss": 0.0,
95
+ "step": 10
96
+ },
97
+ {
98
+ "epoch": 0.4074074074074074,
99
+ "grad_norm": NaN,
100
+ "learning_rate": 7.128896457825364e-05,
101
+ "loss": 0.0,
102
+ "step": 11
103
+ },
104
+ {
105
+ "epoch": 0.4444444444444444,
106
+ "grad_norm": NaN,
107
+ "learning_rate": 6.545084971874738e-05,
108
+ "loss": 0.0,
109
+ "step": 12
110
+ },
111
+ {
112
+ "epoch": 0.48148148148148145,
113
+ "grad_norm": NaN,
114
+ "learning_rate": 5.9369065729286245e-05,
115
+ "loss": 0.0,
116
+ "step": 13
117
+ },
118
+ {
119
+ "epoch": 0.5185185185185185,
120
+ "grad_norm": NaN,
121
+ "learning_rate": 5.313952597646568e-05,
122
+ "loss": 0.0,
123
+ "step": 14
124
+ },
125
+ {
126
+ "epoch": 0.5185185185185185,
127
+ "eval_loss": NaN,
128
+ "eval_runtime": 18.089,
129
+ "eval_samples_per_second": 10.061,
130
+ "eval_steps_per_second": 2.543,
131
+ "step": 14
132
  }
133
  ],
134
  "logging_steps": 1,
 
148
  "attributes": {}
149
  }
150
  },
151
+ "total_flos": 3.1316932709423514e+17,
152
  "train_batch_size": 2,
153
  "trial_name": null,
154
  "trial_params": null