End of training
Browse files
all_results.json
CHANGED
@@ -1,12 +1,12 @@
|
|
1 |
{
|
2 |
"epoch": 624.0,
|
3 |
"eval_loss": 0.9921010732650757,
|
4 |
-
"eval_runtime":
|
5 |
-
"eval_samples_per_second": 9.
|
6 |
-
"eval_steps_per_second": 0.
|
7 |
"eval_wer": 34.21715788320368,
|
8 |
"train_loss": 0.02765977076081908,
|
9 |
-
"train_runtime":
|
10 |
-
"train_samples_per_second": 12.
|
11 |
"train_steps_per_second": 0.191
|
12 |
}
|
|
|
1 |
{
|
2 |
"epoch": 624.0,
|
3 |
"eval_loss": 0.9921010732650757,
|
4 |
+
"eval_runtime": 135.7332,
|
5 |
+
"eval_samples_per_second": 9.113,
|
6 |
+
"eval_steps_per_second": 0.287,
|
7 |
"eval_wer": 34.21715788320368,
|
8 |
"train_loss": 0.02765977076081908,
|
9 |
+
"train_runtime": 26145.1461,
|
10 |
+
"train_samples_per_second": 12.239,
|
11 |
"train_steps_per_second": 0.191
|
12 |
}
|
eval_results.json
CHANGED
@@ -1,8 +1,8 @@
|
|
1 |
{
|
2 |
"epoch": 624.0,
|
3 |
"eval_loss": 0.9921010732650757,
|
4 |
-
"eval_runtime":
|
5 |
-
"eval_samples_per_second": 9.
|
6 |
-
"eval_steps_per_second": 0.
|
7 |
"eval_wer": 34.21715788320368
|
8 |
}
|
|
|
1 |
{
|
2 |
"epoch": 624.0,
|
3 |
"eval_loss": 0.9921010732650757,
|
4 |
+
"eval_runtime": 135.7332,
|
5 |
+
"eval_samples_per_second": 9.113,
|
6 |
+
"eval_steps_per_second": 0.287,
|
7 |
"eval_wer": 34.21715788320368
|
8 |
}
|
runs/Dec05_00-34-16_spartan-gpgpu111.hpc.unimelb.edu.au/events.out.tfevents.1670187201.spartan-gpgpu111.hpc.unimelb.edu.au
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:433f5889c525703f31ef1069f851311928d9ad29a52f11d06b4d80a637ac2f58
|
3 |
+
size 40
|
train_results.json
CHANGED
@@ -1,7 +1,7 @@
|
|
1 |
{
|
2 |
"epoch": 624.0,
|
3 |
"train_loss": 0.02765977076081908,
|
4 |
-
"train_runtime":
|
5 |
-
"train_samples_per_second": 12.
|
6 |
"train_steps_per_second": 0.191
|
7 |
}
|
|
|
1 |
{
|
2 |
"epoch": 624.0,
|
3 |
"train_loss": 0.02765977076081908,
|
4 |
+
"train_runtime": 26145.1461,
|
5 |
+
"train_samples_per_second": 12.239,
|
6 |
"train_steps_per_second": 0.191
|
7 |
}
|
trainer_state.json
CHANGED
@@ -250,9 +250,9 @@
|
|
250 |
{
|
251 |
"epoch": 124.0,
|
252 |
"eval_loss": 0.7998368740081787,
|
253 |
-
"eval_runtime":
|
254 |
-
"eval_samples_per_second": 9.
|
255 |
-
"eval_steps_per_second": 0.
|
256 |
"eval_wer": 21.770570833789854,
|
257 |
"step": 1000
|
258 |
},
|
@@ -499,8 +499,8 @@
|
|
499 |
{
|
500 |
"epoch": 249.0,
|
501 |
"eval_loss": 0.8832917213439941,
|
502 |
-
"eval_runtime": 131.
|
503 |
-
"eval_samples_per_second": 9.
|
504 |
"eval_steps_per_second": 0.296,
|
505 |
"eval_wer": 28.968993097403313,
|
506 |
"step": 2000
|
@@ -748,9 +748,9 @@
|
|
748 |
{
|
749 |
"epoch": 374.0,
|
750 |
"eval_loss": 0.9381842613220215,
|
751 |
-
"eval_runtime":
|
752 |
-
"eval_samples_per_second": 9.
|
753 |
-
"eval_steps_per_second": 0.
|
754 |
"eval_wer": 30.820642051057302,
|
755 |
"step": 3000
|
756 |
},
|
@@ -997,9 +997,9 @@
|
|
997 |
{
|
998 |
"epoch": 499.0,
|
999 |
"eval_loss": 0.9754325151443481,
|
1000 |
-
"eval_runtime": 133.
|
1001 |
-
"eval_samples_per_second": 9.
|
1002 |
-
"eval_steps_per_second": 0.
|
1003 |
"eval_wer": 34.436287936890544,
|
1004 |
"step": 4000
|
1005 |
},
|
@@ -1246,9 +1246,9 @@
|
|
1246 |
{
|
1247 |
"epoch": 624.0,
|
1248 |
"eval_loss": 0.9921010732650757,
|
1249 |
-
"eval_runtime":
|
1250 |
-
"eval_samples_per_second": 9.
|
1251 |
-
"eval_steps_per_second": 0.
|
1252 |
"eval_wer": 34.21715788320368,
|
1253 |
"step": 5000
|
1254 |
},
|
@@ -1257,8 +1257,8 @@
|
|
1257 |
"step": 5000,
|
1258 |
"total_flos": 8.94614740992e+19,
|
1259 |
"train_loss": 0.02765977076081908,
|
1260 |
-
"train_runtime":
|
1261 |
-
"train_samples_per_second": 12.
|
1262 |
"train_steps_per_second": 0.191
|
1263 |
}
|
1264 |
],
|
|
|
250 |
{
|
251 |
"epoch": 124.0,
|
252 |
"eval_loss": 0.7998368740081787,
|
253 |
+
"eval_runtime": 130.4981,
|
254 |
+
"eval_samples_per_second": 9.479,
|
255 |
+
"eval_steps_per_second": 0.299,
|
256 |
"eval_wer": 21.770570833789854,
|
257 |
"step": 1000
|
258 |
},
|
|
|
499 |
{
|
500 |
"epoch": 249.0,
|
501 |
"eval_loss": 0.8832917213439941,
|
502 |
+
"eval_runtime": 131.7792,
|
503 |
+
"eval_samples_per_second": 9.387,
|
504 |
"eval_steps_per_second": 0.296,
|
505 |
"eval_wer": 28.968993097403313,
|
506 |
"step": 2000
|
|
|
748 |
{
|
749 |
"epoch": 374.0,
|
750 |
"eval_loss": 0.9381842613220215,
|
751 |
+
"eval_runtime": 133.2813,
|
752 |
+
"eval_samples_per_second": 9.281,
|
753 |
+
"eval_steps_per_second": 0.293,
|
754 |
"eval_wer": 30.820642051057302,
|
755 |
"step": 3000
|
756 |
},
|
|
|
997 |
{
|
998 |
"epoch": 499.0,
|
999 |
"eval_loss": 0.9754325151443481,
|
1000 |
+
"eval_runtime": 133.3867,
|
1001 |
+
"eval_samples_per_second": 9.274,
|
1002 |
+
"eval_steps_per_second": 0.292,
|
1003 |
"eval_wer": 34.436287936890544,
|
1004 |
"step": 4000
|
1005 |
},
|
|
|
1246 |
{
|
1247 |
"epoch": 624.0,
|
1248 |
"eval_loss": 0.9921010732650757,
|
1249 |
+
"eval_runtime": 136.0036,
|
1250 |
+
"eval_samples_per_second": 9.095,
|
1251 |
+
"eval_steps_per_second": 0.287,
|
1252 |
"eval_wer": 34.21715788320368,
|
1253 |
"step": 5000
|
1254 |
},
|
|
|
1257 |
"step": 5000,
|
1258 |
"total_flos": 8.94614740992e+19,
|
1259 |
"train_loss": 0.02765977076081908,
|
1260 |
+
"train_runtime": 26145.1461,
|
1261 |
+
"train_samples_per_second": 12.239,
|
1262 |
"train_steps_per_second": 0.191
|
1263 |
}
|
1264 |
],
|