Commit
•
ebabff2
1
Parent(s):
3e58079
End of training
Browse files
all_results.json
CHANGED
@@ -1,14 +1,14 @@
|
|
1 |
{
|
2 |
"epoch": 3.0,
|
3 |
"eval_loss": 18.79399871826172,
|
4 |
-
"eval_runtime":
|
5 |
"eval_samples": 2642,
|
6 |
-
"eval_samples_per_second": 2.
|
7 |
-
"eval_steps_per_second": 0.
|
8 |
"eval_wer": 1.0,
|
9 |
"train_loss": 5.609615023672491,
|
10 |
-
"train_runtime":
|
11 |
"train_samples": 28538,
|
12 |
-
"train_samples_per_second": 3.
|
13 |
-
"train_steps_per_second": 0.
|
14 |
}
|
|
|
1 |
{
|
2 |
"epoch": 3.0,
|
3 |
"eval_loss": 18.79399871826172,
|
4 |
+
"eval_runtime": 1047.771,
|
5 |
"eval_samples": 2642,
|
6 |
+
"eval_samples_per_second": 2.522,
|
7 |
+
"eval_steps_per_second": 0.316,
|
8 |
"eval_wer": 1.0,
|
9 |
"train_loss": 5.609615023672491,
|
10 |
+
"train_runtime": 24667.9377,
|
11 |
"train_samples": 28538,
|
12 |
+
"train_samples_per_second": 3.471,
|
13 |
+
"train_steps_per_second": 0.217
|
14 |
}
|
eval_results.json
CHANGED
@@ -1,9 +1,9 @@
|
|
1 |
{
|
2 |
"epoch": 3.0,
|
3 |
"eval_loss": 18.79399871826172,
|
4 |
-
"eval_runtime":
|
5 |
"eval_samples": 2642,
|
6 |
-
"eval_samples_per_second": 2.
|
7 |
-
"eval_steps_per_second": 0.
|
8 |
"eval_wer": 1.0
|
9 |
}
|
|
|
1 |
{
|
2 |
"epoch": 3.0,
|
3 |
"eval_loss": 18.79399871826172,
|
4 |
+
"eval_runtime": 1047.771,
|
5 |
"eval_samples": 2642,
|
6 |
+
"eval_samples_per_second": 2.522,
|
7 |
+
"eval_steps_per_second": 0.316,
|
8 |
"eval_wer": 1.0
|
9 |
}
|
runs/Feb21_17-57-39_sanchit--v100/events.out.tfevents.1645492095.sanchit--v100.90840.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f42088e23202217784c98094e222584ea0d3338f6c6bf0987d271ac2cc3db5da
|
3 |
+
size 358
|
train_results.json
CHANGED
@@ -1,8 +1,8 @@
|
|
1 |
{
|
2 |
"epoch": 3.0,
|
3 |
"train_loss": 5.609615023672491,
|
4 |
-
"train_runtime":
|
5 |
"train_samples": 28538,
|
6 |
-
"train_samples_per_second": 3.
|
7 |
-
"train_steps_per_second": 0.
|
8 |
}
|
|
|
1 |
{
|
2 |
"epoch": 3.0,
|
3 |
"train_loss": 5.609615023672491,
|
4 |
+
"train_runtime": 24667.9377,
|
5 |
"train_samples": 28538,
|
6 |
+
"train_samples_per_second": 3.471,
|
7 |
+
"train_steps_per_second": 0.217
|
8 |
}
|
trainer_state.json
CHANGED
@@ -3010,9 +3010,9 @@
|
|
3010 |
{
|
3011 |
"epoch": 0.28,
|
3012 |
"eval_loss": 9.04012393951416,
|
3013 |
-
"eval_runtime":
|
3014 |
-
"eval_samples_per_second": 3.
|
3015 |
-
"eval_steps_per_second": 0.
|
3016 |
"eval_wer": 1.0119595398651329,
|
3017 |
"step": 500
|
3018 |
},
|
@@ -6019,9 +6019,9 @@
|
|
6019 |
{
|
6020 |
"epoch": 0.56,
|
6021 |
"eval_loss": 9.319939613342285,
|
6022 |
-
"eval_runtime":
|
6023 |
-
"eval_samples_per_second": 3.
|
6024 |
-
"eval_steps_per_second": 0.
|
6025 |
"eval_wer": 1.0,
|
6026 |
"step": 1000
|
6027 |
},
|
@@ -9028,9 +9028,9 @@
|
|
9028 |
{
|
9029 |
"epoch": 0.84,
|
9030 |
"eval_loss": 8.443438529968262,
|
9031 |
-
"eval_runtime":
|
9032 |
-
"eval_samples_per_second": 3.
|
9033 |
-
"eval_steps_per_second": 0.
|
9034 |
"eval_wer": 1.4562673542245141,
|
9035 |
"step": 1500
|
9036 |
},
|
@@ -12037,9 +12037,9 @@
|
|
12037 |
{
|
12038 |
"epoch": 1.12,
|
12039 |
"eval_loss": 15.180464744567871,
|
12040 |
-
"eval_runtime":
|
12041 |
-
"eval_samples_per_second": 3.
|
12042 |
-
"eval_steps_per_second": 0.
|
12043 |
"eval_wer": 0.9999801666005553,
|
12044 |
"step": 2000
|
12045 |
},
|
@@ -15046,9 +15046,9 @@
|
|
15046 |
{
|
15047 |
"epoch": 1.4,
|
15048 |
"eval_loss": 15.79842472076416,
|
15049 |
-
"eval_runtime":
|
15050 |
-
"eval_samples_per_second": 3.
|
15051 |
-
"eval_steps_per_second": 0.
|
15052 |
"eval_wer": 1.0020825069416899,
|
15053 |
"step": 2500
|
15054 |
},
|
@@ -18055,9 +18055,9 @@
|
|
18055 |
{
|
18056 |
"epoch": 1.68,
|
18057 |
"eval_loss": 18.492834091186523,
|
18058 |
-
"eval_runtime":
|
18059 |
-
"eval_samples_per_second": 3.
|
18060 |
-
"eval_steps_per_second": 0.
|
18061 |
"eval_wer": 1.0,
|
18062 |
"step": 3000
|
18063 |
},
|
@@ -21064,9 +21064,9 @@
|
|
21064 |
{
|
21065 |
"epoch": 1.96,
|
21066 |
"eval_loss": 17.48856544494629,
|
21067 |
-
"eval_runtime":
|
21068 |
-
"eval_samples_per_second": 3.
|
21069 |
-
"eval_steps_per_second": 0.
|
21070 |
"eval_wer": 0.9999801666005553,
|
21071 |
"step": 3500
|
21072 |
},
|
@@ -24073,9 +24073,9 @@
|
|
24073 |
{
|
24074 |
"epoch": 2.24,
|
24075 |
"eval_loss": 18.945817947387695,
|
24076 |
-
"eval_runtime":
|
24077 |
-
"eval_samples_per_second":
|
24078 |
-
"eval_steps_per_second": 0.
|
24079 |
"eval_wer": 1.0,
|
24080 |
"step": 4000
|
24081 |
},
|
@@ -27082,9 +27082,9 @@
|
|
27082 |
{
|
27083 |
"epoch": 2.52,
|
27084 |
"eval_loss": 18.279401779174805,
|
27085 |
-
"eval_runtime":
|
27086 |
-
"eval_samples_per_second":
|
27087 |
-
"eval_steps_per_second": 0.
|
27088 |
"eval_wer": 1.0005553351844507,
|
27089 |
"step": 4500
|
27090 |
},
|
@@ -30091,9 +30091,9 @@
|
|
30091 |
{
|
30092 |
"epoch": 2.8,
|
30093 |
"eval_loss": 18.789825439453125,
|
30094 |
-
"eval_runtime":
|
30095 |
-
"eval_samples_per_second": 2.
|
30096 |
-
"eval_steps_per_second": 0.
|
30097 |
"eval_wer": 1.0,
|
30098 |
"step": 5000
|
30099 |
},
|
@@ -32214,9 +32214,9 @@
|
|
32214 |
"step": 5352,
|
32215 |
"total_flos": 0.0,
|
32216 |
"train_loss": 5.609615023672491,
|
32217 |
-
"train_runtime":
|
32218 |
-
"train_samples_per_second": 3.
|
32219 |
-
"train_steps_per_second": 0.
|
32220 |
}
|
32221 |
],
|
32222 |
"max_steps": 5352,
|
|
|
3010 |
{
|
3011 |
"epoch": 0.28,
|
3012 |
"eval_loss": 9.04012393951416,
|
3013 |
+
"eval_runtime": 872.8535,
|
3014 |
+
"eval_samples_per_second": 3.027,
|
3015 |
+
"eval_steps_per_second": 0.379,
|
3016 |
"eval_wer": 1.0119595398651329,
|
3017 |
"step": 500
|
3018 |
},
|
|
|
6019 |
{
|
6020 |
"epoch": 0.56,
|
6021 |
"eval_loss": 9.319939613342285,
|
6022 |
+
"eval_runtime": 873.1949,
|
6023 |
+
"eval_samples_per_second": 3.026,
|
6024 |
+
"eval_steps_per_second": 0.379,
|
6025 |
"eval_wer": 1.0,
|
6026 |
"step": 1000
|
6027 |
},
|
|
|
9028 |
{
|
9029 |
"epoch": 0.84,
|
9030 |
"eval_loss": 8.443438529968262,
|
9031 |
+
"eval_runtime": 873.0258,
|
9032 |
+
"eval_samples_per_second": 3.026,
|
9033 |
+
"eval_steps_per_second": 0.379,
|
9034 |
"eval_wer": 1.4562673542245141,
|
9035 |
"step": 1500
|
9036 |
},
|
|
|
12037 |
{
|
12038 |
"epoch": 1.12,
|
12039 |
"eval_loss": 15.180464744567871,
|
12040 |
+
"eval_runtime": 877.3652,
|
12041 |
+
"eval_samples_per_second": 3.011,
|
12042 |
+
"eval_steps_per_second": 0.377,
|
12043 |
"eval_wer": 0.9999801666005553,
|
12044 |
"step": 2000
|
12045 |
},
|
|
|
15046 |
{
|
15047 |
"epoch": 1.4,
|
15048 |
"eval_loss": 15.79842472076416,
|
15049 |
+
"eval_runtime": 879.1328,
|
15050 |
+
"eval_samples_per_second": 3.005,
|
15051 |
+
"eval_steps_per_second": 0.377,
|
15052 |
"eval_wer": 1.0020825069416899,
|
15053 |
"step": 2500
|
15054 |
},
|
|
|
18055 |
{
|
18056 |
"epoch": 1.68,
|
18057 |
"eval_loss": 18.492834091186523,
|
18058 |
+
"eval_runtime": 877.1195,
|
18059 |
+
"eval_samples_per_second": 3.012,
|
18060 |
+
"eval_steps_per_second": 0.377,
|
18061 |
"eval_wer": 1.0,
|
18062 |
"step": 3000
|
18063 |
},
|
|
|
21064 |
{
|
21065 |
"epoch": 1.96,
|
21066 |
"eval_loss": 17.48856544494629,
|
21067 |
+
"eval_runtime": 876.0525,
|
21068 |
+
"eval_samples_per_second": 3.016,
|
21069 |
+
"eval_steps_per_second": 0.378,
|
21070 |
"eval_wer": 0.9999801666005553,
|
21071 |
"step": 3500
|
21072 |
},
|
|
|
24073 |
{
|
24074 |
"epoch": 2.24,
|
24075 |
"eval_loss": 18.945817947387695,
|
24076 |
+
"eval_runtime": 874.0614,
|
24077 |
+
"eval_samples_per_second": 3.023,
|
24078 |
+
"eval_steps_per_second": 0.379,
|
24079 |
"eval_wer": 1.0,
|
24080 |
"step": 4000
|
24081 |
},
|
|
|
27082 |
{
|
27083 |
"epoch": 2.52,
|
27084 |
"eval_loss": 18.279401779174805,
|
27085 |
+
"eval_runtime": 876.9552,
|
27086 |
+
"eval_samples_per_second": 3.013,
|
27087 |
+
"eval_steps_per_second": 0.377,
|
27088 |
"eval_wer": 1.0005553351844507,
|
27089 |
"step": 4500
|
27090 |
},
|
|
|
30091 |
{
|
30092 |
"epoch": 2.8,
|
30093 |
"eval_loss": 18.789825439453125,
|
30094 |
+
"eval_runtime": 881.3583,
|
30095 |
+
"eval_samples_per_second": 2.998,
|
30096 |
+
"eval_steps_per_second": 0.376,
|
30097 |
"eval_wer": 1.0,
|
30098 |
"step": 5000
|
30099 |
},
|
|
|
32214 |
"step": 5352,
|
32215 |
"total_flos": 0.0,
|
32216 |
"train_loss": 5.609615023672491,
|
32217 |
+
"train_runtime": 24667.9377,
|
32218 |
+
"train_samples_per_second": 3.471,
|
32219 |
+
"train_steps_per_second": 0.217
|
32220 |
}
|
32221 |
],
|
32222 |
"max_steps": 5352,
|