Training in progress, epoch 1, checkpoint
Browse files- last-checkpoint/model-00001-of-00002.safetensors +1 -1
- last-checkpoint/model-00002-of-00002.safetensors +1 -1
- last-checkpoint/optimizer.pt +2 -2
- last-checkpoint/rng_state_0.pth +1 -1
- last-checkpoint/rng_state_1.pth +1 -1
- last-checkpoint/rng_state_2.pth +1 -1
- last-checkpoint/rng_state_3.pth +1 -1
- last-checkpoint/scheduler.pt +1 -1
- last-checkpoint/trainer_state.json +26 -28
- last-checkpoint/training_args.bin +1 -1
last-checkpoint/model-00001-of-00002.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4993448880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:af607956bb836bd30abffeab7e595a2ad7bcbbbdeda65c843e8bb6be5393c030
|
3 |
size 4993448880
|
last-checkpoint/model-00002-of-00002.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1180663192
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:68d963fb613c0fdebdca7001b1d4d7ff4cf7136e76fac49dc4c9993cff7b0f1b
|
3 |
size 1180663192
|
last-checkpoint/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:87608d67c06604df24518b25c089309e509a99209c77fbf6483710447e67e32c
|
3 |
+
size 3137574192
|
last-checkpoint/rng_state_0.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aeb3365cb23fc0ad7ef103f7e7c20c5f3cb4c39bbc3781411623d0ecc15fdec8
|
3 |
size 15024
|
last-checkpoint/rng_state_1.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b12deca4eebf12493c0f50cc78084223762e2e6f4349141d6e6d1e5efd0ae7b7
|
3 |
size 15024
|
last-checkpoint/rng_state_2.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bfb18fd20d740d864e7a6cec82e5cde8914525ecfd5545ced227f05f64807011
|
3 |
size 15024
|
last-checkpoint/rng_state_3.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:46f2bb6abf3eb51a791cbe95c0d4cdd70b37ff3bbb853fa053882b049478436f
|
3 |
size 15024
|
last-checkpoint/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1064
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d630d518d61962a1cef0800a6c56a709c5f2ad6682a72036d2bee9b4ec793c47
|
3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
@@ -1,41 +1,39 @@
|
|
1 |
{
|
2 |
-
"best_metric":
|
3 |
-
"best_model_checkpoint": "./models/rootflo/fauna-v3.2/checkpoint-
|
4 |
-
"epoch":
|
5 |
-
"eval_steps":
|
6 |
-
"global_step":
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
10 |
"log_history": [
|
11 |
{
|
12 |
-
"epoch":
|
13 |
-
"
|
14 |
-
"
|
15 |
-
"
|
16 |
-
"
|
17 |
-
"eval_wer": 85.91749644381224,
|
18 |
-
"step": 1
|
19 |
},
|
20 |
{
|
21 |
-
"epoch":
|
22 |
-
"grad_norm":
|
23 |
-
"learning_rate":
|
24 |
-
"loss": 0.
|
25 |
-
"step":
|
26 |
},
|
27 |
{
|
28 |
-
"epoch":
|
29 |
-
"eval_loss": 0.
|
30 |
-
"eval_runtime":
|
31 |
-
"eval_samples_per_second":
|
32 |
-
"eval_steps_per_second": 0.
|
33 |
-
"eval_wer":
|
34 |
-
"step":
|
35 |
}
|
36 |
],
|
37 |
-
"logging_steps":
|
38 |
-
"max_steps":
|
39 |
"num_input_tokens_seen": 0,
|
40 |
"num_train_epochs": 8,
|
41 |
"save_steps": 500,
|
@@ -46,7 +44,7 @@
|
|
46 |
"early_stopping_threshold": 0.01
|
47 |
},
|
48 |
"attributes": {
|
49 |
-
"early_stopping_patience_counter":
|
50 |
}
|
51 |
},
|
52 |
"TrainerControl": {
|
@@ -60,7 +58,7 @@
|
|
60 |
"attributes": {}
|
61 |
}
|
62 |
},
|
63 |
-
"total_flos":
|
64 |
"train_batch_size": 96,
|
65 |
"trial_name": null,
|
66 |
"trial_params": null
|
|
|
1 |
{
|
2 |
+
"best_metric": 108.55545060029843,
|
3 |
+
"best_model_checkpoint": "./models/rootflo/fauna-v3.2/checkpoint-460",
|
4 |
+
"epoch": 1.0,
|
5 |
+
"eval_steps": 500,
|
6 |
+
"global_step": 460,
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
10 |
"log_history": [
|
11 |
{
|
12 |
+
"epoch": 0.43478260869565216,
|
13 |
+
"grad_norm": 0.5209075808525085,
|
14 |
+
"learning_rate": 1.9919182516351267e-06,
|
15 |
+
"loss": 0.4607,
|
16 |
+
"step": 200
|
|
|
|
|
17 |
},
|
18 |
{
|
19 |
+
"epoch": 0.8695652173913043,
|
20 |
+
"grad_norm": 0.5061023235321045,
|
21 |
+
"learning_rate": 1.955244232925309e-06,
|
22 |
+
"loss": 0.2067,
|
23 |
+
"step": 400
|
24 |
},
|
25 |
{
|
26 |
+
"epoch": 1.0,
|
27 |
+
"eval_loss": 0.08908500522375107,
|
28 |
+
"eval_runtime": 28373.2469,
|
29 |
+
"eval_samples_per_second": 1.383,
|
30 |
+
"eval_steps_per_second": 0.004,
|
31 |
+
"eval_wer": 108.55545060029843,
|
32 |
+
"step": 460
|
33 |
}
|
34 |
],
|
35 |
+
"logging_steps": 200,
|
36 |
+
"max_steps": 3680,
|
37 |
"num_input_tokens_seen": 0,
|
38 |
"num_train_epochs": 8,
|
39 |
"save_steps": 500,
|
|
|
44 |
"early_stopping_threshold": 0.01
|
45 |
},
|
46 |
"attributes": {
|
47 |
+
"early_stopping_patience_counter": 0
|
48 |
}
|
49 |
},
|
50 |
"TrainerControl": {
|
|
|
58 |
"attributes": {}
|
59 |
}
|
60 |
},
|
61 |
+
"total_flos": 1.2002681817409278e+21,
|
62 |
"train_batch_size": 96,
|
63 |
"trial_name": null,
|
64 |
"trial_params": null
|
last-checkpoint/training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5432
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:91ac8723f36b532927f549ae9030c1cf0c332747e6f415dca7f60bb56fa5e0bb
|
3 |
size 5432
|