anamelchor
committed on
Commit
•
9257f02
1
Parent(s):
3f7a1c8
Training in progress, epoch 1
Browse files
- model.safetensors +1 -1
- run-1/checkpoint-428/model.safetensors +1 -1
- run-1/checkpoint-428/optimizer.pt +1 -1
- run-1/checkpoint-428/rng_state.pth +1 -1
- run-1/checkpoint-428/scheduler.pt +1 -1
- run-1/checkpoint-428/trainer_state.json +16 -16
- run-1/checkpoint-428/training_args.bin +1 -1
- run-2/checkpoint-54/model.safetensors +1 -1
- run-2/checkpoint-54/optimizer.pt +1 -1
- run-2/checkpoint-54/rng_state.pth +1 -1
- run-2/checkpoint-54/scheduler.pt +1 -1
- run-2/checkpoint-54/trainer_state.json +13 -22
- run-2/checkpoint-54/training_args.bin +1 -1
- runs/Feb28_18-10-00_5620ed9b2fff/events.out.tfevents.1709144639.5620ed9b2fff.209.4 +3 -0
- training_args.bin +1 -1
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 267832560
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:951f38e98d13e21dc75cc9bd9b2cdeaa5a6f08f0892623ca0324878e99204599
|
3 |
size 267832560
|
run-1/checkpoint-428/model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 267832560
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8220f206622c6f496381eba1d07bd6ca75d91e74d50afa7e44799ad9c5be7d7d
|
3 |
size 267832560
|
run-1/checkpoint-428/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 535727290
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4e02fdb1e8930d0fc3489386465b2180991e69247221cc87c1151b1dbd15512a
|
3 |
size 535727290
|
run-1/checkpoint-428/rng_state.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14244
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e87fe3c36d691ac6c42bca874c74ed014eefdbb6108564f8658fb9e5b9febc83
|
3 |
size 14244
|
run-1/checkpoint-428/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1064
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3c25e2e9cf1ce0cd951d12d306061617bdab3f567ca512f75957cae4f113da48
|
3 |
size 1064
|
run-1/checkpoint-428/trainer_state.json
CHANGED
@@ -1,5 +1,5 @@
|
|
1 |
{
|
2 |
-
"best_metric": 0.
|
3 |
"best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-1/checkpoint-428",
|
4 |
"epoch": 2.0,
|
5 |
"eval_steps": 500,
|
@@ -10,35 +10,35 @@
|
|
10 |
"log_history": [
|
11 |
{
|
12 |
"epoch": 1.0,
|
13 |
-
"eval_loss": 0.
|
14 |
-
"eval_matthews_correlation": 0.
|
15 |
-
"eval_runtime": 0.
|
16 |
-
"eval_samples_per_second":
|
17 |
-
"eval_steps_per_second":
|
18 |
"step": 214
|
19 |
},
|
20 |
{
|
21 |
"epoch": 2.0,
|
22 |
-
"eval_loss": 0.
|
23 |
-
"eval_matthews_correlation": 0.
|
24 |
-
"eval_runtime": 1.
|
25 |
-
"eval_samples_per_second":
|
26 |
-
"eval_steps_per_second":
|
27 |
"step": 428
|
28 |
}
|
29 |
],
|
30 |
"logging_steps": 500,
|
31 |
-
"max_steps":
|
32 |
"num_input_tokens_seen": 0,
|
33 |
-
"num_train_epochs":
|
34 |
"save_steps": 500,
|
35 |
"total_flos": 0,
|
36 |
"train_batch_size": 4,
|
37 |
"trial_name": null,
|
38 |
"trial_params": {
|
39 |
-
"learning_rate":
|
40 |
-
"num_train_epochs":
|
41 |
"per_device_train_batch_size": 4,
|
42 |
-
"seed":
|
43 |
}
|
44 |
}
|
|
|
1 |
{
|
2 |
+
"best_metric": 0.3005246361638528,
|
3 |
"best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-1/checkpoint-428",
|
4 |
"epoch": 2.0,
|
5 |
"eval_steps": 500,
|
|
|
10 |
"log_history": [
|
11 |
{
|
12 |
"epoch": 1.0,
|
13 |
+
"eval_loss": 0.6478912234306335,
|
14 |
+
"eval_matthews_correlation": 0.18118799119487816,
|
15 |
+
"eval_runtime": 0.7571,
|
16 |
+
"eval_samples_per_second": 1377.58,
|
17 |
+
"eval_steps_per_second": 87.172,
|
18 |
"step": 214
|
19 |
},
|
20 |
{
|
21 |
"epoch": 2.0,
|
22 |
+
"eval_loss": 0.9094101190567017,
|
23 |
+
"eval_matthews_correlation": 0.3005246361638528,
|
24 |
+
"eval_runtime": 1.0485,
|
25 |
+
"eval_samples_per_second": 994.768,
|
26 |
+
"eval_steps_per_second": 62.948,
|
27 |
"step": 428
|
28 |
}
|
29 |
],
|
30 |
"logging_steps": 500,
|
31 |
+
"max_steps": 428,
|
32 |
"num_input_tokens_seen": 0,
|
33 |
+
"num_train_epochs": 2,
|
34 |
"save_steps": 500,
|
35 |
"total_flos": 0,
|
36 |
"train_batch_size": 4,
|
37 |
"trial_name": null,
|
38 |
"trial_params": {
|
39 |
+
"learning_rate": 3.45845102664945e-05,
|
40 |
+
"num_train_epochs": 2,
|
41 |
"per_device_train_batch_size": 4,
|
42 |
+
"seed": 15
|
43 |
}
|
44 |
}
|
run-1/checkpoint-428/training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4984
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f8bfed4abe7904aebfa29146a26419ad532e218a199dc08365bb4ca5a35eafdb
|
3 |
size 4984
|
run-2/checkpoint-54/model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 267832560
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:951f38e98d13e21dc75cc9bd9b2cdeaa5a6f08f0892623ca0324878e99204599
|
3 |
size 267832560
|
run-2/checkpoint-54/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 535727290
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5740171fee8b11d2fbb61832c047c97d81240537dace9d499fca0fe4dddff88c
|
3 |
size 535727290
|
run-2/checkpoint-54/rng_state.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14244
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:df090108457d96817be2199667108a02455609ad929d99fa814d2ee7bd50d185
|
3 |
size 14244
|
run-2/checkpoint-54/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1064
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:303844bf75ccfc607f59353a7880410a50503f4e94b34d2f10013216f0e88a2a
|
3 |
size 1064
|
run-2/checkpoint-54/trainer_state.json
CHANGED
@@ -1,7 +1,7 @@
|
|
1 |
{
|
2 |
-
"best_metric": 0.
|
3 |
"best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-2/checkpoint-54",
|
4 |
-
"epoch":
|
5 |
"eval_steps": 500,
|
6 |
"global_step": 54,
|
7 |
"is_hyper_param_search": true,
|
@@ -10,35 +10,26 @@
|
|
10 |
"log_history": [
|
11 |
{
|
12 |
"epoch": 1.0,
|
13 |
-
"eval_loss": 0.
|
14 |
"eval_matthews_correlation": 0.0,
|
15 |
-
"eval_runtime": 0.
|
16 |
-
"eval_samples_per_second":
|
17 |
-
"eval_steps_per_second":
|
18 |
-
"step": 27
|
19 |
-
},
|
20 |
-
{
|
21 |
-
"epoch": 2.0,
|
22 |
-
"eval_loss": 0.5790226459503174,
|
23 |
-
"eval_matthews_correlation": 0.2712686505720511,
|
24 |
-
"eval_runtime": 0.7744,
|
25 |
-
"eval_samples_per_second": 1346.766,
|
26 |
-
"eval_steps_per_second": 85.222,
|
27 |
"step": 54
|
28 |
}
|
29 |
],
|
30 |
"logging_steps": 500,
|
31 |
-
"max_steps":
|
32 |
"num_input_tokens_seen": 0,
|
33 |
-
"num_train_epochs":
|
34 |
"save_steps": 500,
|
35 |
"total_flos": 0,
|
36 |
-
"train_batch_size":
|
37 |
"trial_name": null,
|
38 |
"trial_params": {
|
39 |
-
"learning_rate":
|
40 |
-
"num_train_epochs":
|
41 |
-
"per_device_train_batch_size":
|
42 |
-
"seed":
|
43 |
}
|
44 |
}
|
|
|
1 |
{
|
2 |
+
"best_metric": 0.0,
|
3 |
"best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-2/checkpoint-54",
|
4 |
+
"epoch": 1.0,
|
5 |
"eval_steps": 500,
|
6 |
"global_step": 54,
|
7 |
"is_hyper_param_search": true,
|
|
|
10 |
"log_history": [
|
11 |
{
|
12 |
"epoch": 1.0,
|
13 |
+
"eval_loss": 0.5896052122116089,
|
14 |
"eval_matthews_correlation": 0.0,
|
15 |
+
"eval_runtime": 0.7382,
|
16 |
+
"eval_samples_per_second": 1412.91,
|
17 |
+
"eval_steps_per_second": 89.408,
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
18 |
"step": 54
|
19 |
}
|
20 |
],
|
21 |
"logging_steps": 500,
|
22 |
+
"max_steps": 162,
|
23 |
"num_input_tokens_seen": 0,
|
24 |
+
"num_train_epochs": 3,
|
25 |
"save_steps": 500,
|
26 |
"total_flos": 0,
|
27 |
+
"train_batch_size": 16,
|
28 |
"trial_name": null,
|
29 |
"trial_params": {
|
30 |
+
"learning_rate": 4.44263313595678e-05,
|
31 |
+
"num_train_epochs": 3,
|
32 |
+
"per_device_train_batch_size": 16,
|
33 |
+
"seed": 36
|
34 |
}
|
35 |
}
|
run-2/checkpoint-54/training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4984
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:64b88362824c828734d46d9219cae04a83c937724d8224d58b37d769b6b5a4e8
|
3 |
size 4984
|
runs/Feb28_18-10-00_5620ed9b2fff/events.out.tfevents.1709144639.5620ed9b2fff.209.4
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aab91ac1e0a164f942e98bb69c1148a4711749f1e19200cf9e8d0d19bf3edfcc
|
3 |
+
size 5888
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4984
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:64b88362824c828734d46d9219cae04a83c937724d8224d58b37d769b6b5a4e8
|
3 |
size 4984
|