anamelchor committed on
Commit
9257f02
1 Parent(s): 3f7a1c8

Training in progress, epoch 1

Browse files
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c045372f29e6a3f37f3f88e140fc38258f54572ecc9ac94f101c483b9cc8c37a
3
  size 267832560
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:951f38e98d13e21dc75cc9bd9b2cdeaa5a6f08f0892623ca0324878e99204599
3
  size 267832560
run-1/checkpoint-428/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7f5e5e12cac969229af19d5cc7e20d9dd28b58d83480d2f3f341a4edb226f21e
3
  size 267832560
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8220f206622c6f496381eba1d07bd6ca75d91e74d50afa7e44799ad9c5be7d7d
3
  size 267832560
run-1/checkpoint-428/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:eadb1fadb61f6a7641544ddbe29956168ba4da83b036b9363f9861969ced5ba0
3
  size 535727290
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4e02fdb1e8930d0fc3489386465b2180991e69247221cc87c1151b1dbd15512a
3
  size 535727290
run-1/checkpoint-428/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cd01b2476b9fd2a1c227088b0c96b8416829b65b2617d2ef2215b5bf1d325ff4
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e87fe3c36d691ac6c42bca874c74ed014eefdbb6108564f8658fb9e5b9febc83
3
  size 14244
run-1/checkpoint-428/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5d27394d0580c0938e9e973527b4d373c693291de7929426d26b8c19e9b62200
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3c25e2e9cf1ce0cd951d12d306061617bdab3f567ca512f75957cae4f113da48
3
  size 1064
run-1/checkpoint-428/trainer_state.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "best_metric": 0.3432921557472473,
3
  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-1/checkpoint-428",
4
  "epoch": 2.0,
5
  "eval_steps": 500,
@@ -10,35 +10,35 @@
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
- "eval_loss": 0.5924310088157654,
14
- "eval_matthews_correlation": 0.06558874629318973,
15
- "eval_runtime": 0.7705,
16
- "eval_samples_per_second": 1353.67,
17
- "eval_steps_per_second": 85.659,
18
  "step": 214
19
  },
20
  {
21
  "epoch": 2.0,
22
- "eval_loss": 0.5929568409919739,
23
- "eval_matthews_correlation": 0.3432921557472473,
24
- "eval_runtime": 1.2272,
25
- "eval_samples_per_second": 849.906,
26
- "eval_steps_per_second": 53.781,
27
  "step": 428
28
  }
29
  ],
30
  "logging_steps": 500,
31
- "max_steps": 856,
32
  "num_input_tokens_seen": 0,
33
- "num_train_epochs": 4,
34
  "save_steps": 500,
35
  "total_flos": 0,
36
  "train_batch_size": 4,
37
  "trial_name": null,
38
  "trial_params": {
39
- "learning_rate": 1.674218791607766e-05,
40
- "num_train_epochs": 4,
41
  "per_device_train_batch_size": 4,
42
- "seed": 16
43
  }
44
  }
 
1
  {
2
+ "best_metric": 0.3005246361638528,
3
  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-1/checkpoint-428",
4
  "epoch": 2.0,
5
  "eval_steps": 500,
 
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
+ "eval_loss": 0.6478912234306335,
14
+ "eval_matthews_correlation": 0.18118799119487816,
15
+ "eval_runtime": 0.7571,
16
+ "eval_samples_per_second": 1377.58,
17
+ "eval_steps_per_second": 87.172,
18
  "step": 214
19
  },
20
  {
21
  "epoch": 2.0,
22
+ "eval_loss": 0.9094101190567017,
23
+ "eval_matthews_correlation": 0.3005246361638528,
24
+ "eval_runtime": 1.0485,
25
+ "eval_samples_per_second": 994.768,
26
+ "eval_steps_per_second": 62.948,
27
  "step": 428
28
  }
29
  ],
30
  "logging_steps": 500,
31
+ "max_steps": 428,
32
  "num_input_tokens_seen": 0,
33
+ "num_train_epochs": 2,
34
  "save_steps": 500,
35
  "total_flos": 0,
36
  "train_batch_size": 4,
37
  "trial_name": null,
38
  "trial_params": {
39
+ "learning_rate": 3.45845102664945e-05,
40
+ "num_train_epochs": 2,
41
  "per_device_train_batch_size": 4,
42
+ "seed": 15
43
  }
44
  }
run-1/checkpoint-428/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:36613bcef60bcf7fd2c5bce911434f81154fc143b65a8b57de2003769014ca00
3
  size 4984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f8bfed4abe7904aebfa29146a26419ad532e218a199dc08365bb4ca5a35eafdb
3
  size 4984
run-2/checkpoint-54/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fa0fee7546ff58c6ec3390bde5cecd927681e055eef69980256766b8e949510b
3
  size 267832560
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:951f38e98d13e21dc75cc9bd9b2cdeaa5a6f08f0892623ca0324878e99204599
3
  size 267832560
run-2/checkpoint-54/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:79f7f242c330bc7344d80b82b5a5744020478114d6b0ddd5297974b2c9489275
3
  size 535727290
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5740171fee8b11d2fbb61832c047c97d81240537dace9d499fca0fe4dddff88c
3
  size 535727290
run-2/checkpoint-54/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:56e134a945a8c09dbe3c3e74ec36d9a17c0f35f9759b7fc9e96fefe249cf37f0
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:df090108457d96817be2199667108a02455609ad929d99fa814d2ee7bd50d185
3
  size 14244
run-2/checkpoint-54/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9afcab2bcd613780244f936803a32ad4b09ef30bad1a438d264ad9700e3668e0
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:303844bf75ccfc607f59353a7880410a50503f4e94b34d2f10013216f0e88a2a
3
  size 1064
run-2/checkpoint-54/trainer_state.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
- "best_metric": 0.2712686505720511,
3
  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-2/checkpoint-54",
4
- "epoch": 2.0,
5
  "eval_steps": 500,
6
  "global_step": 54,
7
  "is_hyper_param_search": true,
@@ -10,35 +10,26 @@
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
- "eval_loss": 0.5924028158187866,
14
  "eval_matthews_correlation": 0.0,
15
- "eval_runtime": 0.7139,
16
- "eval_samples_per_second": 1460.954,
17
- "eval_steps_per_second": 92.448,
18
- "step": 27
19
- },
20
- {
21
- "epoch": 2.0,
22
- "eval_loss": 0.5790226459503174,
23
- "eval_matthews_correlation": 0.2712686505720511,
24
- "eval_runtime": 0.7744,
25
- "eval_samples_per_second": 1346.766,
26
- "eval_steps_per_second": 85.222,
27
  "step": 54
28
  }
29
  ],
30
  "logging_steps": 500,
31
- "max_steps": 135,
32
  "num_input_tokens_seen": 0,
33
- "num_train_epochs": 5,
34
  "save_steps": 500,
35
  "total_flos": 0,
36
- "train_batch_size": 32,
37
  "trial_name": null,
38
  "trial_params": {
39
- "learning_rate": 3.196781434256157e-05,
40
- "num_train_epochs": 5,
41
- "per_device_train_batch_size": 32,
42
- "seed": 15
43
  }
44
  }
 
1
  {
2
+ "best_metric": 0.0,
3
  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-2/checkpoint-54",
4
+ "epoch": 1.0,
5
  "eval_steps": 500,
6
  "global_step": 54,
7
  "is_hyper_param_search": true,
 
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
+ "eval_loss": 0.5896052122116089,
14
  "eval_matthews_correlation": 0.0,
15
+ "eval_runtime": 0.7382,
16
+ "eval_samples_per_second": 1412.91,
17
+ "eval_steps_per_second": 89.408,
 
 
 
 
 
 
 
 
 
18
  "step": 54
19
  }
20
  ],
21
  "logging_steps": 500,
22
+ "max_steps": 162,
23
  "num_input_tokens_seen": 0,
24
+ "num_train_epochs": 3,
25
  "save_steps": 500,
26
  "total_flos": 0,
27
+ "train_batch_size": 16,
28
  "trial_name": null,
29
  "trial_params": {
30
+ "learning_rate": 4.44263313595678e-05,
31
+ "num_train_epochs": 3,
32
+ "per_device_train_batch_size": 16,
33
+ "seed": 36
34
  }
35
  }
run-2/checkpoint-54/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:69153e9bbab207ff12f995d64fcbc179aebf9c056495013eeb831a9bd3f09fb4
3
  size 4984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:64b88362824c828734d46d9219cae04a83c937724d8224d58b37d769b6b5a4e8
3
  size 4984
runs/Feb28_18-10-00_5620ed9b2fff/events.out.tfevents.1709144639.5620ed9b2fff.209.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aab91ac1e0a164f942e98bb69c1148a4711749f1e19200cf9e8d0d19bf3edfcc
3
+ size 5888
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f8bfed4abe7904aebfa29146a26419ad532e218a199dc08365bb4ca5a35eafdb
3
  size 4984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:64b88362824c828734d46d9219cae04a83c937724d8224d58b37d769b6b5a4e8
3
  size 4984