kbberendsen commited on
Commit
821263a
·
verified ·
1 Parent(s): 6694ba8

Training in progress, epoch 1

Browse files
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:362787337e763ae671c0d6f586075e16ed1ee0b7814d9f4a66bd9c573b910b06
3
  size 1740304440
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:db25cee7efaa01864d9a77a4f74d0c9d2326018ba142cbe1a036d5a07c453429
3
  size 1740304440
run-0/checkpoint-54/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:03fb2b2a9d576350e998ab84c9a0a5dbecbb7ac701c4afedac1c2dd2cd08c867
3
  size 1740304440
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:db25cee7efaa01864d9a77a4f74d0c9d2326018ba142cbe1a036d5a07c453429
3
  size 1740304440
run-0/checkpoint-54/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a2f34d72897c7fd7ffa4e2abc269d4f6eb9ad8c5c1616901f497cdcb85ac7653
3
  size 3480840240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f5b3b6ade9c56e825e668910d5ab939bc488a51bdabc63d4539a124f9083b4a
3
  size 3480840240
run-0/checkpoint-54/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:648b2400f4e4973b94aea633be1462ef78f024c0982d2f0c48011013c10a7392
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:72a45d58deab7b40d9aeb8b53350029d22a9ff60fdf1c1b2e911c09dd065d85c
3
  size 14244
run-0/checkpoint-54/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7cdbb884730829f1bb86d31f66987468d71aa581c0d6f57ffbb087f18e098aef
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:24ba1810c98b8defe45bf5ba34ee6195e35b1ba63433d1bef77b9c14523c344f
3
  size 1064
run-0/checkpoint-54/trainer_state.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "best_metric": 0.0,
3
  "best_model_checkpoint": "deberta-v3-large-finetuned-cola-midterm/run-0/checkpoint-54",
4
  "epoch": 1.0,
5
  "eval_steps": 500,
@@ -10,26 +10,26 @@
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
- "eval_loss": 0.748440146446228,
14
- "eval_matthews_correlation": 0.0,
15
- "eval_runtime": 7.8276,
16
- "eval_samples_per_second": 133.246,
17
- "eval_steps_per_second": 8.432,
18
  "step": 54
19
  }
20
  ],
21
  "logging_steps": 500,
22
- "max_steps": 54,
23
  "num_input_tokens_seen": 0,
24
- "num_train_epochs": 1,
25
  "save_steps": 500,
26
  "total_flos": 0,
27
- "train_batch_size": 16,
28
  "trial_name": null,
29
  "trial_params": {
30
- "learning_rate": 1.1781421569396437e-06,
31
- "num_train_epochs": 1,
32
- "per_device_train_batch_size": 16,
33
- "seed": 36
34
  }
35
  }
 
1
  {
2
+ "best_metric": 0.4307702429617212,
3
  "best_model_checkpoint": "deberta-v3-large-finetuned-cola-midterm/run-0/checkpoint-54",
4
  "epoch": 1.0,
5
  "eval_steps": 500,
 
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
+ "eval_loss": 0.6075441837310791,
14
+ "eval_matthews_correlation": 0.4307702429617212,
15
+ "eval_runtime": 3.4416,
16
+ "eval_samples_per_second": 303.053,
17
+ "eval_steps_per_second": 19.177,
18
  "step": 54
19
  }
20
  ],
21
  "logging_steps": 500,
22
+ "max_steps": 216,
23
  "num_input_tokens_seen": 0,
24
+ "num_train_epochs": 4,
25
  "save_steps": 500,
26
  "total_flos": 0,
27
+ "train_batch_size": 8,
28
  "trial_name": null,
29
  "trial_params": {
30
+ "learning_rate": 2.0352764481854907e-05,
31
+ "num_train_epochs": 4,
32
+ "per_device_train_batch_size": 8,
33
+ "seed": 4
34
  }
35
  }
run-0/checkpoint-54/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bff223a0f00786a825df06c5c10b8ee13c387ff40002327815eb037bc53607a2
3
  size 4984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:809a0430adc83b27e312907f1dee6ad0edefa61c1f8ccdf999f9172f36110b1e
3
  size 4984
runs/Feb29_12-44-12_8e30624cc7d3/events.out.tfevents.1709210924.8e30624cc7d3.205.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7b5b3e768e937b36a7480373fbf66527dd19f42e3d2d0b514d4422a34bcc0348
3
+ size 5466
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b511e0093eff2e18a9a8913c53e4c6377789256044eb610b864499c14d17e4f5
3
  size 4984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:809a0430adc83b27e312907f1dee6ad0edefa61c1f8ccdf999f9172f36110b1e
3
  size 4984