jssky commited on
Commit
d543de7
·
verified ·
1 Parent(s): 57353aa

Training in progress, step 6, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7706632fc7e44e229e7e2f785c58c45761976b78f2c3fdb166adb78aa1116031
3
  size 167832240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aa87b9c2e88a77fb9c0c732faa9bcf46ce35fea4844abd99554710c8e10420a8
3
  size 167832240
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dae31359390ebd44baeca72772348828cbb370f33737791b739de72f9d91a9c2
3
- size 2280
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a3c968a8a0504f0b1759f3919e2e97f2ead66cfcc2978117ff15163a15194db7
3
+ size 85723284
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6e0d2c38231e94b9ec25168267a3390e377c7e96b8c366407e5710cbc8c44d5d
3
  size 15984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4015cf50661106d4c867455d8fcb77ddec867e70f0f882bba91a3ca1ad588408
3
  size 15984
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6a314a5d18c765e4391952313db28bb66a33f4a6331471d415f71a3501c38a6c
3
  size 15984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:49fc59e53e240b3838dadf2af67159484079789c12a330a205e27c230ccee1c9
3
  size 15984
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:941015a43600f0029776dc6d9d56f1625fb007b61acaea790e2657d8592b44d5
3
  size 15984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:11722b6394ecb3833f200e9d6276276d305ce41580dceb70733998603948c9fc
3
  size 15984
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6047659e7e57219e01f2d0aec27643dc145b7deb70cbf9fd16ba27f1bbe17782
3
  size 15984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd64b1aeac101aad3ba6d07f9650b71a9fb5556ba4d6b15ea569bef72eb6f8a8
3
  size 15984
last-checkpoint/rng_state_4.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:96235b77ebcd46e5ea0dfbbaa3dd31608205a209d4a05cd49d1fadc6d43ae041
3
  size 15984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5d5ac429c02100c8ea139dc1bcd52228cac30b904cf2277e02640b844afb2bf8
3
  size 15984
last-checkpoint/rng_state_5.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f66d633de5f92f220598195851371ad9a060b558826c9694f93ce4324ed8cea5
3
  size 15984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fa0e4c1cc21bbb8ce749c794ec6e7606eb777967d6020afb33f90761e165cff8
3
  size 15984
last-checkpoint/rng_state_6.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4d90eb28075ce42b35f16f8a71090ab3f890d8eb5481fe805620601503e380ff
3
  size 15984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a5c2dab0c365a1d31bee5cff9b44deecc376511a9331204b441812b880c65e5
3
  size 15984
last-checkpoint/rng_state_7.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:783a581c253b79a52148bf899b22b99e854f8be7682acbec120e86e3921fa257
3
  size 15984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a9cad6b44df5f70ced5eafddb1c84bd1a3ffb87a9e3b79a3b70e4204f0ed6e8a
3
  size 15984
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:219c62af0a99d0a3db4c57e4189ef3b142499e30571ad5cc800b8b67c9ce1583
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ffd8c58e5d02492554dbaa495f8cf80dff41fabc0e1288cb2fd18a103d402219
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.024291497975708502,
5
  "eval_steps": 3,
6
- "global_step": 3,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -44,6 +44,35 @@
44
  "eval_samples_per_second": 33.665,
45
  "eval_steps_per_second": 4.208,
46
  "step": 3
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
47
  }
48
  ],
49
  "logging_steps": 1,
@@ -63,7 +92,7 @@
63
  "attributes": {}
64
  }
65
  },
66
- "total_flos": 1.7805294805450752e+16,
67
  "train_batch_size": 1,
68
  "trial_name": null,
69
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.048582995951417005,
5
  "eval_steps": 3,
6
+ "global_step": 6,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
44
  "eval_samples_per_second": 33.665,
45
  "eval_steps_per_second": 4.208,
46
  "step": 3
47
+ },
48
+ {
49
+ "epoch": 0.032388663967611336,
50
+ "grad_norm": 7.104294776916504,
51
+ "learning_rate": 2e-05,
52
+ "loss": 5.596,
53
+ "step": 4
54
+ },
55
+ {
56
+ "epoch": 0.04048582995951417,
57
+ "grad_norm": 7.289365291595459,
58
+ "learning_rate": 4e-05,
59
+ "loss": 5.7354,
60
+ "step": 5
61
+ },
62
+ {
63
+ "epoch": 0.048582995951417005,
64
+ "grad_norm": 7.546472549438477,
65
+ "learning_rate": 6e-05,
66
+ "loss": 5.2959,
67
+ "step": 6
68
+ },
69
+ {
70
+ "epoch": 0.048582995951417005,
71
+ "eval_loss": 4.9584832191467285,
72
+ "eval_runtime": 6.0022,
73
+ "eval_samples_per_second": 34.654,
74
+ "eval_steps_per_second": 4.332,
75
+ "step": 6
76
  }
77
  ],
78
  "logging_steps": 1,
 
92
  "attributes": {}
93
  }
94
  },
95
+ "total_flos": 3.5610589610901504e+16,
96
  "train_batch_size": 1,
97
  "trial_name": null,
98
  "trial_params": null