Femboyuwu2000 committed on
Commit
da24497
1 Parent(s): e44eff1

Training in progress, step 2840, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b10f7bc2c65141fa4ebded03f209c967b4ffb87e1cc778dfc9b4a86634ba57d6
3
  size 13982248
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:10ea9419bc897f8127b2a76b23cadb89107b0764e27a08a91562681dfb2de8a6
3
  size 13982248
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3615fe2b2b9addb6c497cc609999c34f4e448914d69744ff96b2430756df5daa
3
  size 7062522
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b1dd82c95168c3e2554246bf42378f05037dfc985cac616a5e4d4886c53dc3e7
3
  size 7062522
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:380a1cca63ce963571458aaefc36eab189734f962738f8e4fb44ec662db4894a
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d8de38d9f67df6f278483c5a632a2e9d174866bbdfabf05a223a9fdb149cbf2d
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ad9945089316ed307f5a98e36c0ec8641c94a4f12f863d3c953fe640032aaa7e
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5c37131dd33a265ba693e5db1412fd69c16e20dba1f6320386e84def93d115d7
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.2256,
5
  "eval_steps": 500,
6
- "global_step": 2820,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -994,6 +994,13 @@
994
  "learning_rate": 2.90410829484944e-05,
995
  "loss": 3.5148,
996
  "step": 2820
 
 
 
 
 
 
 
997
  }
998
  ],
999
  "logging_steps": 20,
@@ -1001,7 +1008,7 @@
1001
  "num_input_tokens_seen": 0,
1002
  "num_train_epochs": 2,
1003
  "save_steps": 20,
1004
- "total_flos": 6674198884024320.0,
1005
  "train_batch_size": 8,
1006
  "trial_name": null,
1007
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.2272,
5
  "eval_steps": 500,
6
+ "global_step": 2840,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
994
  "learning_rate": 2.90410829484944e-05,
995
  "loss": 3.5148,
996
  "step": 2820
997
+ },
998
+ {
999
+ "epoch": 0.23,
1000
+ "grad_norm": 34.077083587646484,
1001
+ "learning_rate": 2.902391803757764e-05,
1002
+ "loss": 3.5561,
1003
+ "step": 2840
1004
  }
1005
  ],
1006
  "logging_steps": 20,
 
1008
  "num_input_tokens_seen": 0,
1009
  "num_train_epochs": 2,
1010
  "save_steps": 20,
1011
+ "total_flos": 6720553638494208.0,
1012
  "train_batch_size": 8,
1013
  "trial_name": null,
1014
  "trial_params": null