tuanna08go commited on
Commit
b64e247
·
verified ·
1 Parent(s): ed88831

Training in progress, step 9, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:646c144b477247a281155c00d73edf80cbc92114df821385ec9f8d51dd3c9a4c
3
  size 83945296
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5a0e0d237c6db689e95798e50eb592055c24c6df12f3f33823d0758034cd63a0
3
  size 83945296
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:369940c5a3787d59062c2769c230bdde483fa743398ba2e4d8f66ee03cdb349e
3
  size 43122580
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dae60cbcfb9d977a3d925b3cab6ee9727c881308677c1fea0fee72e316d3c399
3
  size 43122580
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bf3a48248233b81e3f746e3d9f557dd750b90f8b04de7b95486ad9ac9a4f03ff
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f00db97249fd560a6e1afb3a8bcbbd836998d202bbad32bbe904fee54f30cbe
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4adb065e8c7ee3fd0605a6d2c5e5b87339b435d7f44ee128ff65fc58e188fae9
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:04f2377114f0045a9573af2c1b5089c23c13db9f92c475ef08d7a6bc3481f940
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.6713286713286714,
5
  "eval_steps": 2,
6
- "global_step": 6,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -39,6 +39,14 @@
39
  "eval_samples_per_second": 18.94,
40
  "eval_steps_per_second": 2.484,
41
  "step": 6
 
 
 
 
 
 
 
 
42
  }
43
  ],
44
  "logging_steps": 10,
@@ -53,12 +61,12 @@
53
  "should_evaluate": false,
54
  "should_log": false,
55
  "should_save": true,
56
- "should_training_stop": false
57
  },
58
  "attributes": {}
59
  }
60
  },
61
- "total_flos": 1.6825649272455168e+16,
62
  "train_batch_size": 8,
63
  "trial_name": null,
64
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 1.062937062937063,
5
  "eval_steps": 2,
6
+ "global_step": 9,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
39
  "eval_samples_per_second": 18.94,
40
  "eval_steps_per_second": 2.484,
41
  "step": 6
42
+ },
43
+ {
44
+ "epoch": 0.8951048951048951,
45
+ "eval_loss": 1.0419520139694214,
46
+ "eval_runtime": 3.2123,
47
+ "eval_samples_per_second": 18.99,
48
+ "eval_steps_per_second": 2.49,
49
+ "step": 8
50
  }
51
  ],
52
  "logging_steps": 10,
 
61
  "should_evaluate": false,
62
  "should_log": false,
63
  "should_save": true,
64
+ "should_training_stop": true
65
  },
66
  "attributes": {}
67
  }
68
  },
69
+ "total_flos": 2.523847390868275e+16,
70
  "train_batch_size": 8,
71
  "trial_name": null,
72
  "trial_params": null