TracyTank commited on
Commit
e83e0d4
1 Parent(s): a1b7936

Training in progress, step 724, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c9515a7002cfa7f67e6c746a7e59b868de77da444db2b95a7c9cb039f0922f08
3
  size 2145944
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:227f14b5a2687735006c73ead50afcc55eac9584005c145efe00d779c806789b
3
  size 2145944
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7971e0a79864672f8071d25876b2985e088af6d6ac063d1237778d2eaf4fd19b
3
  size 4310020
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d1a76c406a7be9b2b100b768746eaa7355f01cf42dc4eefe6eabcce6f8e87594
3
  size 4310020
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1b753a7aacbc56b237a570162811e1a71ee10b02e1bee93e6daab70cd4680802
3
  size 14960
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a35e5c3617dd4cf3452d6d89bc6fd0ebe6a2b8784de42225a2fdf51d60521b82
3
  size 14960
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c1fb5420c0f25e5f6b2392bd3436352035eb0debaec1745bf48bdc44f8008fc2
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd30e2f855940fa3e33d3978da3fd180418222584fe4f4d19f30d42f33e20efd
3
  size 15024
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e2c82e31e1ac17c78c3d52136bae19d297a1c91d03f90b220e02fe92fb6cac45
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:34c3af6f3adec49d0d0a6e9b544ac580b2e3a13bb94ed7476a3711d95a9ef6c6
3
  size 15024
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1705ef3a08286669695bd3c71729dc6c292514e0dbba93fac60bc2587d6740cc
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:67b2f832bdf633a8fbe2bd9786fa9777f8898f5039f16a5b1ec23b42e8ba211f
3
  size 15024
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:27ebf93c877c54673a5776fbfe0e2f8ca99926be562e6e5f55038ce1f0e80b42
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f34e97a6907c815b8e7fd063af05c447efd3bc0a06dcb158bac0d08e94243947
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.9893066574680924,
5
  "eval_steps": 500,
6
- "global_step": 717,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -5026,6 +5026,55 @@
5026
  "learning_rate": 3.10471474516183e-08,
5027
  "loss": 9.782,
5028
  "step": 717
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5029
  }
5030
  ],
5031
  "logging_steps": 1,
@@ -5040,12 +5089,12 @@
5040
  "should_evaluate": false,
5041
  "should_log": false,
5042
  "should_save": true,
5043
- "should_training_stop": false
5044
  },
5045
  "attributes": {}
5046
  }
5047
  },
5048
- "total_flos": 595349320237056.0,
5049
  "train_batch_size": 4,
5050
  "trial_name": null,
5051
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.9989651604001379,
5
  "eval_steps": 500,
6
+ "global_step": 724,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
5026
  "learning_rate": 3.10471474516183e-08,
5027
  "loss": 9.782,
5028
  "step": 717
5029
+ },
5030
+ {
5031
+ "epoch": 0.9906864436012418,
5032
+ "grad_norm": 1.1444123983383179,
5033
+ "learning_rate": 2.2810775523329773e-08,
5034
+ "loss": 9.7736,
5035
+ "step": 718
5036
+ },
5037
+ {
5038
+ "epoch": 0.9920662297343912,
5039
+ "grad_norm": 1.2123403549194336,
5040
+ "learning_rate": 1.5841184405462895e-08,
5041
+ "loss": 9.7574,
5042
+ "step": 719
5043
+ },
5044
+ {
5045
+ "epoch": 0.9934460158675406,
5046
+ "grad_norm": 1.313451886177063,
5047
+ "learning_rate": 1.0138550757493592e-08,
5048
+ "loss": 9.757,
5049
+ "step": 720
5050
+ },
5051
+ {
5052
+ "epoch": 0.9948258020006899,
5053
+ "grad_norm": 1.2594588994979858,
5054
+ "learning_rate": 5.703019125102849e-09,
5055
+ "loss": 9.744,
5056
+ "step": 721
5057
+ },
5058
+ {
5059
+ "epoch": 0.9962055881338393,
5060
+ "grad_norm": 1.3528109788894653,
5061
+ "learning_rate": 2.534701936512951e-09,
5062
+ "loss": 9.7332,
5063
+ "step": 722
5064
+ },
5065
+ {
5066
+ "epoch": 0.9975853742669886,
5067
+ "grad_norm": 1.4873722791671753,
5068
+ "learning_rate": 6.336794996231188e-10,
5069
+ "loss": 9.7142,
5070
+ "step": 723
5071
+ },
5072
+ {
5073
+ "epoch": 0.9989651604001379,
5074
+ "grad_norm": 1.4233864545822144,
5075
+ "learning_rate": 0.0,
5076
+ "loss": 9.7126,
5077
+ "step": 724
5078
  }
5079
  ],
5080
  "logging_steps": 1,
 
5089
  "should_evaluate": false,
5090
  "should_log": false,
5091
  "should_save": true,
5092
+ "should_training_stop": true
5093
  },
5094
  "attributes": {}
5095
  }
5096
  },
5097
+ "total_flos": 601161656696832.0,
5098
  "train_batch_size": 4,
5099
  "trial_name": null,
5100
  "trial_params": null