Training in progress, step 724, checkpoint
Browse files- last-checkpoint/adapter_model.safetensors +1 -1
- last-checkpoint/optimizer.pt +1 -1
- last-checkpoint/rng_state_0.pth +1 -1
- last-checkpoint/rng_state_1.pth +1 -1
- last-checkpoint/rng_state_2.pth +1 -1
- last-checkpoint/rng_state_3.pth +1 -1
- last-checkpoint/scheduler.pt +1 -1
- last-checkpoint/trainer_state.json +53 -4
last-checkpoint/adapter_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 2145944
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:227f14b5a2687735006c73ead50afcc55eac9584005c145efe00d779c806789b
|
3 |
size 2145944
|
last-checkpoint/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4310020
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d1a76c406a7be9b2b100b768746eaa7355f01cf42dc4eefe6eabcce6f8e87594
|
3 |
size 4310020
|
last-checkpoint/rng_state_0.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14960
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a35e5c3617dd4cf3452d6d89bc6fd0ebe6a2b8784de42225a2fdf51d60521b82
|
3 |
size 14960
|
last-checkpoint/rng_state_1.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dd30e2f855940fa3e33d3978da3fd180418222584fe4f4d19f30d42f33e20efd
|
3 |
size 15024
|
last-checkpoint/rng_state_2.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:34c3af6f3adec49d0d0a6e9b544ac580b2e3a13bb94ed7476a3711d95a9ef6c6
|
3 |
size 15024
|
last-checkpoint/rng_state_3.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:67b2f832bdf633a8fbe2bd9786fa9777f8898f5039f16a5b1ec23b42e8ba211f
|
3 |
size 15024
|
last-checkpoint/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1064
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f34e97a6907c815b8e7fd063af05c447efd3bc0a06dcb158bac0d08e94243947
|
3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
@@ -1,9 +1,9 @@
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
-
"epoch": 0.
|
5 |
"eval_steps": 500,
|
6 |
-
"global_step":
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
@@ -5026,6 +5026,55 @@
|
|
5026 |
"learning_rate": 3.10471474516183e-08,
|
5027 |
"loss": 9.782,
|
5028 |
"step": 717
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
5029 |
}
|
5030 |
],
|
5031 |
"logging_steps": 1,
|
@@ -5040,12 +5089,12 @@
|
|
5040 |
"should_evaluate": false,
|
5041 |
"should_log": false,
|
5042 |
"should_save": true,
|
5043 |
-
"should_training_stop":
|
5044 |
},
|
5045 |
"attributes": {}
|
5046 |
}
|
5047 |
},
|
5048 |
-
"total_flos":
|
5049 |
"train_batch_size": 4,
|
5050 |
"trial_name": null,
|
5051 |
"trial_params": null
|
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
+
"epoch": 0.9989651604001379,
|
5 |
"eval_steps": 500,
|
6 |
+
"global_step": 724,
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
|
|
5026 |
"learning_rate": 3.10471474516183e-08,
|
5027 |
"loss": 9.782,
|
5028 |
"step": 717
|
5029 |
+
},
|
5030 |
+
{
|
5031 |
+
"epoch": 0.9906864436012418,
|
5032 |
+
"grad_norm": 1.1444123983383179,
|
5033 |
+
"learning_rate": 2.2810775523329773e-08,
|
5034 |
+
"loss": 9.7736,
|
5035 |
+
"step": 718
|
5036 |
+
},
|
5037 |
+
{
|
5038 |
+
"epoch": 0.9920662297343912,
|
5039 |
+
"grad_norm": 1.2123403549194336,
|
5040 |
+
"learning_rate": 1.5841184405462895e-08,
|
5041 |
+
"loss": 9.7574,
|
5042 |
+
"step": 719
|
5043 |
+
},
|
5044 |
+
{
|
5045 |
+
"epoch": 0.9934460158675406,
|
5046 |
+
"grad_norm": 1.313451886177063,
|
5047 |
+
"learning_rate": 1.0138550757493592e-08,
|
5048 |
+
"loss": 9.757,
|
5049 |
+
"step": 720
|
5050 |
+
},
|
5051 |
+
{
|
5052 |
+
"epoch": 0.9948258020006899,
|
5053 |
+
"grad_norm": 1.2594588994979858,
|
5054 |
+
"learning_rate": 5.703019125102849e-09,
|
5055 |
+
"loss": 9.744,
|
5056 |
+
"step": 721
|
5057 |
+
},
|
5058 |
+
{
|
5059 |
+
"epoch": 0.9962055881338393,
|
5060 |
+
"grad_norm": 1.3528109788894653,
|
5061 |
+
"learning_rate": 2.534701936512951e-09,
|
5062 |
+
"loss": 9.7332,
|
5063 |
+
"step": 722
|
5064 |
+
},
|
5065 |
+
{
|
5066 |
+
"epoch": 0.9975853742669886,
|
5067 |
+
"grad_norm": 1.4873722791671753,
|
5068 |
+
"learning_rate": 6.336794996231188e-10,
|
5069 |
+
"loss": 9.7142,
|
5070 |
+
"step": 723
|
5071 |
+
},
|
5072 |
+
{
|
5073 |
+
"epoch": 0.9989651604001379,
|
5074 |
+
"grad_norm": 1.4233864545822144,
|
5075 |
+
"learning_rate": 0.0,
|
5076 |
+
"loss": 9.7126,
|
5077 |
+
"step": 724
|
5078 |
}
|
5079 |
],
|
5080 |
"logging_steps": 1,
|
|
|
5089 |
"should_evaluate": false,
|
5090 |
"should_log": false,
|
5091 |
"should_save": true,
|
5092 |
+
"should_training_stop": true
|
5093 |
},
|
5094 |
"attributes": {}
|
5095 |
}
|
5096 |
},
|
5097 |
+
"total_flos": 601161656696832.0,
|
5098 |
"train_batch_size": 4,
|
5099 |
"trial_name": null,
|
5100 |
"trial_params": null
|