File size: 2,222 Bytes
68c0706 50808b6 d7eb129 68c0706 50808b6 68c0706 50808b6 68c0706 50808b6 68c0706 50808b6 68c0706 50808b6 d7eb129 c537bc2 50808b6 d7eb129 50808b6 25946e5 16c8fbd 50808b6 16c8fbd 50808b6 d7eb129 50808b6 16c8fbd 50808b6 16c8fbd 50808b6 16c8fbd 50808b6 16c8fbd 50808b6 16c8fbd 68c0706 50808b6 68c0706 50808b6 68c0706 50808b6 68c0706 50808b6 68c0706 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 |
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 0.5,
"eval_steps": 3,
"global_step": 6,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.08333333333333333,
"grad_norm": null,
"learning_rate": 0.0,
"loss": 1.4927,
"step": 1
},
{
"epoch": 0.08333333333333333,
"eval_loss": 1.4977792501449585,
"eval_runtime": 0.3019,
"eval_samples_per_second": 9.937,
"eval_steps_per_second": 9.937,
"step": 1
},
{
"epoch": 0.16666666666666666,
"grad_norm": 4.949731349945068,
"learning_rate": 2e-05,
"loss": 1.307,
"step": 2
},
{
"epoch": 0.25,
"grad_norm": 5.8763322830200195,
"learning_rate": 4e-05,
"loss": 1.5735,
"step": 3
},
{
"epoch": 0.25,
"eval_loss": 1.4451128244400024,
"eval_runtime": 0.4158,
"eval_samples_per_second": 7.215,
"eval_steps_per_second": 7.215,
"step": 3
},
{
"epoch": 0.3333333333333333,
"grad_norm": 4.730646133422852,
"learning_rate": 6e-05,
"loss": 1.2767,
"step": 4
},
{
"epoch": 0.4166666666666667,
"grad_norm": 3.4440248012542725,
"learning_rate": 8e-05,
"loss": 1.3011,
"step": 5
},
{
"epoch": 0.5,
"grad_norm": 2.8259096145629883,
"learning_rate": 0.0001,
"loss": 1.0815,
"step": 6
},
{
"epoch": 0.5,
"eval_loss": 0.816199779510498,
"eval_runtime": 0.4516,
"eval_samples_per_second": 6.643,
"eval_steps_per_second": 6.643,
"step": 6
}
],
"logging_steps": 1,
"max_steps": 10,
"num_input_tokens_seen": 0,
"num_train_epochs": 1,
"save_steps": 3,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": false
},
"attributes": {}
}
},
"total_flos": 1109738548887552.0,
"train_batch_size": 1,
"trial_name": null,
"trial_params": null
}
|