File size: 1,696 Bytes
3a3b1b6 e1a84d3 b1477f3 3a3b1b6 b1477f3 3a3b1b6 e1a84d3 3a3b1b6 e1a84d3 3a3b1b6 e5c5089 e1a84d3 e5c5089 e1a84d3 e5c5089 d68298f e1a84d3 d68298f e1a84d3 ef3b019 d68298f d27a2cf e1a84d3 d27a2cf e1a84d3 d27a2cf 3a3b1b6 b1477f3 3a3b1b6 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 |
{
"best_metric": 2.5222103595733643,
"best_model_checkpoint": "./outputs/checkpoint-400",
"epoch": 0.29143897996357016,
"eval_steps": 100,
"global_step": 400,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.07,
"learning_rate": 0.0002,
"loss": 2.7406,
"step": 100
},
{
"epoch": 0.07,
"eval_loss": 2.6424405574798584,
"eval_runtime": 206.8728,
"eval_samples_per_second": 30.328,
"eval_steps_per_second": 3.795,
"step": 100
},
{
"epoch": 0.15,
"learning_rate": 0.0002,
"loss": 2.6056,
"step": 200
},
{
"epoch": 0.15,
"eval_loss": 2.591430187225342,
"eval_runtime": 206.9647,
"eval_samples_per_second": 30.314,
"eval_steps_per_second": 3.793,
"step": 200
},
{
"epoch": 0.22,
"learning_rate": 0.0002,
"loss": 2.5631,
"step": 300
},
{
"epoch": 0.22,
"eval_loss": 2.5565075874328613,
"eval_runtime": 206.6263,
"eval_samples_per_second": 30.364,
"eval_steps_per_second": 3.799,
"step": 300
},
{
"epoch": 0.29,
"learning_rate": 0.0002,
"loss": 2.5363,
"step": 400
},
{
"epoch": 0.29,
"eval_loss": 2.5222103595733643,
"eval_runtime": 234.7988,
"eval_samples_per_second": 26.721,
"eval_steps_per_second": 3.343,
"step": 400
}
],
"logging_steps": 100,
"max_steps": 4116,
"num_train_epochs": 3,
"save_steps": 100,
"total_flos": 1.167856193839104e+16,
"trial_name": null,
"trial_params": null
}
|