File size: 2,613 Bytes
3a3b1b6 40e6666 3a3b1b6 40e6666 3a3b1b6 40e6666 3a3b1b6 40e6666 3a3b1b6 e5c5089 40e6666 e5c5089 40e6666 e5c5089 d68298f 40e6666 d68298f 40e6666 d68298f d27a2cf 40e6666 d27a2cf 40e6666 d27a2cf 4d3928e 40e6666 4d3928e 40e6666 4d3928e f51b3be 40e6666 f51b3be 40e6666 f51b3be f288b13 40e6666 f288b13 40e6666 f288b13 3a3b1b6 40e6666 3a3b1b6 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 |
{
"best_metric": 2.451620578765869,
"best_model_checkpoint": "./outputs/checkpoint-700",
"epoch": 0.5100182149362478,
"eval_steps": 100,
"global_step": 700,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.07,
"learning_rate": 0.0002,
"loss": 2.7401,
"step": 100
},
{
"epoch": 0.07,
"eval_loss": 2.6424810886383057,
"eval_runtime": 206.4108,
"eval_samples_per_second": 30.396,
"eval_steps_per_second": 3.803,
"step": 100
},
{
"epoch": 0.15,
"learning_rate": 0.0002,
"loss": 2.6061,
"step": 200
},
{
"epoch": 0.15,
"eval_loss": 2.5929574966430664,
"eval_runtime": 206.2177,
"eval_samples_per_second": 30.424,
"eval_steps_per_second": 3.807,
"step": 200
},
{
"epoch": 0.22,
"learning_rate": 0.0002,
"loss": 2.5643,
"step": 300
},
{
"epoch": 0.22,
"eval_loss": 2.5578970909118652,
"eval_runtime": 206.509,
"eval_samples_per_second": 30.381,
"eval_steps_per_second": 3.801,
"step": 300
},
{
"epoch": 0.29,
"learning_rate": 0.0002,
"loss": 2.5383,
"step": 400
},
{
"epoch": 0.29,
"eval_loss": 2.5257716178894043,
"eval_runtime": 206.1349,
"eval_samples_per_second": 30.436,
"eval_steps_per_second": 3.808,
"step": 400
},
{
"epoch": 0.36,
"learning_rate": 0.0002,
"loss": 2.4959,
"step": 500
},
{
"epoch": 0.36,
"eval_loss": 2.5014102458953857,
"eval_runtime": 282.6461,
"eval_samples_per_second": 22.197,
"eval_steps_per_second": 2.777,
"step": 500
},
{
"epoch": 0.44,
"learning_rate": 0.0002,
"loss": 2.4693,
"step": 600
},
{
"epoch": 0.44,
"eval_loss": 2.475057601928711,
"eval_runtime": 205.7759,
"eval_samples_per_second": 30.489,
"eval_steps_per_second": 3.815,
"step": 600
},
{
"epoch": 0.51,
"learning_rate": 0.0002,
"loss": 2.4523,
"step": 700
},
{
"epoch": 0.51,
"eval_loss": 2.451620578765869,
"eval_runtime": 322.0554,
"eval_samples_per_second": 19.481,
"eval_steps_per_second": 2.437,
"step": 700
}
],
"logging_steps": 100,
"max_steps": 4116,
"num_train_epochs": 3,
"save_steps": 100,
"total_flos": 2.042513200078848e+16,
"trial_name": null,
"trial_params": null
}
|