File size: 2,003 Bytes
3a3b1b6 33f651f b6f00ee 3a3b1b6 b6f00ee 3a3b1b6 33f651f 3a3b1b6 33f651f 3a3b1b6 e5c5089 33f651f e5c5089 33f651f e5c5089 d68298f 33f651f d68298f 33f651f 83e2db3 d68298f d27a2cf 33f651f d27a2cf 33f651f d27a2cf 4d3928e 33f651f 4d3928e 33f651f 4d3928e 3a3b1b6 b6f00ee 3a3b1b6 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 |
{
"best_metric": 2.4934604167938232,
"best_model_checkpoint": "./outputs/checkpoint-500",
"epoch": 0.36429872495446264,
"eval_steps": 100,
"global_step": 500,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.07,
"learning_rate": 0.0002,
"loss": 2.7406,
"step": 100
},
{
"epoch": 0.07,
"eval_loss": 2.6424405574798584,
"eval_runtime": 206.8728,
"eval_samples_per_second": 30.328,
"eval_steps_per_second": 3.795,
"step": 100
},
{
"epoch": 0.15,
"learning_rate": 0.0002,
"loss": 2.6056,
"step": 200
},
{
"epoch": 0.15,
"eval_loss": 2.591430187225342,
"eval_runtime": 206.9647,
"eval_samples_per_second": 30.314,
"eval_steps_per_second": 3.793,
"step": 200
},
{
"epoch": 0.22,
"learning_rate": 0.0002,
"loss": 2.5631,
"step": 300
},
{
"epoch": 0.22,
"eval_loss": 2.5565075874328613,
"eval_runtime": 206.6263,
"eval_samples_per_second": 30.364,
"eval_steps_per_second": 3.799,
"step": 300
},
{
"epoch": 0.29,
"learning_rate": 0.0002,
"loss": 2.5363,
"step": 400
},
{
"epoch": 0.29,
"eval_loss": 2.5222103595733643,
"eval_runtime": 234.7988,
"eval_samples_per_second": 26.721,
"eval_steps_per_second": 3.343,
"step": 400
},
{
"epoch": 0.36,
"learning_rate": 0.0002,
"loss": 2.4935,
"step": 500
},
{
"epoch": 0.36,
"eval_loss": 2.4934604167938232,
"eval_runtime": 206.7039,
"eval_samples_per_second": 30.353,
"eval_steps_per_second": 3.798,
"step": 500
}
],
"logging_steps": 100,
"max_steps": 4116,
"num_train_epochs": 3,
"save_steps": 100,
"total_flos": 1.459702746464256e+16,
"trial_name": null,
"trial_params": null
}
|