File size: 5,293 Bytes
a9b258a |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 |
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 20.13422818791946,
"global_step": 3000,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 3.36,
"eval_accuracy": 0.9206798866855525,
"eval_f1": 0.9303482587064678,
"eval_loss": 0.2345595508813858,
"eval_precision": 0.919672131147541,
"eval_recall": 0.9412751677852349,
"eval_report": " precision recall f1-score support\n\n 0 0.92 0.89 0.91 463\n 1 0.92 0.94 0.93 596\n\n accuracy 0.92 1059\n macro avg 0.92 0.92 0.92 1059\nweighted avg 0.92 0.92 0.92 1059\n",
"eval_runtime": 8.0364,
"eval_samples_per_second": 131.775,
"eval_steps_per_second": 8.337,
"step": 500
},
{
"epoch": 6.71,
"learning_rate": 4e-05,
"loss": 0.2212,
"step": 1000
},
{
"epoch": 6.71,
"eval_accuracy": 0.9046270066100094,
"eval_f1": 0.9141886151231945,
"eval_loss": 0.31608325242996216,
"eval_precision": 0.9259896729776248,
"eval_recall": 0.9026845637583892,
"eval_report": " precision recall f1-score support\n\n 0 0.88 0.91 0.89 463\n 1 0.93 0.90 0.91 596\n\n accuracy 0.90 1059\n macro avg 0.90 0.90 0.90 1059\nweighted avg 0.91 0.90 0.90 1059\n",
"eval_runtime": 8.0054,
"eval_samples_per_second": 132.285,
"eval_steps_per_second": 8.369,
"step": 1000
},
{
"epoch": 10.07,
"eval_accuracy": 0.9065155807365439,
"eval_f1": 0.9167367535744324,
"eval_loss": 0.43374723196029663,
"eval_precision": 0.9190556492411467,
"eval_recall": 0.9144295302013423,
"eval_report": " precision recall f1-score support\n\n 0 0.89 0.90 0.89 463\n 1 0.92 0.91 0.92 596\n\n accuracy 0.91 1059\n macro avg 0.90 0.91 0.91 1059\nweighted avg 0.91 0.91 0.91 1059\n",
"eval_runtime": 8.0154,
"eval_samples_per_second": 132.12,
"eval_steps_per_second": 8.359,
"step": 1500
},
{
"epoch": 13.42,
"learning_rate": 2e-05,
"loss": 0.0651,
"step": 2000
},
{
"epoch": 13.42,
"eval_accuracy": 0.9178470254957507,
"eval_f1": 0.9271966527196652,
"eval_loss": 0.47431105375289917,
"eval_precision": 0.9248747913188647,
"eval_recall": 0.9295302013422819,
"eval_report": " precision recall f1-score support\n\n 0 0.91 0.90 0.91 463\n 1 0.92 0.93 0.93 596\n\n accuracy 0.92 1059\n macro avg 0.92 0.92 0.92 1059\nweighted avg 0.92 0.92 0.92 1059\n",
"eval_runtime": 8.0135,
"eval_samples_per_second": 132.152,
"eval_steps_per_second": 8.361,
"step": 2000
},
{
"epoch": 16.78,
"eval_accuracy": 0.9102927289896129,
"eval_f1": 0.9203688181056161,
"eval_loss": 0.5537705421447754,
"eval_precision": 0.9195979899497487,
"eval_recall": 0.9211409395973155,
"eval_report": " precision recall f1-score support\n\n 0 0.90 0.90 0.90 463\n 1 0.92 0.92 0.92 596\n\n accuracy 0.91 1059\n macro avg 0.91 0.91 0.91 1059\nweighted avg 0.91 0.91 0.91 1059\n",
"eval_runtime": 8.0263,
"eval_samples_per_second": 131.941,
"eval_steps_per_second": 8.348,
"step": 2500
},
{
"epoch": 20.13,
"learning_rate": 0.0,
"loss": 0.0296,
"step": 3000
},
{
"epoch": 20.13,
"eval_accuracy": 0.9102927289896129,
"eval_f1": 0.9199663016006739,
"eval_loss": 0.6190621256828308,
"eval_precision": 0.9238578680203046,
"eval_recall": 0.9161073825503355,
"eval_report": " precision recall f1-score support\n\n 0 0.89 0.90 0.90 463\n 1 0.92 0.92 0.92 596\n\n accuracy 0.91 1059\n macro avg 0.91 0.91 0.91 1059\nweighted avg 0.91 0.91 0.91 1059\n",
"eval_runtime": 8.0249,
"eval_samples_per_second": 131.965,
"eval_steps_per_second": 8.349,
"step": 3000
},
{
"epoch": 20.13,
"step": 3000,
"total_flos": 5.04436515336192e+16,
"train_loss": 0.10527635129292806,
"train_runtime": 3964.4436,
"train_samples_per_second": 48.431,
"train_steps_per_second": 0.757
}
],
"max_steps": 3000,
"num_train_epochs": 21,
"total_flos": 5.04436515336192e+16,
"trial_name": null,
"trial_params": null
}
|