|
{ |
|
"best_metric": 0.741686227084744, |
|
"best_model_checkpoint": "bart-base-lora/checkpoint-2400", |
|
"epoch": 14.930015552099533, |
|
"eval_steps": 500, |
|
"global_step": 2400, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"eval_accuracy": 0.715724244771495, |
|
"eval_f1_macro": 0.3957532686340496, |
|
"eval_f1_micro": 0.715724244771495, |
|
"eval_f1_weighted": 0.6834645556416842, |
|
"eval_loss": 0.9525313973426819, |
|
"eval_macro_fpr": 0.028501626692807605, |
|
"eval_macro_sensitivity": 0.4415906678049911, |
|
"eval_macro_specificity": 0.9786637894661117, |
|
"eval_precision": 0.6787596592263883, |
|
"eval_precision_macro": 0.38751339695744513, |
|
"eval_recall": 0.715724244771495, |
|
"eval_recall_macro": 0.4415906678049911, |
|
"eval_runtime": 120.9594, |
|
"eval_samples_per_second": 10.673, |
|
"eval_steps_per_second": 1.339, |
|
"eval_weighted_fpr": 0.027587762158911525, |
|
"eval_weighted_sensitivity": 0.715724244771495, |
|
"eval_weighted_specificity": 0.9642325972201805, |
|
"step": 160 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_accuracy": 0.7412858249419055, |
|
"eval_f1_macro": 0.43370046411892155, |
|
"eval_f1_micro": 0.7412858249419055, |
|
"eval_f1_weighted": 0.7231329193382661, |
|
"eval_loss": 0.7733433842658997, |
|
"eval_macro_fpr": 0.025167370687133015, |
|
"eval_macro_sensitivity": 0.4686708989603177, |
|
"eval_macro_specificity": 0.9805374797463638, |
|
"eval_precision": 0.729625861926521, |
|
"eval_precision_macro": 0.4491323101141271, |
|
"eval_recall": 0.7412858249419055, |
|
"eval_recall_macro": 0.4686708989603177, |
|
"eval_runtime": 119.8649, |
|
"eval_samples_per_second": 10.77, |
|
"eval_steps_per_second": 1.352, |
|
"eval_weighted_fpr": 0.024322749781532187, |
|
"eval_weighted_sensitivity": 0.7412858249419055, |
|
"eval_weighted_specificity": 0.9667763712535515, |
|
"step": 321 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_accuracy": 0.7738187451587917, |
|
"eval_f1_macro": 0.5270593942960143, |
|
"eval_f1_micro": 0.7738187451587917, |
|
"eval_f1_weighted": 0.7610767338978833, |
|
"eval_loss": 0.7104586958885193, |
|
"eval_macro_fpr": 0.021211805484311928, |
|
"eval_macro_sensitivity": 0.5407847836684627, |
|
"eval_macro_specificity": 0.9830897092527341, |
|
"eval_precision": 0.7630858215778352, |
|
"eval_precision_macro": 0.5565386466479504, |
|
"eval_recall": 0.7738187451587917, |
|
"eval_recall_macro": 0.5407847836684627, |
|
"eval_runtime": 119.5419, |
|
"eval_samples_per_second": 10.8, |
|
"eval_steps_per_second": 1.355, |
|
"eval_weighted_fpr": 0.020451043563524302, |
|
"eval_weighted_sensitivity": 0.7738187451587917, |
|
"eval_weighted_specificity": 0.9725268936322198, |
|
"step": 482 |
|
}, |
|
{ |
|
"epoch": 3.11, |
|
"learning_rate": 3.958333333333333e-05, |
|
"loss": 1.08, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_accuracy": 0.7575522850503486, |
|
"eval_f1_macro": 0.5497163954183316, |
|
"eval_f1_micro": 0.7575522850503486, |
|
"eval_f1_weighted": 0.7437674055775699, |
|
"eval_loss": 0.7538753151893616, |
|
"eval_macro_fpr": 0.023393901824967867, |
|
"eval_macro_sensitivity": 0.5613408412198008, |
|
"eval_macro_specificity": 0.9817091819688993, |
|
"eval_precision": 0.7583906478192325, |
|
"eval_precision_macro": 0.5791225123984725, |
|
"eval_recall": 0.7575522850503486, |
|
"eval_recall_macro": 0.5613408412198008, |
|
"eval_runtime": 120.3095, |
|
"eval_samples_per_second": 10.731, |
|
"eval_steps_per_second": 1.347, |
|
"eval_weighted_fpr": 0.022349161013923598, |
|
"eval_weighted_sensitivity": 0.7575522850503486, |
|
"eval_weighted_specificity": 0.9680854444831427, |
|
"step": 643 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_accuracy": 0.7831138652207591, |
|
"eval_f1_macro": 0.6353946839596228, |
|
"eval_f1_micro": 0.783113865220759, |
|
"eval_f1_weighted": 0.770250750407997, |
|
"eval_loss": 0.6978110074996948, |
|
"eval_macro_fpr": 0.020328728105215688, |
|
"eval_macro_sensitivity": 0.6491872351233146, |
|
"eval_macro_specificity": 0.983610303127039, |
|
"eval_precision": 0.790031827496624, |
|
"eval_precision_macro": 0.7409525878258343, |
|
"eval_recall": 0.7831138652207591, |
|
"eval_recall_macro": 0.6491872351233146, |
|
"eval_runtime": 119.9411, |
|
"eval_samples_per_second": 10.764, |
|
"eval_steps_per_second": 1.351, |
|
"eval_weighted_fpr": 0.019398642095053348, |
|
"eval_weighted_sensitivity": 0.7831138652207591, |
|
"eval_weighted_specificity": 0.9710406816848265, |
|
"step": 803 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_accuracy": 0.8156467854376452, |
|
"eval_f1_macro": 0.686011065139391, |
|
"eval_f1_micro": 0.8156467854376452, |
|
"eval_f1_weighted": 0.8087620976325791, |
|
"eval_loss": 0.5920090675354004, |
|
"eval_macro_fpr": 0.016634568189926056, |
|
"eval_macro_sensitivity": 0.6889168814632094, |
|
"eval_macro_specificity": 0.9860196319752603, |
|
"eval_precision": 0.8053079350996695, |
|
"eval_precision_macro": 0.7051361586363433, |
|
"eval_recall": 0.8156467854376452, |
|
"eval_recall_macro": 0.6889168814632094, |
|
"eval_runtime": 121.4244, |
|
"eval_samples_per_second": 10.632, |
|
"eval_steps_per_second": 1.334, |
|
"eval_weighted_fpr": 0.01588785046728972, |
|
"eval_weighted_sensitivity": 0.8156467854376452, |
|
"eval_weighted_specificity": 0.974647694191258, |
|
"step": 964 |
|
}, |
|
{ |
|
"epoch": 6.22, |
|
"learning_rate": 2.916666666666667e-05, |
|
"loss": 0.5581, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_accuracy": 0.8187451587916343, |
|
"eval_f1_macro": 0.7393184269658342, |
|
"eval_f1_micro": 0.8187451587916342, |
|
"eval_f1_weighted": 0.8146848849127107, |
|
"eval_loss": 0.6230757236480713, |
|
"eval_macro_fpr": 0.016206558639896132, |
|
"eval_macro_sensitivity": 0.7424574536250088, |
|
"eval_macro_specificity": 0.9863587851767341, |
|
"eval_precision": 0.8177894369587694, |
|
"eval_precision_macro": 0.7626654223433325, |
|
"eval_recall": 0.8187451587916343, |
|
"eval_recall_macro": 0.7424574536250088, |
|
"eval_runtime": 122.7775, |
|
"eval_samples_per_second": 10.515, |
|
"eval_steps_per_second": 1.319, |
|
"eval_weighted_fpr": 0.015566790846194785, |
|
"eval_weighted_sensitivity": 0.8187451587916343, |
|
"eval_weighted_specificity": 0.9766366188593788, |
|
"step": 1125 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_accuracy": 0.8140975987606507, |
|
"eval_f1_macro": 0.7328585966804847, |
|
"eval_f1_micro": 0.8140975987606507, |
|
"eval_f1_weighted": 0.8088643288992207, |
|
"eval_loss": 0.6290707588195801, |
|
"eval_macro_fpr": 0.01671628651715199, |
|
"eval_macro_sensitivity": 0.730719512015592, |
|
"eval_macro_specificity": 0.985990627132147, |
|
"eval_precision": 0.8133783130550384, |
|
"eval_precision_macro": 0.7636063765511063, |
|
"eval_recall": 0.8140975987606507, |
|
"eval_recall_macro": 0.730719512015592, |
|
"eval_runtime": 122.8754, |
|
"eval_samples_per_second": 10.507, |
|
"eval_steps_per_second": 1.318, |
|
"eval_weighted_fpr": 0.016049217600641968, |
|
"eval_weighted_sensitivity": 0.8140975987606507, |
|
"eval_weighted_specificity": 0.975761808221554, |
|
"step": 1286 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_accuracy": 0.8241673121611154, |
|
"eval_f1_macro": 0.7364711129039813, |
|
"eval_f1_micro": 0.8241673121611154, |
|
"eval_f1_weighted": 0.8190822404938951, |
|
"eval_loss": 0.6226187348365784, |
|
"eval_macro_fpr": 0.015759087941173786, |
|
"eval_macro_sensitivity": 0.7340167949600996, |
|
"eval_macro_specificity": 0.9866810242390173, |
|
"eval_precision": 0.8212295601295609, |
|
"eval_precision_macro": 0.7665878963082912, |
|
"eval_recall": 0.8241673121611154, |
|
"eval_recall_macro": 0.7340167949600996, |
|
"eval_runtime": 119.2726, |
|
"eval_samples_per_second": 10.824, |
|
"eval_steps_per_second": 1.358, |
|
"eval_weighted_fpr": 0.015010249289162203, |
|
"eval_weighted_sensitivity": 0.8241673121611154, |
|
"eval_weighted_specificity": 0.9760480514241424, |
|
"step": 1446 |
|
}, |
|
{ |
|
"epoch": 9.33, |
|
"learning_rate": 1.8750000000000002e-05, |
|
"loss": 0.3924, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_accuracy": 0.8109992254066615, |
|
"eval_f1_macro": 0.7240137823928982, |
|
"eval_f1_micro": 0.8109992254066615, |
|
"eval_f1_weighted": 0.8047604071311991, |
|
"eval_loss": 0.672822892665863, |
|
"eval_macro_fpr": 0.017004063571327103, |
|
"eval_macro_sensitivity": 0.7288750805513627, |
|
"eval_macro_specificity": 0.9858130697255809, |
|
"eval_precision": 0.8123042127541057, |
|
"eval_precision_macro": 0.7417780746962291, |
|
"eval_recall": 0.8109992254066615, |
|
"eval_recall_macro": 0.7288750805513627, |
|
"eval_runtime": 119.3649, |
|
"eval_samples_per_second": 10.816, |
|
"eval_steps_per_second": 1.357, |
|
"eval_weighted_fpr": 0.016373641121997046, |
|
"eval_weighted_sensitivity": 0.8109992254066615, |
|
"eval_weighted_specificity": 0.976196820477052, |
|
"step": 1607 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"eval_accuracy": 0.8094500387296669, |
|
"eval_f1_macro": 0.7262574438118878, |
|
"eval_f1_micro": 0.8094500387296669, |
|
"eval_f1_weighted": 0.8026446222230169, |
|
"eval_loss": 0.6805150508880615, |
|
"eval_macro_fpr": 0.017269448415116812, |
|
"eval_macro_sensitivity": 0.7303446738424816, |
|
"eval_macro_specificity": 0.9856433903766489, |
|
"eval_precision": 0.8123272064418959, |
|
"eval_precision_macro": 0.7389776120628855, |
|
"eval_recall": 0.8094500387296669, |
|
"eval_recall_macro": 0.7303446738424816, |
|
"eval_runtime": 119.049, |
|
"eval_samples_per_second": 10.844, |
|
"eval_steps_per_second": 1.361, |
|
"eval_weighted_fpr": 0.016536703414896478, |
|
"eval_weighted_sensitivity": 0.8094500387296669, |
|
"eval_weighted_specificity": 0.9752008169200658, |
|
"step": 1768 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"eval_accuracy": 0.8133230054221534, |
|
"eval_f1_macro": 0.7283700928598721, |
|
"eval_f1_micro": 0.8133230054221534, |
|
"eval_f1_weighted": 0.8089952243674349, |
|
"eval_loss": 0.670982301235199, |
|
"eval_macro_fpr": 0.016803062086639158, |
|
"eval_macro_sensitivity": 0.7306161057668827, |
|
"eval_macro_specificity": 0.9859491188467968, |
|
"eval_precision": 0.813705327621, |
|
"eval_precision_macro": 0.7396207219727483, |
|
"eval_recall": 0.8133230054221534, |
|
"eval_recall_macro": 0.7306161057668827, |
|
"eval_runtime": 179.3033, |
|
"eval_samples_per_second": 7.2, |
|
"eval_steps_per_second": 0.903, |
|
"eval_weighted_fpr": 0.016130111772973698, |
|
"eval_weighted_sensitivity": 0.8133230054221534, |
|
"eval_weighted_specificity": 0.9759137772797981, |
|
"step": 1929 |
|
}, |
|
{ |
|
"epoch": 12.44, |
|
"learning_rate": 8.333333333333334e-06, |
|
"loss": 0.2929, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"eval_accuracy": 0.8187451587916343, |
|
"eval_f1_macro": 0.73684785586885, |
|
"eval_f1_micro": 0.8187451587916342, |
|
"eval_f1_weighted": 0.8150888108444543, |
|
"eval_loss": 0.6740049719810486, |
|
"eval_macro_fpr": 0.01621356652381048, |
|
"eval_macro_sensitivity": 0.7360046444502426, |
|
"eval_macro_specificity": 0.9863212120014355, |
|
"eval_precision": 0.8169592155695241, |
|
"eval_precision_macro": 0.7644187374870298, |
|
"eval_recall": 0.8187451587916343, |
|
"eval_recall_macro": 0.7360046444502426, |
|
"eval_runtime": 119.1613, |
|
"eval_samples_per_second": 10.834, |
|
"eval_steps_per_second": 1.36, |
|
"eval_weighted_fpr": 0.015566790846194785, |
|
"eval_weighted_sensitivity": 0.8187451587916343, |
|
"eval_weighted_specificity": 0.9760730212298985, |
|
"step": 2089 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"eval_accuracy": 0.8179705654531371, |
|
"eval_f1_macro": 0.7360855331051521, |
|
"eval_f1_micro": 0.817970565453137, |
|
"eval_f1_weighted": 0.8136558284635095, |
|
"eval_loss": 0.6823435425758362, |
|
"eval_macro_fpr": 0.016364294303971197, |
|
"eval_macro_sensitivity": 0.7336475818062481, |
|
"eval_macro_specificity": 0.9862178349089701, |
|
"eval_precision": 0.8158757496725866, |
|
"eval_precision_macro": 0.7657492044841306, |
|
"eval_recall": 0.8179705654531371, |
|
"eval_recall_macro": 0.7336475818062481, |
|
"eval_runtime": 119.9116, |
|
"eval_samples_per_second": 10.766, |
|
"eval_steps_per_second": 1.351, |
|
"eval_weighted_fpr": 0.01564684732671949, |
|
"eval_weighted_sensitivity": 0.8179705654531371, |
|
"eval_weighted_specificity": 0.9752969581814132, |
|
"step": 2250 |
|
}, |
|
{ |
|
"epoch": 14.93, |
|
"eval_accuracy": 0.8171959721146398, |
|
"eval_f1_macro": 0.741686227084744, |
|
"eval_f1_micro": 0.8171959721146398, |
|
"eval_f1_weighted": 0.8123666303237236, |
|
"eval_loss": 0.6883538365364075, |
|
"eval_macro_fpr": 0.016431634793055545, |
|
"eval_macro_sensitivity": 0.7412016365606894, |
|
"eval_macro_specificity": 0.9861826479575689, |
|
"eval_precision": 0.8131542275099815, |
|
"eval_precision_macro": 0.7584490957896397, |
|
"eval_recall": 0.8171959721146398, |
|
"eval_recall_macro": 0.7412016365606894, |
|
"eval_runtime": 120.2818, |
|
"eval_samples_per_second": 10.733, |
|
"eval_steps_per_second": 1.347, |
|
"eval_weighted_fpr": 0.015727042516326804, |
|
"eval_weighted_sensitivity": 0.8171959721146398, |
|
"eval_weighted_specificity": 0.975543747248895, |
|
"step": 2400 |
|
} |
|
], |
|
"logging_steps": 500, |
|
"max_steps": 2400, |
|
"num_train_epochs": 15, |
|
"save_steps": 500, |
|
"total_flos": 8.542715907800678e+16, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|