UMBERTO_fine-tuned_DocClass_PA / trainer_state.json
Auriemma's picture
Upload 11 files
97902cd
raw
history blame
34.7 kB
{
"best_metric": 0.8937805730258561,
"best_model_checkpoint": "umberto-commoncrawl-cased/checkpoint-5510",
"epoch": 10.0,
"global_step": 5510,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.91,
"learning_rate": 1.8185117967332124e-05,
"loss": 0.3388,
"step": 500
},
{
"epoch": 1.0,
"eval_accuracy": 0.3091239219246482,
"eval_f1": 0.6689956331877728,
"eval_loss": 0.23511561751365662,
"eval_report": {
"0": {
"f1-score": 0.0,
"precision": 0.0,
"recall": 0.0,
"support": 40
},
"1": {
"f1-score": 0.0,
"precision": 0.0,
"recall": 0.0,
"support": 135
},
"10": {
"f1-score": 0.7397260273972603,
"precision": 0.8957345971563981,
"recall": 0.63,
"support": 300
},
"11": {
"f1-score": 0.0,
"precision": 0.0,
"recall": 0.0,
"support": 285
},
"12": {
"f1-score": 0.16611295681063123,
"precision": 0.9615384615384616,
"recall": 0.09090909090909091,
"support": 275
},
"2": {
"f1-score": 0.0,
"precision": 0.0,
"recall": 0.0,
"support": 86
},
"3": {
"f1-score": 0.6111111111111112,
"precision": 0.9285714285714286,
"recall": 0.4554140127388535,
"support": 314
},
"4": {
"f1-score": 0.8102429415627053,
"precision": 0.8510344827586207,
"recall": 0.7731829573934837,
"support": 798
},
"5": {
"f1-score": 0.8079470198675497,
"precision": 0.9003690036900369,
"recall": 0.7327327327327328,
"support": 333
},
"6": {
"f1-score": 0.38190954773869346,
"precision": 0.987012987012987,
"recall": 0.2367601246105919,
"support": 321
},
"7": {
"f1-score": 0.0,
"precision": 0.0,
"recall": 0.0,
"support": 199
},
"8": {
"f1-score": 0.9444967074317967,
"precision": 0.9561904761904761,
"recall": 0.9330855018587361,
"support": 1076
},
"9": {
"f1-score": 0.0,
"precision": 0.0,
"recall": 0.0,
"support": 194
},
"macro avg": {
"f1-score": 0.34319587014767294,
"precision": 0.4984962643783391,
"recall": 0.29631418617257604,
"support": 4356
},
"micro avg": {
"f1-score": 0.6689956331877728,
"precision": 0.9140811455847255,
"recall": 0.5275482093663911,
"support": 4356
},
"samples avg": {
"f1-score": 0.5890755031018308,
"precision": 0.7131941292177334,
"recall": 0.5347253744893328,
"support": 4356
},
"weighted avg": {
"f1-score": 0.5771302587774695,
"precision": 0.7229925163736703,
"recall": 0.5275482093663911,
"support": 4356
}
},
"eval_roc_auc": 0.7593265487798887,
"eval_runtime": 25.8816,
"eval_samples_per_second": 85.119,
"eval_steps_per_second": 5.332,
"step": 551
},
{
"epoch": 1.81,
"learning_rate": 1.637023593466425e-05,
"loss": 0.2063,
"step": 1000
},
{
"epoch": 2.0,
"eval_accuracy": 0.5206536541080345,
"eval_f1": 0.8021708231037601,
"eval_loss": 0.17003820836544037,
"eval_report": {
"0": {
"f1-score": 0.0,
"precision": 0.0,
"recall": 0.0,
"support": 40
},
"1": {
"f1-score": 0.8755020080321286,
"precision": 0.956140350877193,
"recall": 0.8074074074074075,
"support": 135
},
"10": {
"f1-score": 0.7489711934156379,
"precision": 0.978494623655914,
"recall": 0.6066666666666667,
"support": 300
},
"11": {
"f1-score": 0.7182539682539681,
"precision": 0.8264840182648402,
"recall": 0.6350877192982456,
"support": 285
},
"12": {
"f1-score": 0.7465069860279441,
"precision": 0.827433628318584,
"recall": 0.68,
"support": 275
},
"2": {
"f1-score": 0.0,
"precision": 0.0,
"recall": 0.0,
"support": 86
},
"3": {
"f1-score": 0.6543209876543209,
"precision": 0.9244186046511628,
"recall": 0.5063694267515924,
"support": 314
},
"4": {
"f1-score": 0.8340136054421768,
"precision": 0.9122023809523809,
"recall": 0.768170426065163,
"support": 798
},
"5": {
"f1-score": 0.8135593220338982,
"precision": 0.933852140077821,
"recall": 0.7207207207207207,
"support": 333
},
"6": {
"f1-score": 0.8043875685557588,
"precision": 0.9734513274336283,
"recall": 0.6853582554517134,
"support": 321
},
"7": {
"f1-score": 0.5405405405405406,
"precision": 0.8247422680412371,
"recall": 0.4020100502512563,
"support": 199
},
"8": {
"f1-score": 0.9505316689782709,
"precision": 0.9457221711131555,
"recall": 0.9553903345724907,
"support": 1076
},
"9": {
"f1-score": 0.6542056074766355,
"precision": 0.8267716535433071,
"recall": 0.5412371134020618,
"support": 194
},
"macro avg": {
"f1-score": 0.6415994966470216,
"precision": 0.7638240897637865,
"recall": 0.5621860092759475,
"support": 4356
},
"micro avg": {
"f1-score": 0.8021708231037601,
"precision": 0.9175288205734555,
"recall": 0.7125803489439853,
"support": 4356
},
"samples avg": {
"f1-score": 0.7855154226920001,
"precision": 0.884627023755485,
"recall": 0.7412240883643516,
"support": 4356
},
"weighted avg": {
"f1-score": 0.7828867707685374,
"precision": 0.8883125749118967,
"recall": 0.7125803489439853,
"support": 4356
}
},
"eval_roc_auc": 0.8505454147635545,
"eval_runtime": 25.8749,
"eval_samples_per_second": 85.141,
"eval_steps_per_second": 5.333,
"step": 1102
},
{
"epoch": 2.72,
"learning_rate": 1.4555353901996372e-05,
"loss": 0.1508,
"step": 1500
},
{
"epoch": 3.0,
"eval_accuracy": 0.5969133000453927,
"eval_f1": 0.8439663699307616,
"eval_loss": 0.13934455811977386,
"eval_report": {
"0": {
"f1-score": 0.0,
"precision": 0.0,
"recall": 0.0,
"support": 40
},
"1": {
"f1-score": 0.918918918918919,
"precision": 0.9596774193548387,
"recall": 0.8814814814814815,
"support": 135
},
"10": {
"f1-score": 0.8544776119402986,
"precision": 0.9703389830508474,
"recall": 0.7633333333333333,
"support": 300
},
"11": {
"f1-score": 0.7470355731225297,
"precision": 0.8552036199095022,
"recall": 0.6631578947368421,
"support": 285
},
"12": {
"f1-score": 0.781431334622824,
"precision": 0.8347107438016529,
"recall": 0.7345454545454545,
"support": 275
},
"2": {
"f1-score": 0.0,
"precision": 0.0,
"recall": 0.0,
"support": 86
},
"3": {
"f1-score": 0.7650273224043715,
"precision": 0.8936170212765957,
"recall": 0.6687898089171974,
"support": 314
},
"4": {
"f1-score": 0.8625592417061612,
"precision": 0.9381443298969072,
"recall": 0.7982456140350878,
"support": 798
},
"5": {
"f1-score": 0.867283950617284,
"precision": 0.8920634920634921,
"recall": 0.8438438438438438,
"support": 333
},
"6": {
"f1-score": 0.851138353765324,
"precision": 0.972,
"recall": 0.7570093457943925,
"support": 321
},
"7": {
"f1-score": 0.6850152905198778,
"precision": 0.875,
"recall": 0.5628140703517588,
"support": 199
},
"8": {
"f1-score": 0.949977467327625,
"precision": 0.9221347331583553,
"recall": 0.9795539033457249,
"support": 1076
},
"9": {
"f1-score": 0.7762039660056657,
"precision": 0.8616352201257862,
"recall": 0.7061855670103093,
"support": 194
},
"macro avg": {
"f1-score": 0.6968514639192984,
"precision": 0.7672711971259983,
"recall": 0.6429969474919558,
"support": 4356
},
"micro avg": {
"f1-score": 0.8439663699307616,
"precision": 0.9145230439442658,
"recall": 0.7835169880624426,
"support": 4356
},
"samples avg": {
"f1-score": 0.8340509694572336,
"precision": 0.9041836889090633,
"recall": 0.8090482675139962,
"support": 4356
},
"weighted avg": {
"f1-score": 0.8282450140705083,
"precision": 0.8874517679353394,
"recall": 0.7835169880624426,
"support": 4356
}
},
"eval_roc_auc": 0.8851901128592079,
"eval_runtime": 25.8631,
"eval_samples_per_second": 85.179,
"eval_steps_per_second": 5.336,
"step": 1653
},
{
"epoch": 3.63,
"learning_rate": 1.2740471869328494e-05,
"loss": 0.1208,
"step": 2000
},
{
"epoch": 4.0,
"eval_accuracy": 0.655015887426237,
"eval_f1": 0.8709677419354839,
"eval_loss": 0.12088670581579208,
"eval_report": {
"0": {
"f1-score": 0.0,
"precision": 0.0,
"recall": 0.0,
"support": 40
},
"1": {
"f1-score": 0.930909090909091,
"precision": 0.9142857142857143,
"recall": 0.9481481481481482,
"support": 135
},
"10": {
"f1-score": 0.838095238095238,
"precision": 0.9777777777777777,
"recall": 0.7333333333333333,
"support": 300
},
"11": {
"f1-score": 0.7837837837837837,
"precision": 0.871244635193133,
"recall": 0.712280701754386,
"support": 285
},
"12": {
"f1-score": 0.8265682656826568,
"precision": 0.8389513108614233,
"recall": 0.8145454545454546,
"support": 275
},
"2": {
"f1-score": 0.4615384615384615,
"precision": 0.8709677419354839,
"recall": 0.313953488372093,
"support": 86
},
"3": {
"f1-score": 0.8124999999999999,
"precision": 0.8931297709923665,
"recall": 0.7452229299363057,
"support": 314
},
"4": {
"f1-score": 0.8861538461538461,
"precision": 0.8706166868198307,
"recall": 0.9022556390977443,
"support": 798
},
"5": {
"f1-score": 0.8738461538461537,
"precision": 0.8958990536277602,
"recall": 0.8528528528528528,
"support": 333
},
"6": {
"f1-score": 0.8980263157894736,
"precision": 0.9512195121951219,
"recall": 0.8504672897196262,
"support": 321
},
"7": {
"f1-score": 0.7804878048780488,
"precision": 0.8470588235294118,
"recall": 0.7236180904522613,
"support": 199
},
"8": {
"f1-score": 0.9590163934426229,
"precision": 0.9401785714285714,
"recall": 0.9786245353159851,
"support": 1076
},
"9": {
"f1-score": 0.8286445012787723,
"precision": 0.8223350253807107,
"recall": 0.8350515463917526,
"support": 194
},
"macro avg": {
"f1-score": 0.7599669119537038,
"precision": 0.8225895864636388,
"recall": 0.7238733853784572,
"support": 4356
},
"micro avg": {
"f1-score": 0.8709677419354839,
"precision": 0.900883218842002,
"recall": 0.8429752066115702,
"support": 4356
},
"samples avg": {
"f1-score": 0.8697403972937336,
"precision": 0.9097442880919957,
"recall": 0.8644651233166893,
"support": 4356
},
"weighted avg": {
"f1-score": 0.8624855347630281,
"precision": 0.8928562943515039,
"recall": 0.8429752066115702,
"support": 4356
}
},
"eval_roc_auc": 0.913169026523674,
"eval_runtime": 25.8665,
"eval_samples_per_second": 85.168,
"eval_steps_per_second": 5.335,
"step": 2204
},
{
"epoch": 4.54,
"learning_rate": 1.0925589836660618e-05,
"loss": 0.0971,
"step": 2500
},
{
"epoch": 5.0,
"eval_accuracy": 0.6631865637766682,
"eval_f1": 0.876908396946565,
"eval_loss": 0.11281398683786392,
"eval_report": {
"0": {
"f1-score": 0.0,
"precision": 0.0,
"recall": 0.0,
"support": 40
},
"1": {
"f1-score": 0.9283018867924527,
"precision": 0.9461538461538461,
"recall": 0.9111111111111111,
"support": 135
},
"10": {
"f1-score": 0.8904347826086957,
"precision": 0.9309090909090909,
"recall": 0.8533333333333334,
"support": 300
},
"11": {
"f1-score": 0.8158844765342961,
"precision": 0.8401486988847584,
"recall": 0.7929824561403509,
"support": 285
},
"12": {
"f1-score": 0.8304761904761904,
"precision": 0.872,
"recall": 0.7927272727272727,
"support": 275
},
"2": {
"f1-score": 0.4786324786324786,
"precision": 0.9032258064516129,
"recall": 0.32558139534883723,
"support": 86
},
"3": {
"f1-score": 0.7977736549165121,
"precision": 0.9555555555555556,
"recall": 0.6847133757961783,
"support": 314
},
"4": {
"f1-score": 0.8926767676767676,
"precision": 0.8994910941475827,
"recall": 0.8859649122807017,
"support": 798
},
"5": {
"f1-score": 0.8780487804878049,
"precision": 0.891640866873065,
"recall": 0.8648648648648649,
"support": 333
},
"6": {
"f1-score": 0.9051580698835274,
"precision": 0.9714285714285714,
"recall": 0.8473520249221184,
"support": 321
},
"7": {
"f1-score": 0.7757255936675462,
"precision": 0.8166666666666667,
"recall": 0.7386934673366834,
"support": 199
},
"8": {
"f1-score": 0.9562413634269923,
"precision": 0.947945205479452,
"recall": 0.9646840148698885,
"support": 1076
},
"9": {
"f1-score": 0.835978835978836,
"precision": 0.8586956521739131,
"recall": 0.8144329896907216,
"support": 194
},
"macro avg": {
"f1-score": 0.7681025293140078,
"precision": 0.8333739272864704,
"recall": 0.7289570168016971,
"support": 4356
},
"micro avg": {
"f1-score": 0.876908396946565,
"precision": 0.9126117179741807,
"recall": 0.8438934802571166,
"support": 4356
},
"samples avg": {
"f1-score": 0.8725850031342542,
"precision": 0.9159101225601453,
"recall": 0.8631411711302769,
"support": 4356
},
"weighted avg": {
"f1-score": 0.86909769922114,
"precision": 0.904407547519813,
"recall": 0.8438934802571166,
"support": 4356
}
},
"eval_roc_auc": 0.9146988712490953,
"eval_runtime": 25.8749,
"eval_samples_per_second": 85.14,
"eval_steps_per_second": 5.333,
"step": 2755
},
{
"epoch": 5.44,
"learning_rate": 9.110707803992742e-06,
"loss": 0.0811,
"step": 3000
},
{
"epoch": 6.0,
"eval_accuracy": 0.6867907399001362,
"eval_f1": 0.8865256515133809,
"eval_loss": 0.1077384203672409,
"eval_report": {
"0": {
"f1-score": 0.0,
"precision": 0.0,
"recall": 0.0,
"support": 40
},
"1": {
"f1-score": 0.9407407407407408,
"precision": 0.9407407407407408,
"recall": 0.9407407407407408,
"support": 135
},
"10": {
"f1-score": 0.8853046594982079,
"precision": 0.9573643410852714,
"recall": 0.8233333333333334,
"support": 300
},
"11": {
"f1-score": 0.8208695652173912,
"precision": 0.8137931034482758,
"recall": 0.8280701754385965,
"support": 285
},
"12": {
"f1-score": 0.8451730418943533,
"precision": 0.8467153284671532,
"recall": 0.8436363636363636,
"support": 275
},
"2": {
"f1-score": 0.5625000000000001,
"precision": 0.8571428571428571,
"recall": 0.4186046511627907,
"support": 86
},
"3": {
"f1-score": 0.8489932885906041,
"precision": 0.8971631205673759,
"recall": 0.8057324840764332,
"support": 314
},
"4": {
"f1-score": 0.9015479876160991,
"precision": 0.8910648714810282,
"recall": 0.9122807017543859,
"support": 798
},
"5": {
"f1-score": 0.895148669796557,
"precision": 0.934640522875817,
"recall": 0.8588588588588588,
"support": 333
},
"6": {
"f1-score": 0.8978224455611391,
"precision": 0.9710144927536232,
"recall": 0.8348909657320872,
"support": 321
},
"7": {
"f1-score": 0.8133971291866029,
"precision": 0.776255707762557,
"recall": 0.8542713567839196,
"support": 199
},
"8": {
"f1-score": 0.9545663148233136,
"precision": 0.942883046237534,
"recall": 0.966542750929368,
"support": 1076
},
"9": {
"f1-score": 0.8651399491094148,
"precision": 0.8542713567839196,
"recall": 0.8762886597938144,
"support": 194
},
"macro avg": {
"f1-score": 0.7870156763103403,
"precision": 0.8217730376420119,
"recall": 0.7664039263262072,
"support": 4356
},
"micro avg": {
"f1-score": 0.8865256515133809,
"precision": 0.9028802666031898,
"recall": 0.870752984389348,
"support": 4356
},
"samples avg": {
"f1-score": 0.8854851609277392,
"precision": 0.9150022696323196,
"recall": 0.8869723104857014,
"support": 4356
},
"weighted avg": {
"f1-score": 0.8807295782472653,
"precision": 0.8960415422991472,
"recall": 0.870752984389348,
"support": 4356
}
},
"eval_roc_auc": 0.9269755532662054,
"eval_runtime": 25.8985,
"eval_samples_per_second": 85.063,
"eval_steps_per_second": 5.329,
"step": 3306
},
{
"epoch": 6.35,
"learning_rate": 7.295825771324865e-06,
"loss": 0.0692,
"step": 3500
},
{
"epoch": 7.0,
"eval_accuracy": 0.672719019518838,
"eval_f1": 0.8813199764289925,
"eval_loss": 0.10911860316991806,
"eval_report": {
"0": {
"f1-score": 0.04878048780487806,
"precision": 1.0,
"recall": 0.025,
"support": 40
},
"1": {
"f1-score": 0.9338235294117647,
"precision": 0.927007299270073,
"recall": 0.9407407407407408,
"support": 135
},
"10": {
"f1-score": 0.877005347593583,
"precision": 0.9425287356321839,
"recall": 0.82,
"support": 300
},
"11": {
"f1-score": 0.808193668528864,
"precision": 0.8611111111111112,
"recall": 0.7614035087719299,
"support": 285
},
"12": {
"f1-score": 0.850187265917603,
"precision": 0.8764478764478765,
"recall": 0.8254545454545454,
"support": 275
},
"2": {
"f1-score": 0.5736434108527131,
"precision": 0.8604651162790697,
"recall": 0.43023255813953487,
"support": 86
},
"3": {
"f1-score": 0.8585690515806988,
"precision": 0.8989547038327527,
"recall": 0.821656050955414,
"support": 314
},
"4": {
"f1-score": 0.8974668275030157,
"precision": 0.8651162790697674,
"recall": 0.9323308270676691,
"support": 798
},
"5": {
"f1-score": 0.8680445151033386,
"precision": 0.9222972972972973,
"recall": 0.8198198198198198,
"support": 333
},
"6": {
"f1-score": 0.9030100334448161,
"precision": 0.9747292418772563,
"recall": 0.8411214953271028,
"support": 321
},
"7": {
"f1-score": 0.7885117493472584,
"precision": 0.8206521739130435,
"recall": 0.7587939698492462,
"support": 199
},
"8": {
"f1-score": 0.9535095715587968,
"precision": 0.9355992844364938,
"recall": 0.9721189591078067,
"support": 1076
},
"9": {
"f1-score": 0.8160919540229885,
"precision": 0.922077922077922,
"recall": 0.7319587628865979,
"support": 194
},
"macro avg": {
"f1-score": 0.782833647128486,
"precision": 0.9082297724034496,
"recall": 0.7446639413938775,
"support": 4356
},
"micro avg": {
"f1-score": 0.8813199764289925,
"precision": 0.905546137079196,
"recall": 0.858356290174472,
"support": 4356
},
"samples avg": {
"f1-score": 0.8788772885459222,
"precision": 0.9134513542139506,
"recall": 0.8763428657890756,
"support": 4356
},
"weighted avg": {
"f1-score": 0.8747693430346722,
"precision": 0.9067699317424669,
"recall": 0.858356290174472,
"support": 4356
}
},
"eval_roc_auc": 0.9211478358173765,
"eval_runtime": 25.9101,
"eval_samples_per_second": 85.025,
"eval_steps_per_second": 5.326,
"step": 3857
},
{
"epoch": 7.26,
"learning_rate": 5.480943738656987e-06,
"loss": 0.0612,
"step": 4000
},
{
"epoch": 8.0,
"eval_accuracy": 0.6967771221062188,
"eval_f1": 0.8906778672266946,
"eval_loss": 0.10351744294166565,
"eval_report": {
"0": {
"f1-score": 0.2608695652173913,
"precision": 1.0,
"recall": 0.15,
"support": 40
},
"1": {
"f1-score": 0.9343065693430658,
"precision": 0.920863309352518,
"recall": 0.9481481481481482,
"support": 135
},
"10": {
"f1-score": 0.8846153846153848,
"precision": 0.9301470588235294,
"recall": 0.8433333333333334,
"support": 300
},
"11": {
"f1-score": 0.807899461400359,
"precision": 0.8272058823529411,
"recall": 0.7894736842105263,
"support": 285
},
"12": {
"f1-score": 0.8566243194192378,
"precision": 0.855072463768116,
"recall": 0.8581818181818182,
"support": 275
},
"2": {
"f1-score": 0.6174496644295302,
"precision": 0.7301587301587301,
"recall": 0.5348837209302325,
"support": 86
},
"3": {
"f1-score": 0.8707037643207856,
"precision": 0.8956228956228957,
"recall": 0.8471337579617835,
"support": 314
},
"4": {
"f1-score": 0.9031446540880502,
"precision": 0.9065656565656566,
"recall": 0.899749373433584,
"support": 798
},
"5": {
"f1-score": 0.8973966309341501,
"precision": 0.915625,
"recall": 0.8798798798798799,
"support": 333
},
"6": {
"f1-score": 0.9210526315789473,
"precision": 0.975609756097561,
"recall": 0.8722741433021807,
"support": 321
},
"7": {
"f1-score": 0.8070175438596492,
"precision": 0.805,
"recall": 0.8090452261306532,
"support": 199
},
"8": {
"f1-score": 0.9565614997713763,
"precision": 0.9414941494149415,
"recall": 0.9721189591078067,
"support": 1076
},
"9": {
"f1-score": 0.8502673796791443,
"precision": 0.8833333333333333,
"recall": 0.8195876288659794,
"support": 194
},
"macro avg": {
"f1-score": 0.8129160822043902,
"precision": 0.8912844796530941,
"recall": 0.7864468979604557,
"support": 4356
},
"micro avg": {
"f1-score": 0.8906778672266946,
"precision": 0.9055753262158956,
"recall": 0.8762626262626263,
"support": 4356
},
"samples avg": {
"f1-score": 0.8899876791388366,
"precision": 0.9160992585867755,
"recall": 0.8930624905431986,
"support": 4356
},
"weighted avg": {
"f1-score": 0.8871176344746756,
"precision": 0.9055099014048587,
"recall": 0.8762626262626263,
"support": 4356
}
},
"eval_roc_auc": 0.9299362795687385,
"eval_runtime": 25.9048,
"eval_samples_per_second": 85.042,
"eval_steps_per_second": 5.327,
"step": 4408
},
{
"epoch": 8.17,
"learning_rate": 3.666061705989111e-06,
"loss": 0.0539,
"step": 4500
},
{
"epoch": 9.0,
"eval_accuracy": 0.699046754425783,
"eval_f1": 0.8925369658865993,
"eval_loss": 0.10284219682216644,
"eval_report": {
"0": {
"f1-score": 0.18181818181818182,
"precision": 1.0,
"recall": 0.1,
"support": 40
},
"1": {
"f1-score": 0.9477611940298507,
"precision": 0.9548872180451128,
"recall": 0.9407407407407408,
"support": 135
},
"10": {
"f1-score": 0.8865619546247819,
"precision": 0.9304029304029304,
"recall": 0.8466666666666667,
"support": 300
},
"11": {
"f1-score": 0.8136200716845878,
"precision": 0.8315018315018315,
"recall": 0.7964912280701755,
"support": 285
},
"12": {
"f1-score": 0.855072463768116,
"precision": 0.851985559566787,
"recall": 0.8581818181818182,
"support": 275
},
"2": {
"f1-score": 0.5985401459854015,
"precision": 0.803921568627451,
"recall": 0.47674418604651164,
"support": 86
},
"3": {
"f1-score": 0.8760330578512396,
"precision": 0.9106529209621993,
"recall": 0.8439490445859873,
"support": 314
},
"4": {
"f1-score": 0.9055214723926379,
"precision": 0.8870192307692307,
"recall": 0.924812030075188,
"support": 798
},
"5": {
"f1-score": 0.8905775075987841,
"precision": 0.9015384615384615,
"recall": 0.8798798798798799,
"support": 333
},
"6": {
"f1-score": 0.9153094462540716,
"precision": 0.9590443686006825,
"recall": 0.8753894080996885,
"support": 321
},
"7": {
"f1-score": 0.8170426065162906,
"precision": 0.815,
"recall": 0.8190954773869347,
"support": 199
},
"8": {
"f1-score": 0.9581993569131833,
"precision": 0.9473206176203451,
"recall": 0.9693308550185874,
"support": 1076
},
"9": {
"f1-score": 0.8609625668449198,
"precision": 0.8944444444444445,
"recall": 0.8298969072164949,
"support": 194
},
"macro avg": {
"f1-score": 0.8082323097140035,
"precision": 0.8990553193907289,
"recall": 0.7816290955360519,
"support": 4356
},
"micro avg": {
"f1-score": 0.8925369658865993,
"precision": 0.9055043704228679,
"recall": 0.8799357208448118,
"support": 4356
},
"samples avg": {
"f1-score": 0.8913213583209044,
"precision": 0.916288394613406,
"recall": 0.8957482221213496,
"support": 4356
},
"weighted avg": {
"f1-score": 0.8880597009850972,
"precision": 0.9057204039138281,
"recall": 0.8799357208448118,
"support": 4356
}
},
"eval_roc_auc": 0.9317316457866525,
"eval_runtime": 25.9692,
"eval_samples_per_second": 84.831,
"eval_steps_per_second": 5.314,
"step": 4959
},
{
"epoch": 9.07,
"learning_rate": 1.8511796733212343e-06,
"loss": 0.0498,
"step": 5000
},
{
"epoch": 9.98,
"learning_rate": 3.629764065335753e-08,
"loss": 0.0468,
"step": 5500
},
{
"epoch": 10.0,
"eval_accuracy": 0.7031320926009986,
"eval_f1": 0.8937805730258561,
"eval_loss": 0.10207226872444153,
"eval_report": {
"0": {
"f1-score": 0.2978723404255319,
"precision": 1.0,
"recall": 0.175,
"support": 40
},
"1": {
"f1-score": 0.9477611940298507,
"precision": 0.9548872180451128,
"recall": 0.9407407407407408,
"support": 135
},
"10": {
"f1-score": 0.8885017421602788,
"precision": 0.9306569343065694,
"recall": 0.85,
"support": 300
},
"11": {
"f1-score": 0.8158844765342961,
"precision": 0.8401486988847584,
"recall": 0.7929824561403509,
"support": 285
},
"12": {
"f1-score": 0.8534798534798536,
"precision": 0.8597785977859779,
"recall": 0.8472727272727273,
"support": 275
},
"2": {
"f1-score": 0.6482758620689655,
"precision": 0.7966101694915254,
"recall": 0.5465116279069767,
"support": 86
},
"3": {
"f1-score": 0.8794788273615636,
"precision": 0.9,
"recall": 0.8598726114649682,
"support": 314
},
"4": {
"f1-score": 0.9057301293900184,
"precision": 0.8909090909090909,
"recall": 0.9210526315789473,
"support": 798
},
"5": {
"f1-score": 0.8895705521472392,
"precision": 0.9090909090909091,
"recall": 0.8708708708708709,
"support": 333
},
"6": {
"f1-score": 0.9200652528548124,
"precision": 0.9657534246575342,
"recall": 0.8785046728971962,
"support": 321
},
"7": {
"f1-score": 0.8070175438596492,
"precision": 0.805,
"recall": 0.8090452261306532,
"support": 199
},
"8": {
"f1-score": 0.9576036866359448,
"precision": 0.9497257769652651,
"recall": 0.9656133828996283,
"support": 1076
},
"9": {
"f1-score": 0.8661417322834646,
"precision": 0.8823529411764706,
"recall": 0.8505154639175257,
"support": 194
},
"macro avg": {
"f1-score": 0.8213371687101131,
"precision": 0.8988395201010164,
"recall": 0.7929217239861989,
"support": 4356
},
"micro avg": {
"f1-score": 0.8937805730258561,
"precision": 0.9070921985815603,
"recall": 0.8808539944903582,
"support": 4356
},
"samples avg": {
"f1-score": 0.8926485528392021,
"precision": 0.9176123467998184,
"recall": 0.8967317294598275,
"support": 4356
},
"weighted avg": {
"f1-score": 0.8904741566354063,
"precision": 0.9072664844050249,
"recall": 0.8808539944903582,
"support": 4356
}
},
"eval_roc_auc": 0.9323349163655514,
"eval_runtime": 25.9424,
"eval_samples_per_second": 84.919,
"eval_steps_per_second": 5.319,
"step": 5510
}
],
"max_steps": 5510,
"num_train_epochs": 10,
"total_flos": 2.319816157052928e+16,
"trial_name": null,
"trial_params": null
}