{ "best_metric": 0.8937805730258561, "best_model_checkpoint": "umberto-commoncrawl-cased/checkpoint-5510", "epoch": 10.0, "global_step": 5510, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.91, "learning_rate": 1.8185117967332124e-05, "loss": 0.3388, "step": 500 }, { "epoch": 1.0, "eval_accuracy": 0.3091239219246482, "eval_f1": 0.6689956331877728, "eval_loss": 0.23511561751365662, "eval_report": { "0": { "f1-score": 0.0, "precision": 0.0, "recall": 0.0, "support": 40 }, "1": { "f1-score": 0.0, "precision": 0.0, "recall": 0.0, "support": 135 }, "10": { "f1-score": 0.7397260273972603, "precision": 0.8957345971563981, "recall": 0.63, "support": 300 }, "11": { "f1-score": 0.0, "precision": 0.0, "recall": 0.0, "support": 285 }, "12": { "f1-score": 0.16611295681063123, "precision": 0.9615384615384616, "recall": 0.09090909090909091, "support": 275 }, "2": { "f1-score": 0.0, "precision": 0.0, "recall": 0.0, "support": 86 }, "3": { "f1-score": 0.6111111111111112, "precision": 0.9285714285714286, "recall": 0.4554140127388535, "support": 314 }, "4": { "f1-score": 0.8102429415627053, "precision": 0.8510344827586207, "recall": 0.7731829573934837, "support": 798 }, "5": { "f1-score": 0.8079470198675497, "precision": 0.9003690036900369, "recall": 0.7327327327327328, "support": 333 }, "6": { "f1-score": 0.38190954773869346, "precision": 0.987012987012987, "recall": 0.2367601246105919, "support": 321 }, "7": { "f1-score": 0.0, "precision": 0.0, "recall": 0.0, "support": 199 }, "8": { "f1-score": 0.9444967074317967, "precision": 0.9561904761904761, "recall": 0.9330855018587361, "support": 1076 }, "9": { "f1-score": 0.0, "precision": 0.0, "recall": 0.0, "support": 194 }, "macro avg": { "f1-score": 0.34319587014767294, "precision": 0.4984962643783391, "recall": 0.29631418617257604, "support": 4356 }, "micro avg": { "f1-score": 0.6689956331877728, "precision": 0.9140811455847255, "recall": 0.5275482093663911, "support": 4356 }, "samples avg": { "f1-score": 0.5890755031018308, "precision": 0.7131941292177334, "recall": 0.5347253744893328, "support": 4356 }, "weighted avg": { "f1-score": 0.5771302587774695, "precision": 0.7229925163736703, "recall": 0.5275482093663911, "support": 4356 } }, "eval_roc_auc": 0.7593265487798887, "eval_runtime": 25.8816, "eval_samples_per_second": 85.119, "eval_steps_per_second": 5.332, "step": 551 }, { "epoch": 1.81, "learning_rate": 1.637023593466425e-05, "loss": 0.2063, "step": 1000 }, { "epoch": 2.0, "eval_accuracy": 0.5206536541080345, "eval_f1": 0.8021708231037601, "eval_loss": 0.17003820836544037, "eval_report": { "0": { "f1-score": 0.0, "precision": 0.0, "recall": 0.0, "support": 40 }, "1": { "f1-score": 0.8755020080321286, "precision": 0.956140350877193, "recall": 0.8074074074074075, "support": 135 }, "10": { "f1-score": 0.7489711934156379, "precision": 0.978494623655914, "recall": 0.6066666666666667, "support": 300 }, "11": { "f1-score": 0.7182539682539681, "precision": 0.8264840182648402, "recall": 0.6350877192982456, "support": 285 }, "12": { "f1-score": 0.7465069860279441, "precision": 0.827433628318584, "recall": 0.68, "support": 275 }, "2": { "f1-score": 0.0, "precision": 0.0, "recall": 0.0, "support": 86 }, "3": { "f1-score": 0.6543209876543209, "precision": 0.9244186046511628, "recall": 0.5063694267515924, "support": 314 }, "4": { "f1-score": 0.8340136054421768, "precision": 0.9122023809523809, "recall": 0.768170426065163, "support": 798 }, "5": { "f1-score": 0.8135593220338982, "precision": 0.933852140077821, "recall": 0.7207207207207207, "support": 333 }, "6": { "f1-score": 0.8043875685557588, "precision": 0.9734513274336283, "recall": 0.6853582554517134, "support": 321 }, "7": { "f1-score": 0.5405405405405406, "precision": 0.8247422680412371, "recall": 0.4020100502512563, "support": 199 }, "8": { "f1-score": 0.9505316689782709, "precision": 0.9457221711131555, "recall": 0.9553903345724907, "support": 1076 }, "9": { "f1-score": 0.6542056074766355, "precision": 0.8267716535433071, "recall": 0.5412371134020618, "support": 194 }, "macro avg": { "f1-score": 0.6415994966470216, "precision": 0.7638240897637865, "recall": 0.5621860092759475, "support": 4356 }, "micro avg": { "f1-score": 0.8021708231037601, "precision": 0.9175288205734555, "recall": 0.7125803489439853, "support": 4356 }, "samples avg": { "f1-score": 0.7855154226920001, "precision": 0.884627023755485, "recall": 0.7412240883643516, "support": 4356 }, "weighted avg": { "f1-score": 0.7828867707685374, "precision": 0.8883125749118967, "recall": 0.7125803489439853, "support": 4356 } }, "eval_roc_auc": 0.8505454147635545, "eval_runtime": 25.8749, "eval_samples_per_second": 85.141, "eval_steps_per_second": 5.333, "step": 1102 }, { "epoch": 2.72, "learning_rate": 1.4555353901996372e-05, "loss": 0.1508, "step": 1500 }, { "epoch": 3.0, "eval_accuracy": 0.5969133000453927, "eval_f1": 0.8439663699307616, "eval_loss": 0.13934455811977386, "eval_report": { "0": { "f1-score": 0.0, "precision": 0.0, "recall": 0.0, "support": 40 }, "1": { "f1-score": 0.918918918918919, "precision": 0.9596774193548387, "recall": 0.8814814814814815, "support": 135 }, "10": { "f1-score": 0.8544776119402986, "precision": 0.9703389830508474, "recall": 0.7633333333333333, "support": 300 }, "11": { "f1-score": 0.7470355731225297, "precision": 0.8552036199095022, "recall": 0.6631578947368421, "support": 285 }, "12": { "f1-score": 0.781431334622824, "precision": 0.8347107438016529, "recall": 0.7345454545454545, "support": 275 }, "2": { "f1-score": 0.0, "precision": 0.0, "recall": 0.0, "support": 86 }, "3": { "f1-score": 0.7650273224043715, "precision": 0.8936170212765957, "recall": 0.6687898089171974, "support": 314 }, "4": { "f1-score": 0.8625592417061612, "precision": 0.9381443298969072, "recall": 0.7982456140350878, "support": 798 }, "5": { "f1-score": 0.867283950617284, "precision": 0.8920634920634921, "recall": 0.8438438438438438, "support": 333 }, "6": { "f1-score": 0.851138353765324, "precision": 0.972, "recall": 0.7570093457943925, "support": 321 }, "7": { "f1-score": 0.6850152905198778, "precision": 0.875, "recall": 0.5628140703517588, "support": 199 }, "8": { "f1-score": 0.949977467327625, "precision": 0.9221347331583553, "recall": 0.9795539033457249, "support": 1076 }, "9": { "f1-score": 0.7762039660056657, "precision": 0.8616352201257862, "recall": 0.7061855670103093, "support": 194 }, "macro avg": { "f1-score": 0.6968514639192984, "precision": 0.7672711971259983, "recall": 0.6429969474919558, "support": 4356 }, "micro avg": { "f1-score": 0.8439663699307616, "precision": 0.9145230439442658, "recall": 0.7835169880624426, "support": 4356 }, "samples avg": { "f1-score": 0.8340509694572336, "precision": 0.9041836889090633, "recall": 0.8090482675139962, "support": 4356 }, "weighted avg": { "f1-score": 0.8282450140705083, "precision": 0.8874517679353394, "recall": 0.7835169880624426, "support": 4356 } }, "eval_roc_auc": 0.8851901128592079, "eval_runtime": 25.8631, "eval_samples_per_second": 85.179, "eval_steps_per_second": 5.336, "step": 1653 }, { "epoch": 3.63, "learning_rate": 1.2740471869328494e-05, "loss": 0.1208, "step": 2000 }, { "epoch": 4.0, "eval_accuracy": 0.655015887426237, "eval_f1": 0.8709677419354839, "eval_loss": 0.12088670581579208, "eval_report": { "0": { "f1-score": 0.0, "precision": 0.0, "recall": 0.0, "support": 40 }, "1": { "f1-score": 0.930909090909091, "precision": 0.9142857142857143, "recall": 0.9481481481481482, "support": 135 }, "10": { "f1-score": 0.838095238095238, "precision": 0.9777777777777777, "recall": 0.7333333333333333, "support": 300 }, "11": { "f1-score": 0.7837837837837837, "precision": 0.871244635193133, "recall": 0.712280701754386, "support": 285 }, "12": { "f1-score": 0.8265682656826568, "precision": 0.8389513108614233, "recall": 0.8145454545454546, "support": 275 }, "2": { "f1-score": 0.4615384615384615, "precision": 0.8709677419354839, "recall": 0.313953488372093, "support": 86 }, "3": { "f1-score": 0.8124999999999999, "precision": 0.8931297709923665, "recall": 0.7452229299363057, "support": 314 }, "4": { "f1-score": 0.8861538461538461, "precision": 0.8706166868198307, "recall": 0.9022556390977443, "support": 798 }, "5": { "f1-score": 0.8738461538461537, "precision": 0.8958990536277602, "recall": 0.8528528528528528, "support": 333 }, "6": { "f1-score": 0.8980263157894736, "precision": 0.9512195121951219, "recall": 0.8504672897196262, "support": 321 }, "7": { "f1-score": 0.7804878048780488, "precision": 0.8470588235294118, "recall": 0.7236180904522613, "support": 199 }, "8": { "f1-score": 0.9590163934426229, "precision": 0.9401785714285714, "recall": 0.9786245353159851, "support": 1076 }, "9": { "f1-score": 0.8286445012787723, "precision": 0.8223350253807107, "recall": 0.8350515463917526, "support": 194 }, "macro avg": { "f1-score": 0.7599669119537038, "precision": 0.8225895864636388, "recall": 0.7238733853784572, "support": 4356 }, "micro avg": { "f1-score": 0.8709677419354839, "precision": 0.900883218842002, "recall": 0.8429752066115702, "support": 4356 }, "samples avg": { "f1-score": 0.8697403972937336, "precision": 0.9097442880919957, "recall": 0.8644651233166893, "support": 4356 }, "weighted avg": { "f1-score": 0.8624855347630281, "precision": 0.8928562943515039, "recall": 0.8429752066115702, "support": 4356 } }, "eval_roc_auc": 0.913169026523674, "eval_runtime": 25.8665, "eval_samples_per_second": 85.168, "eval_steps_per_second": 5.335, "step": 2204 }, { "epoch": 4.54, "learning_rate": 1.0925589836660618e-05, "loss": 0.0971, "step": 2500 }, { "epoch": 5.0, "eval_accuracy": 0.6631865637766682, "eval_f1": 0.876908396946565, "eval_loss": 0.11281398683786392, "eval_report": { "0": { "f1-score": 0.0, "precision": 0.0, "recall": 0.0, "support": 40 }, "1": { "f1-score": 0.9283018867924527, "precision": 0.9461538461538461, "recall": 0.9111111111111111, "support": 135 }, "10": { "f1-score": 0.8904347826086957, "precision": 0.9309090909090909, "recall": 0.8533333333333334, "support": 300 }, "11": { "f1-score": 0.8158844765342961, "precision": 0.8401486988847584, "recall": 0.7929824561403509, "support": 285 }, "12": { "f1-score": 0.8304761904761904, "precision": 0.872, "recall": 0.7927272727272727, "support": 275 }, "2": { "f1-score": 0.4786324786324786, "precision": 0.9032258064516129, "recall": 0.32558139534883723, "support": 86 }, "3": { "f1-score": 0.7977736549165121, "precision": 0.9555555555555556, "recall": 0.6847133757961783, "support": 314 }, "4": { "f1-score": 0.8926767676767676, "precision": 0.8994910941475827, "recall": 0.8859649122807017, "support": 798 }, "5": { "f1-score": 0.8780487804878049, "precision": 0.891640866873065, "recall": 0.8648648648648649, "support": 333 }, "6": { "f1-score": 0.9051580698835274, "precision": 0.9714285714285714, "recall": 0.8473520249221184, "support": 321 }, "7": { "f1-score": 0.7757255936675462, "precision": 0.8166666666666667, "recall": 0.7386934673366834, "support": 199 }, "8": { "f1-score": 0.9562413634269923, "precision": 0.947945205479452, "recall": 0.9646840148698885, "support": 1076 }, "9": { "f1-score": 0.835978835978836, "precision": 0.8586956521739131, "recall": 0.8144329896907216, "support": 194 }, "macro avg": { "f1-score": 0.7681025293140078, "precision": 0.8333739272864704, "recall": 0.7289570168016971, "support": 4356 }, "micro avg": { "f1-score": 0.876908396946565, "precision": 0.9126117179741807, "recall": 0.8438934802571166, "support": 4356 }, "samples avg": { "f1-score": 0.8725850031342542, "precision": 0.9159101225601453, "recall": 0.8631411711302769, "support": 4356 }, "weighted avg": { "f1-score": 0.86909769922114, "precision": 0.904407547519813, "recall": 0.8438934802571166, "support": 4356 } }, "eval_roc_auc": 0.9146988712490953, "eval_runtime": 25.8749, "eval_samples_per_second": 85.14, "eval_steps_per_second": 5.333, "step": 2755 }, { "epoch": 5.44, "learning_rate": 9.110707803992742e-06, "loss": 0.0811, "step": 3000 }, { "epoch": 6.0, "eval_accuracy": 0.6867907399001362, "eval_f1": 0.8865256515133809, "eval_loss": 0.1077384203672409, "eval_report": { "0": { "f1-score": 0.0, "precision": 0.0, "recall": 0.0, "support": 40 }, "1": { "f1-score": 0.9407407407407408, "precision": 0.9407407407407408, "recall": 0.9407407407407408, "support": 135 }, "10": { "f1-score": 0.8853046594982079, "precision": 0.9573643410852714, "recall": 0.8233333333333334, "support": 300 }, "11": { "f1-score": 0.8208695652173912, "precision": 0.8137931034482758, "recall": 0.8280701754385965, "support": 285 }, "12": { "f1-score": 0.8451730418943533, "precision": 0.8467153284671532, "recall": 0.8436363636363636, "support": 275 }, "2": { "f1-score": 0.5625000000000001, "precision": 0.8571428571428571, "recall": 0.4186046511627907, "support": 86 }, "3": { "f1-score": 0.8489932885906041, "precision": 0.8971631205673759, "recall": 0.8057324840764332, "support": 314 }, "4": { "f1-score": 0.9015479876160991, "precision": 0.8910648714810282, "recall": 0.9122807017543859, "support": 798 }, "5": { "f1-score": 0.895148669796557, "precision": 0.934640522875817, "recall": 0.8588588588588588, "support": 333 }, "6": { "f1-score": 0.8978224455611391, "precision": 0.9710144927536232, "recall": 0.8348909657320872, "support": 321 }, "7": { "f1-score": 0.8133971291866029, "precision": 0.776255707762557, "recall": 0.8542713567839196, "support": 199 }, "8": { "f1-score": 0.9545663148233136, "precision": 0.942883046237534, "recall": 0.966542750929368, "support": 1076 }, "9": { "f1-score": 0.8651399491094148, "precision": 0.8542713567839196, "recall": 0.8762886597938144, "support": 194 }, "macro avg": { "f1-score": 0.7870156763103403, "precision": 0.8217730376420119, "recall": 0.7664039263262072, "support": 4356 }, "micro avg": { "f1-score": 0.8865256515133809, "precision": 0.9028802666031898, "recall": 0.870752984389348, "support": 4356 }, "samples avg": { "f1-score": 0.8854851609277392, "precision": 0.9150022696323196, "recall": 0.8869723104857014, "support": 4356 }, "weighted avg": { "f1-score": 0.8807295782472653, "precision": 0.8960415422991472, "recall": 0.870752984389348, "support": 4356 } }, "eval_roc_auc": 0.9269755532662054, "eval_runtime": 25.8985, "eval_samples_per_second": 85.063, "eval_steps_per_second": 5.329, "step": 3306 }, { "epoch": 6.35, "learning_rate": 7.295825771324865e-06, "loss": 0.0692, "step": 3500 }, { "epoch": 7.0, "eval_accuracy": 0.672719019518838, "eval_f1": 0.8813199764289925, "eval_loss": 0.10911860316991806, "eval_report": { "0": { "f1-score": 0.04878048780487806, "precision": 1.0, "recall": 0.025, "support": 40 }, "1": { "f1-score": 0.9338235294117647, "precision": 0.927007299270073, "recall": 0.9407407407407408, "support": 135 }, "10": { "f1-score": 0.877005347593583, "precision": 0.9425287356321839, "recall": 0.82, "support": 300 }, "11": { "f1-score": 0.808193668528864, "precision": 0.8611111111111112, "recall": 0.7614035087719299, "support": 285 }, "12": { "f1-score": 0.850187265917603, "precision": 0.8764478764478765, "recall": 0.8254545454545454, "support": 275 }, "2": { "f1-score": 0.5736434108527131, "precision": 0.8604651162790697, "recall": 0.43023255813953487, "support": 86 }, "3": { "f1-score": 0.8585690515806988, "precision": 0.8989547038327527, "recall": 0.821656050955414, "support": 314 }, "4": { "f1-score": 0.8974668275030157, "precision": 0.8651162790697674, "recall": 0.9323308270676691, "support": 798 }, "5": { "f1-score": 0.8680445151033386, "precision": 0.9222972972972973, "recall": 0.8198198198198198, "support": 333 }, "6": { "f1-score": 0.9030100334448161, "precision": 0.9747292418772563, "recall": 0.8411214953271028, "support": 321 }, "7": { "f1-score": 0.7885117493472584, "precision": 0.8206521739130435, "recall": 0.7587939698492462, "support": 199 }, "8": { "f1-score": 0.9535095715587968, "precision": 0.9355992844364938, "recall": 0.9721189591078067, "support": 1076 }, "9": { "f1-score": 0.8160919540229885, "precision": 0.922077922077922, "recall": 0.7319587628865979, "support": 194 }, "macro avg": { "f1-score": 0.782833647128486, "precision": 0.9082297724034496, "recall": 0.7446639413938775, "support": 4356 }, "micro avg": { "f1-score": 0.8813199764289925, "precision": 0.905546137079196, "recall": 0.858356290174472, "support": 4356 }, "samples avg": { "f1-score": 0.8788772885459222, "precision": 0.9134513542139506, "recall": 0.8763428657890756, "support": 4356 }, "weighted avg": { "f1-score": 0.8747693430346722, "precision": 0.9067699317424669, "recall": 0.858356290174472, "support": 4356 } }, "eval_roc_auc": 0.9211478358173765, "eval_runtime": 25.9101, "eval_samples_per_second": 85.025, "eval_steps_per_second": 5.326, "step": 3857 }, { "epoch": 7.26, "learning_rate": 5.480943738656987e-06, "loss": 0.0612, "step": 4000 }, { "epoch": 8.0, "eval_accuracy": 0.6967771221062188, "eval_f1": 0.8906778672266946, "eval_loss": 0.10351744294166565, "eval_report": { "0": { "f1-score": 0.2608695652173913, "precision": 1.0, "recall": 0.15, "support": 40 }, "1": { "f1-score": 0.9343065693430658, "precision": 0.920863309352518, "recall": 0.9481481481481482, "support": 135 }, "10": { "f1-score": 0.8846153846153848, "precision": 0.9301470588235294, "recall": 0.8433333333333334, "support": 300 }, "11": { "f1-score": 0.807899461400359, "precision": 0.8272058823529411, "recall": 0.7894736842105263, "support": 285 }, "12": { "f1-score": 0.8566243194192378, "precision": 0.855072463768116, "recall": 0.8581818181818182, "support": 275 }, "2": { "f1-score": 0.6174496644295302, "precision": 0.7301587301587301, "recall": 0.5348837209302325, "support": 86 }, "3": { "f1-score": 0.8707037643207856, "precision": 0.8956228956228957, "recall": 0.8471337579617835, "support": 314 }, "4": { "f1-score": 0.9031446540880502, "precision": 0.9065656565656566, "recall": 0.899749373433584, "support": 798 }, "5": { "f1-score": 0.8973966309341501, "precision": 0.915625, "recall": 0.8798798798798799, "support": 333 }, "6": { "f1-score": 0.9210526315789473, "precision": 0.975609756097561, "recall": 0.8722741433021807, "support": 321 }, "7": { "f1-score": 0.8070175438596492, "precision": 0.805, "recall": 0.8090452261306532, "support": 199 }, "8": { "f1-score": 0.9565614997713763, "precision": 0.9414941494149415, "recall": 0.9721189591078067, "support": 1076 }, "9": { "f1-score": 0.8502673796791443, "precision": 0.8833333333333333, "recall": 0.8195876288659794, "support": 194 }, "macro avg": { "f1-score": 0.8129160822043902, "precision": 0.8912844796530941, "recall": 0.7864468979604557, "support": 4356 }, "micro avg": { "f1-score": 0.8906778672266946, "precision": 0.9055753262158956, "recall": 0.8762626262626263, "support": 4356 }, "samples avg": { "f1-score": 0.8899876791388366, "precision": 0.9160992585867755, "recall": 0.8930624905431986, "support": 4356 }, "weighted avg": { "f1-score": 0.8871176344746756, "precision": 0.9055099014048587, "recall": 0.8762626262626263, "support": 4356 } }, "eval_roc_auc": 0.9299362795687385, "eval_runtime": 25.9048, "eval_samples_per_second": 85.042, "eval_steps_per_second": 5.327, "step": 4408 }, { "epoch": 8.17, "learning_rate": 3.666061705989111e-06, "loss": 0.0539, "step": 4500 }, { "epoch": 9.0, "eval_accuracy": 0.699046754425783, "eval_f1": 0.8925369658865993, "eval_loss": 0.10284219682216644, "eval_report": { "0": { "f1-score": 0.18181818181818182, "precision": 1.0, "recall": 0.1, "support": 40 }, "1": { "f1-score": 0.9477611940298507, "precision": 0.9548872180451128, "recall": 0.9407407407407408, "support": 135 }, "10": { "f1-score": 0.8865619546247819, "precision": 0.9304029304029304, "recall": 0.8466666666666667, "support": 300 }, "11": { "f1-score": 0.8136200716845878, "precision": 0.8315018315018315, "recall": 0.7964912280701755, "support": 285 }, "12": { "f1-score": 0.855072463768116, "precision": 0.851985559566787, "recall": 0.8581818181818182, "support": 275 }, "2": { "f1-score": 0.5985401459854015, "precision": 0.803921568627451, "recall": 0.47674418604651164, "support": 86 }, "3": { "f1-score": 0.8760330578512396, "precision": 0.9106529209621993, "recall": 0.8439490445859873, "support": 314 }, "4": { "f1-score": 0.9055214723926379, "precision": 0.8870192307692307, "recall": 0.924812030075188, "support": 798 }, "5": { "f1-score": 0.8905775075987841, "precision": 0.9015384615384615, "recall": 0.8798798798798799, "support": 333 }, "6": { "f1-score": 0.9153094462540716, "precision": 0.9590443686006825, "recall": 0.8753894080996885, "support": 321 }, "7": { "f1-score": 0.8170426065162906, "precision": 0.815, "recall": 0.8190954773869347, "support": 199 }, "8": { "f1-score": 0.9581993569131833, "precision": 0.9473206176203451, "recall": 0.9693308550185874, "support": 1076 }, "9": { "f1-score": 0.8609625668449198, "precision": 0.8944444444444445, "recall": 0.8298969072164949, "support": 194 }, "macro avg": { "f1-score": 0.8082323097140035, "precision": 0.8990553193907289, "recall": 0.7816290955360519, "support": 4356 }, "micro avg": { "f1-score": 0.8925369658865993, "precision": 0.9055043704228679, "recall": 0.8799357208448118, "support": 4356 }, "samples avg": { "f1-score": 0.8913213583209044, "precision": 0.916288394613406, "recall": 0.8957482221213496, "support": 4356 }, "weighted avg": { "f1-score": 0.8880597009850972, "precision": 0.9057204039138281, "recall": 0.8799357208448118, "support": 4356 } }, "eval_roc_auc": 0.9317316457866525, "eval_runtime": 25.9692, "eval_samples_per_second": 84.831, "eval_steps_per_second": 5.314, "step": 4959 }, { "epoch": 9.07, "learning_rate": 1.8511796733212343e-06, "loss": 0.0498, "step": 5000 }, { "epoch": 9.98, "learning_rate": 3.629764065335753e-08, "loss": 0.0468, "step": 5500 }, { "epoch": 10.0, "eval_accuracy": 0.7031320926009986, "eval_f1": 0.8937805730258561, "eval_loss": 0.10207226872444153, "eval_report": { "0": { "f1-score": 0.2978723404255319, "precision": 1.0, "recall": 0.175, "support": 40 }, "1": { "f1-score": 0.9477611940298507, "precision": 0.9548872180451128, "recall": 0.9407407407407408, "support": 135 }, "10": { "f1-score": 0.8885017421602788, "precision": 0.9306569343065694, "recall": 0.85, "support": 300 }, "11": { "f1-score": 0.8158844765342961, "precision": 0.8401486988847584, "recall": 0.7929824561403509, "support": 285 }, "12": { "f1-score": 0.8534798534798536, "precision": 0.8597785977859779, "recall": 0.8472727272727273, "support": 275 }, "2": { "f1-score": 0.6482758620689655, "precision": 0.7966101694915254, "recall": 0.5465116279069767, "support": 86 }, "3": { "f1-score": 0.8794788273615636, "precision": 0.9, "recall": 0.8598726114649682, "support": 314 }, "4": { "f1-score": 0.9057301293900184, "precision": 0.8909090909090909, "recall": 0.9210526315789473, "support": 798 }, "5": { "f1-score": 0.8895705521472392, "precision": 0.9090909090909091, "recall": 0.8708708708708709, "support": 333 }, "6": { "f1-score": 0.9200652528548124, "precision": 0.9657534246575342, "recall": 0.8785046728971962, "support": 321 }, "7": { "f1-score": 0.8070175438596492, "precision": 0.805, "recall": 0.8090452261306532, "support": 199 }, "8": { "f1-score": 0.9576036866359448, "precision": 0.9497257769652651, "recall": 0.9656133828996283, "support": 1076 }, "9": { "f1-score": 0.8661417322834646, "precision": 0.8823529411764706, "recall": 0.8505154639175257, "support": 194 }, "macro avg": { "f1-score": 0.8213371687101131, "precision": 0.8988395201010164, "recall": 0.7929217239861989, "support": 4356 }, "micro avg": { "f1-score": 0.8937805730258561, "precision": 0.9070921985815603, "recall": 0.8808539944903582, "support": 4356 }, "samples avg": { "f1-score": 0.8926485528392021, "precision": 0.9176123467998184, "recall": 0.8967317294598275, "support": 4356 }, "weighted avg": { "f1-score": 0.8904741566354063, "precision": 0.9072664844050249, "recall": 0.8808539944903582, "support": 4356 } }, "eval_roc_auc": 0.9323349163655514, "eval_runtime": 25.9424, "eval_samples_per_second": 84.919, "eval_steps_per_second": 5.319, "step": 5510 } ], "max_steps": 5510, "num_train_epochs": 10, "total_flos": 2.319816157052928e+16, "trial_name": null, "trial_params": null }