|
{ |
|
"best_metric": 0.9160090191657272, |
|
"best_model_checkpoint": "swinv2-base-patch4-window12-192-22k-finetuned-lora-ISIC-2019/checkpoint-4875", |
|
"epoch": 99.2, |
|
"eval_steps": 500, |
|
"global_step": 6200, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.16, |
|
"learning_rate": 0.0009983870967741936, |
|
"loss": 1.4282, |
|
"step": 10 |
|
}, |
|
{ |
|
"epoch": 0.32, |
|
"learning_rate": 0.0009970967741935483, |
|
"loss": 1.1082, |
|
"step": 20 |
|
}, |
|
{ |
|
"epoch": 0.48, |
|
"learning_rate": 0.0009954838709677419, |
|
"loss": 1.0397, |
|
"step": 30 |
|
}, |
|
{ |
|
"epoch": 0.64, |
|
"learning_rate": 0.0009938709677419356, |
|
"loss": 0.9258, |
|
"step": 40 |
|
}, |
|
{ |
|
"epoch": 0.8, |
|
"learning_rate": 0.0009922580645161292, |
|
"loss": 0.8897, |
|
"step": 50 |
|
}, |
|
{ |
|
"epoch": 0.96, |
|
"learning_rate": 0.0009906451612903225, |
|
"loss": 0.8488, |
|
"step": 60 |
|
}, |
|
{ |
|
"epoch": 0.99, |
|
"step": 62, |
|
"train_accuracy": 0.718556119571348, |
|
"train_f1": 0.6867379798585972, |
|
"train_loss": 0.770628809928894, |
|
"train_precision": 0.708956589572109, |
|
"train_recall": 0.718556119571348, |
|
"train_runtime": 291.5866, |
|
"train_samples_per_second": 54.725, |
|
"train_steps_per_second": 0.857 |
|
}, |
|
{ |
|
"epoch": 0.99, |
|
"eval_accuracy": 0.7153325817361894, |
|
"eval_f1": 0.6823083139813236, |
|
"eval_loss": 0.7977813482284546, |
|
"eval_precision": 0.7199162830832594, |
|
"eval_recall": 0.7153325817361894, |
|
"eval_runtime": 49.2679, |
|
"eval_samples_per_second": 36.007, |
|
"eval_steps_per_second": 0.568, |
|
"step": 62 |
|
}, |
|
{ |
|
"epoch": 1.12, |
|
"learning_rate": 0.000989032258064516, |
|
"loss": 0.7836, |
|
"step": 70 |
|
}, |
|
{ |
|
"epoch": 1.28, |
|
"learning_rate": 0.0009874193548387096, |
|
"loss": 0.772, |
|
"step": 80 |
|
}, |
|
{ |
|
"epoch": 1.44, |
|
"learning_rate": 0.0009858064516129032, |
|
"loss": 0.8074, |
|
"step": 90 |
|
}, |
|
{ |
|
"epoch": 1.6, |
|
"learning_rate": 0.0009841935483870968, |
|
"loss": 0.7912, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 1.76, |
|
"learning_rate": 0.0009825806451612903, |
|
"loss": 0.7762, |
|
"step": 110 |
|
}, |
|
{ |
|
"epoch": 1.92, |
|
"learning_rate": 0.0009809677419354839, |
|
"loss": 0.7795, |
|
"step": 120 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"step": 125, |
|
"train_accuracy": 0.7600426145265401, |
|
"train_f1": 0.7540133314127565, |
|
"train_loss": 0.6639156937599182, |
|
"train_precision": 0.7611520386158022, |
|
"train_recall": 0.7600426145265401, |
|
"train_runtime": 254.6664, |
|
"train_samples_per_second": 62.658, |
|
"train_steps_per_second": 0.982 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_accuracy": 0.7497181510710259, |
|
"eval_f1": 0.7388896367994308, |
|
"eval_loss": 0.6961308717727661, |
|
"eval_precision": 0.7541740918352317, |
|
"eval_recall": 0.7497181510710259, |
|
"eval_runtime": 48.7662, |
|
"eval_samples_per_second": 36.378, |
|
"eval_steps_per_second": 0.574, |
|
"step": 125 |
|
}, |
|
{ |
|
"epoch": 2.08, |
|
"learning_rate": 0.0009793548387096774, |
|
"loss": 0.7586, |
|
"step": 130 |
|
}, |
|
{ |
|
"epoch": 2.24, |
|
"learning_rate": 0.000977741935483871, |
|
"loss": 0.705, |
|
"step": 140 |
|
}, |
|
{ |
|
"epoch": 2.4, |
|
"learning_rate": 0.0009761290322580644, |
|
"loss": 0.6983, |
|
"step": 150 |
|
}, |
|
{ |
|
"epoch": 2.56, |
|
"learning_rate": 0.0009745161290322581, |
|
"loss": 0.6913, |
|
"step": 160 |
|
}, |
|
{ |
|
"epoch": 2.72, |
|
"learning_rate": 0.0009729032258064517, |
|
"loss": 0.6849, |
|
"step": 170 |
|
}, |
|
{ |
|
"epoch": 2.88, |
|
"learning_rate": 0.0009714516129032258, |
|
"loss": 0.7169, |
|
"step": 180 |
|
}, |
|
{ |
|
"epoch": 2.99, |
|
"step": 187, |
|
"train_accuracy": 0.7776524409350128, |
|
"train_f1": 0.7639537137185656, |
|
"train_loss": 0.6073001027107239, |
|
"train_precision": 0.7743141490761454, |
|
"train_recall": 0.7776524409350128, |
|
"train_runtime": 256.1493, |
|
"train_samples_per_second": 62.296, |
|
"train_steps_per_second": 0.976 |
|
}, |
|
{ |
|
"epoch": 2.99, |
|
"eval_accuracy": 0.7717023675310034, |
|
"eval_f1": 0.7547317483415474, |
|
"eval_loss": 0.6364655494689941, |
|
"eval_precision": 0.7658539052724858, |
|
"eval_recall": 0.7717023675310034, |
|
"eval_runtime": 48.4464, |
|
"eval_samples_per_second": 36.618, |
|
"eval_steps_per_second": 0.578, |
|
"step": 187 |
|
}, |
|
{ |
|
"epoch": 3.04, |
|
"learning_rate": 0.0009698387096774194, |
|
"loss": 0.6428, |
|
"step": 190 |
|
}, |
|
{ |
|
"epoch": 3.2, |
|
"learning_rate": 0.0009682258064516129, |
|
"loss": 0.6604, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 3.36, |
|
"learning_rate": 0.0009666129032258064, |
|
"loss": 0.6531, |
|
"step": 210 |
|
}, |
|
{ |
|
"epoch": 3.52, |
|
"learning_rate": 0.000965, |
|
"loss": 0.643, |
|
"step": 220 |
|
}, |
|
{ |
|
"epoch": 3.68, |
|
"learning_rate": 0.0009633870967741936, |
|
"loss": 0.6918, |
|
"step": 230 |
|
}, |
|
{ |
|
"epoch": 3.84, |
|
"learning_rate": 0.0009617741935483872, |
|
"loss": 0.6442, |
|
"step": 240 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"learning_rate": 0.0009601612903225807, |
|
"loss": 0.6576, |
|
"step": 250 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"step": 250, |
|
"train_accuracy": 0.7903114620542708, |
|
"train_f1": 0.7760264280771675, |
|
"train_loss": 0.5970289707183838, |
|
"train_precision": 0.7953318203400003, |
|
"train_recall": 0.7903114620542708, |
|
"train_runtime": 256.7891, |
|
"train_samples_per_second": 62.14, |
|
"train_steps_per_second": 0.974 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_accuracy": 0.790304396843292, |
|
"eval_f1": 0.7777020089235339, |
|
"eval_loss": 0.6154965162277222, |
|
"eval_precision": 0.7982692040791739, |
|
"eval_recall": 0.790304396843292, |
|
"eval_runtime": 46.9309, |
|
"eval_samples_per_second": 37.8, |
|
"eval_steps_per_second": 0.597, |
|
"step": 250 |
|
}, |
|
{ |
|
"epoch": 4.16, |
|
"learning_rate": 0.0009585483870967742, |
|
"loss": 0.6104, |
|
"step": 260 |
|
}, |
|
{ |
|
"epoch": 4.32, |
|
"learning_rate": 0.0009569354838709677, |
|
"loss": 0.5991, |
|
"step": 270 |
|
}, |
|
{ |
|
"epoch": 4.48, |
|
"learning_rate": 0.0009553225806451613, |
|
"loss": 0.625, |
|
"step": 280 |
|
}, |
|
{ |
|
"epoch": 4.64, |
|
"learning_rate": 0.0009537096774193548, |
|
"loss": 0.6223, |
|
"step": 290 |
|
}, |
|
{ |
|
"epoch": 4.8, |
|
"learning_rate": 0.0009520967741935485, |
|
"loss": 0.6309, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 4.96, |
|
"learning_rate": 0.000950483870967742, |
|
"loss": 0.6164, |
|
"step": 310 |
|
}, |
|
{ |
|
"epoch": 4.99, |
|
"step": 312, |
|
"train_accuracy": 0.8017797831672621, |
|
"train_f1": 0.7931150004910923, |
|
"train_loss": 0.5476173758506775, |
|
"train_precision": 0.7996150347194898, |
|
"train_recall": 0.8017797831672621, |
|
"train_runtime": 254.273, |
|
"train_samples_per_second": 62.755, |
|
"train_steps_per_second": 0.983 |
|
}, |
|
{ |
|
"epoch": 4.99, |
|
"eval_accuracy": 0.7733934611048479, |
|
"eval_f1": 0.7627200347192373, |
|
"eval_loss": 0.5989590883255005, |
|
"eval_precision": 0.7799215570339676, |
|
"eval_recall": 0.7733934611048479, |
|
"eval_runtime": 46.2691, |
|
"eval_samples_per_second": 38.341, |
|
"eval_steps_per_second": 0.605, |
|
"step": 312 |
|
}, |
|
{ |
|
"epoch": 5.12, |
|
"learning_rate": 0.0009488709677419355, |
|
"loss": 0.6067, |
|
"step": 320 |
|
}, |
|
{ |
|
"epoch": 5.28, |
|
"learning_rate": 0.0009472580645161291, |
|
"loss": 0.6144, |
|
"step": 330 |
|
}, |
|
{ |
|
"epoch": 5.44, |
|
"learning_rate": 0.0009456451612903226, |
|
"loss": 0.5815, |
|
"step": 340 |
|
}, |
|
{ |
|
"epoch": 5.6, |
|
"learning_rate": 0.0009440322580645162, |
|
"loss": 0.6036, |
|
"step": 350 |
|
}, |
|
{ |
|
"epoch": 5.76, |
|
"learning_rate": 0.0009424193548387096, |
|
"loss": 0.5748, |
|
"step": 360 |
|
}, |
|
{ |
|
"epoch": 5.92, |
|
"learning_rate": 0.0009408064516129032, |
|
"loss": 0.5779, |
|
"step": 370 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"step": 375, |
|
"train_accuracy": 0.8046625305508555, |
|
"train_f1": 0.8003331690711911, |
|
"train_loss": 0.5287690758705139, |
|
"train_precision": 0.8066353914139762, |
|
"train_recall": 0.8046625305508555, |
|
"train_runtime": 254.1046, |
|
"train_samples_per_second": 62.797, |
|
"train_steps_per_second": 0.984 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_accuracy": 0.7745208568207441, |
|
"eval_f1": 0.7668632966865262, |
|
"eval_loss": 0.602535605430603, |
|
"eval_precision": 0.7770132133553053, |
|
"eval_recall": 0.7745208568207441, |
|
"eval_runtime": 38.0169, |
|
"eval_samples_per_second": 46.663, |
|
"eval_steps_per_second": 0.737, |
|
"step": 375 |
|
}, |
|
{ |
|
"epoch": 6.08, |
|
"learning_rate": 0.0009391935483870969, |
|
"loss": 0.5808, |
|
"step": 380 |
|
}, |
|
{ |
|
"epoch": 6.24, |
|
"learning_rate": 0.0009375806451612904, |
|
"loss": 0.5692, |
|
"step": 390 |
|
}, |
|
{ |
|
"epoch": 6.4, |
|
"learning_rate": 0.0009359677419354839, |
|
"loss": 0.5525, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 6.56, |
|
"learning_rate": 0.0009343548387096774, |
|
"loss": 0.562, |
|
"step": 410 |
|
}, |
|
{ |
|
"epoch": 6.72, |
|
"learning_rate": 0.000932741935483871, |
|
"loss": 0.5858, |
|
"step": 420 |
|
}, |
|
{ |
|
"epoch": 6.88, |
|
"learning_rate": 0.0009311290322580645, |
|
"loss": 0.5647, |
|
"step": 430 |
|
}, |
|
{ |
|
"epoch": 6.99, |
|
"step": 437, |
|
"train_accuracy": 0.8250924359215391, |
|
"train_f1": 0.8156580365652172, |
|
"train_loss": 0.4726848304271698, |
|
"train_precision": 0.8244531001171268, |
|
"train_recall": 0.8250924359215391, |
|
"train_runtime": 254.8694, |
|
"train_samples_per_second": 62.609, |
|
"train_steps_per_second": 0.981 |
|
}, |
|
{ |
|
"epoch": 6.99, |
|
"eval_accuracy": 0.8094701240135288, |
|
"eval_f1": 0.8000649092582361, |
|
"eval_loss": 0.5391651391983032, |
|
"eval_precision": 0.8082600629133598, |
|
"eval_recall": 0.8094701240135288, |
|
"eval_runtime": 33.5973, |
|
"eval_samples_per_second": 52.802, |
|
"eval_steps_per_second": 0.833, |
|
"step": 437 |
|
}, |
|
{ |
|
"epoch": 7.04, |
|
"learning_rate": 0.0009295161290322581, |
|
"loss": 0.5795, |
|
"step": 440 |
|
}, |
|
{ |
|
"epoch": 7.2, |
|
"learning_rate": 0.0009279032258064515, |
|
"loss": 0.535, |
|
"step": 450 |
|
}, |
|
{ |
|
"epoch": 7.36, |
|
"learning_rate": 0.0009262903225806451, |
|
"loss": 0.5441, |
|
"step": 460 |
|
}, |
|
{ |
|
"epoch": 7.52, |
|
"learning_rate": 0.0009246774193548388, |
|
"loss": 0.5329, |
|
"step": 470 |
|
}, |
|
{ |
|
"epoch": 7.68, |
|
"learning_rate": 0.0009230645161290323, |
|
"loss": 0.5191, |
|
"step": 480 |
|
}, |
|
{ |
|
"epoch": 7.84, |
|
"learning_rate": 0.0009214516129032259, |
|
"loss": 0.5428, |
|
"step": 490 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"learning_rate": 0.0009198387096774193, |
|
"loss": 0.5062, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"step": 500, |
|
"train_accuracy": 0.8309832675314909, |
|
"train_f1": 0.8223807681274183, |
|
"train_loss": 0.4595116674900055, |
|
"train_precision": 0.8314452738097804, |
|
"train_recall": 0.8309832675314909, |
|
"train_runtime": 254.2706, |
|
"train_samples_per_second": 62.756, |
|
"train_steps_per_second": 0.983 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_accuracy": 0.8015783540022547, |
|
"eval_f1": 0.7895223836045016, |
|
"eval_loss": 0.5510557293891907, |
|
"eval_precision": 0.8031324191974503, |
|
"eval_recall": 0.8015783540022547, |
|
"eval_runtime": 33.1712, |
|
"eval_samples_per_second": 53.48, |
|
"eval_steps_per_second": 0.844, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 8.16, |
|
"learning_rate": 0.0009182258064516129, |
|
"loss": 0.5424, |
|
"step": 510 |
|
}, |
|
{ |
|
"epoch": 8.32, |
|
"learning_rate": 0.0009166129032258065, |
|
"loss": 0.5172, |
|
"step": 520 |
|
}, |
|
{ |
|
"epoch": 8.48, |
|
"learning_rate": 0.000915, |
|
"loss": 0.5081, |
|
"step": 530 |
|
}, |
|
{ |
|
"epoch": 8.64, |
|
"learning_rate": 0.0009133870967741935, |
|
"loss": 0.5357, |
|
"step": 540 |
|
}, |
|
{ |
|
"epoch": 8.8, |
|
"learning_rate": 0.0009117741935483871, |
|
"loss": 0.5317, |
|
"step": 550 |
|
}, |
|
{ |
|
"epoch": 8.96, |
|
"learning_rate": 0.0009101612903225807, |
|
"loss": 0.5479, |
|
"step": 560 |
|
}, |
|
{ |
|
"epoch": 8.99, |
|
"step": 562, |
|
"train_accuracy": 0.8421382465375697, |
|
"train_f1": 0.8356541787788663, |
|
"train_loss": 0.4283278286457062, |
|
"train_precision": 0.8418489980800979, |
|
"train_recall": 0.8421382465375697, |
|
"train_runtime": 253.325, |
|
"train_samples_per_second": 62.99, |
|
"train_steps_per_second": 0.987 |
|
}, |
|
{ |
|
"epoch": 8.99, |
|
"eval_accuracy": 0.8156708004509583, |
|
"eval_f1": 0.8099706186065314, |
|
"eval_loss": 0.5151851773262024, |
|
"eval_precision": 0.8175937941832333, |
|
"eval_recall": 0.8156708004509583, |
|
"eval_runtime": 29.3964, |
|
"eval_samples_per_second": 60.347, |
|
"eval_steps_per_second": 0.952, |
|
"step": 562 |
|
}, |
|
{ |
|
"epoch": 9.12, |
|
"learning_rate": 0.0009087096774193548, |
|
"loss": 0.4922, |
|
"step": 570 |
|
}, |
|
{ |
|
"epoch": 9.28, |
|
"learning_rate": 0.0009070967741935484, |
|
"loss": 0.4682, |
|
"step": 580 |
|
}, |
|
{ |
|
"epoch": 9.44, |
|
"learning_rate": 0.0009054838709677419, |
|
"loss": 0.5159, |
|
"step": 590 |
|
}, |
|
{ |
|
"epoch": 9.6, |
|
"learning_rate": 0.0009038709677419356, |
|
"loss": 0.5072, |
|
"step": 600 |
|
}, |
|
{ |
|
"epoch": 9.76, |
|
"learning_rate": 0.0009022580645161291, |
|
"loss": 0.4946, |
|
"step": 610 |
|
}, |
|
{ |
|
"epoch": 9.92, |
|
"learning_rate": 0.0009006451612903226, |
|
"loss": 0.504, |
|
"step": 620 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"step": 625, |
|
"train_accuracy": 0.8490317728896409, |
|
"train_f1": 0.8425370562453873, |
|
"train_loss": 0.4146420955657959, |
|
"train_precision": 0.8499471633168426, |
|
"train_recall": 0.8490317728896409, |
|
"train_runtime": 252.5657, |
|
"train_samples_per_second": 63.18, |
|
"train_steps_per_second": 0.99 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_accuracy": 0.8246899661781285, |
|
"eval_f1": 0.8181338629292875, |
|
"eval_loss": 0.4954419434070587, |
|
"eval_precision": 0.8265610533827844, |
|
"eval_recall": 0.8246899661781285, |
|
"eval_runtime": 29.7136, |
|
"eval_samples_per_second": 59.703, |
|
"eval_steps_per_second": 0.942, |
|
"step": 625 |
|
}, |
|
{ |
|
"epoch": 10.08, |
|
"learning_rate": 0.0008990322580645162, |
|
"loss": 0.4777, |
|
"step": 630 |
|
}, |
|
{ |
|
"epoch": 10.24, |
|
"learning_rate": 0.0008974193548387097, |
|
"loss": 0.4595, |
|
"step": 640 |
|
}, |
|
{ |
|
"epoch": 10.4, |
|
"learning_rate": 0.0008958064516129032, |
|
"loss": 0.4765, |
|
"step": 650 |
|
}, |
|
{ |
|
"epoch": 10.56, |
|
"learning_rate": 0.0008941935483870967, |
|
"loss": 0.481, |
|
"step": 660 |
|
}, |
|
{ |
|
"epoch": 10.72, |
|
"learning_rate": 0.0008925806451612903, |
|
"loss": 0.4936, |
|
"step": 670 |
|
}, |
|
{ |
|
"epoch": 10.88, |
|
"learning_rate": 0.0008909677419354839, |
|
"loss": 0.4928, |
|
"step": 680 |
|
}, |
|
{ |
|
"epoch": 10.99, |
|
"step": 687, |
|
"train_accuracy": 0.8662029203484364, |
|
"train_f1": 0.8651095243578739, |
|
"train_loss": 0.36719974875450134, |
|
"train_precision": 0.8661939607708877, |
|
"train_recall": 0.8662029203484364, |
|
"train_runtime": 248.0205, |
|
"train_samples_per_second": 64.337, |
|
"train_steps_per_second": 1.008 |
|
}, |
|
{ |
|
"epoch": 10.99, |
|
"eval_accuracy": 0.8325817361894025, |
|
"eval_f1": 0.8330415565435833, |
|
"eval_loss": 0.4721773862838745, |
|
"eval_precision": 0.8382637561400605, |
|
"eval_recall": 0.8325817361894025, |
|
"eval_runtime": 29.1932, |
|
"eval_samples_per_second": 60.768, |
|
"eval_steps_per_second": 0.959, |
|
"step": 687 |
|
}, |
|
{ |
|
"epoch": 11.04, |
|
"learning_rate": 0.0008893548387096775, |
|
"loss": 0.4791, |
|
"step": 690 |
|
}, |
|
{ |
|
"epoch": 11.2, |
|
"learning_rate": 0.000887741935483871, |
|
"loss": 0.471, |
|
"step": 700 |
|
}, |
|
{ |
|
"epoch": 11.36, |
|
"learning_rate": 0.0008861290322580645, |
|
"loss": 0.4514, |
|
"step": 710 |
|
}, |
|
{ |
|
"epoch": 11.52, |
|
"learning_rate": 0.0008845161290322581, |
|
"loss": 0.4554, |
|
"step": 720 |
|
}, |
|
{ |
|
"epoch": 11.68, |
|
"learning_rate": 0.0008829032258064516, |
|
"loss": 0.4778, |
|
"step": 730 |
|
}, |
|
{ |
|
"epoch": 11.84, |
|
"learning_rate": 0.0008812903225806452, |
|
"loss": 0.4214, |
|
"step": 740 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"learning_rate": 0.0008796774193548387, |
|
"loss": 0.4555, |
|
"step": 750 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"step": 750, |
|
"train_accuracy": 0.8760418625054834, |
|
"train_f1": 0.8735297151164703, |
|
"train_loss": 0.341611385345459, |
|
"train_precision": 0.8749284746900984, |
|
"train_recall": 0.8760418625054834, |
|
"train_runtime": 251.381, |
|
"train_samples_per_second": 63.477, |
|
"train_steps_per_second": 0.995 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"eval_accuracy": 0.846674182638106, |
|
"eval_f1": 0.8431872563091386, |
|
"eval_loss": 0.43833523988723755, |
|
"eval_precision": 0.8434438125814474, |
|
"eval_recall": 0.846674182638106, |
|
"eval_runtime": 29.6753, |
|
"eval_samples_per_second": 59.78, |
|
"eval_steps_per_second": 0.944, |
|
"step": 750 |
|
}, |
|
{ |
|
"epoch": 12.16, |
|
"learning_rate": 0.0008780645161290322, |
|
"loss": 0.4597, |
|
"step": 760 |
|
}, |
|
{ |
|
"epoch": 12.32, |
|
"learning_rate": 0.0008764516129032259, |
|
"loss": 0.4253, |
|
"step": 770 |
|
}, |
|
{ |
|
"epoch": 12.48, |
|
"learning_rate": 0.0008748387096774194, |
|
"loss": 0.473, |
|
"step": 780 |
|
}, |
|
{ |
|
"epoch": 12.64, |
|
"learning_rate": 0.0008732258064516129, |
|
"loss": 0.4244, |
|
"step": 790 |
|
}, |
|
{ |
|
"epoch": 12.8, |
|
"learning_rate": 0.0008716129032258064, |
|
"loss": 0.4602, |
|
"step": 800 |
|
}, |
|
{ |
|
"epoch": 12.96, |
|
"learning_rate": 0.00087, |
|
"loss": 0.4345, |
|
"step": 810 |
|
}, |
|
{ |
|
"epoch": 12.99, |
|
"step": 812, |
|
"train_accuracy": 0.8737857993357148, |
|
"train_f1": 0.8699664840253412, |
|
"train_loss": 0.3363898992538452, |
|
"train_precision": 0.8723546877750733, |
|
"train_recall": 0.8737857993357148, |
|
"train_runtime": 254.2635, |
|
"train_samples_per_second": 62.758, |
|
"train_steps_per_second": 0.983 |
|
}, |
|
{ |
|
"epoch": 12.99, |
|
"eval_accuracy": 0.8511837655016911, |
|
"eval_f1": 0.8464360738395965, |
|
"eval_loss": 0.44016385078430176, |
|
"eval_precision": 0.8479714249543402, |
|
"eval_recall": 0.8511837655016911, |
|
"eval_runtime": 29.6817, |
|
"eval_samples_per_second": 59.767, |
|
"eval_steps_per_second": 0.943, |
|
"step": 812 |
|
}, |
|
{ |
|
"epoch": 13.12, |
|
"learning_rate": 0.0008683870967741936, |
|
"loss": 0.4296, |
|
"step": 820 |
|
}, |
|
{ |
|
"epoch": 13.28, |
|
"learning_rate": 0.0008667741935483871, |
|
"loss": 0.4024, |
|
"step": 830 |
|
}, |
|
{ |
|
"epoch": 13.44, |
|
"learning_rate": 0.0008651612903225806, |
|
"loss": 0.4268, |
|
"step": 840 |
|
}, |
|
{ |
|
"epoch": 13.6, |
|
"learning_rate": 0.0008635483870967742, |
|
"loss": 0.411, |
|
"step": 850 |
|
}, |
|
{ |
|
"epoch": 13.76, |
|
"learning_rate": 0.0008619354838709678, |
|
"loss": 0.4179, |
|
"step": 860 |
|
}, |
|
{ |
|
"epoch": 13.92, |
|
"learning_rate": 0.0008603225806451614, |
|
"loss": 0.4398, |
|
"step": 870 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"step": 875, |
|
"train_accuracy": 0.880553988845021, |
|
"train_f1": 0.8770183301442244, |
|
"train_loss": 0.3260194957256317, |
|
"train_precision": 0.8807172403068199, |
|
"train_recall": 0.880553988845021, |
|
"train_runtime": 252.7172, |
|
"train_samples_per_second": 63.142, |
|
"train_steps_per_second": 0.989 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"eval_accuracy": 0.8494926719278467, |
|
"eval_f1": 0.8469368583418073, |
|
"eval_loss": 0.44426438212394714, |
|
"eval_precision": 0.8497246468797232, |
|
"eval_recall": 0.8494926719278467, |
|
"eval_runtime": 29.5345, |
|
"eval_samples_per_second": 60.065, |
|
"eval_steps_per_second": 0.948, |
|
"step": 875 |
|
}, |
|
{ |
|
"epoch": 14.08, |
|
"learning_rate": 0.0008587096774193549, |
|
"loss": 0.4153, |
|
"step": 880 |
|
}, |
|
{ |
|
"epoch": 14.24, |
|
"learning_rate": 0.0008570967741935484, |
|
"loss": 0.4065, |
|
"step": 890 |
|
}, |
|
{ |
|
"epoch": 14.4, |
|
"learning_rate": 0.0008554838709677419, |
|
"loss": 0.4045, |
|
"step": 900 |
|
}, |
|
{ |
|
"epoch": 14.56, |
|
"learning_rate": 0.0008538709677419355, |
|
"loss": 0.3879, |
|
"step": 910 |
|
}, |
|
{ |
|
"epoch": 14.72, |
|
"learning_rate": 0.000852258064516129, |
|
"loss": 0.4095, |
|
"step": 920 |
|
}, |
|
{ |
|
"epoch": 14.88, |
|
"learning_rate": 0.0008506451612903226, |
|
"loss": 0.405, |
|
"step": 930 |
|
}, |
|
{ |
|
"epoch": 14.99, |
|
"step": 937, |
|
"train_accuracy": 0.8919596415366297, |
|
"train_f1": 0.8898750533747908, |
|
"train_loss": 0.29893702268600464, |
|
"train_precision": 0.8905204704311594, |
|
"train_recall": 0.8919596415366297, |
|
"train_runtime": 255.1579, |
|
"train_samples_per_second": 62.538, |
|
"train_steps_per_second": 0.98 |
|
}, |
|
{ |
|
"epoch": 14.99, |
|
"eval_accuracy": 0.8568207440811725, |
|
"eval_f1": 0.8543462911384269, |
|
"eval_loss": 0.4096240699291229, |
|
"eval_precision": 0.8552780691368613, |
|
"eval_recall": 0.8568207440811725, |
|
"eval_runtime": 29.6726, |
|
"eval_samples_per_second": 59.786, |
|
"eval_steps_per_second": 0.944, |
|
"step": 937 |
|
}, |
|
{ |
|
"epoch": 15.04, |
|
"learning_rate": 0.0008490322580645162, |
|
"loss": 0.4047, |
|
"step": 940 |
|
}, |
|
{ |
|
"epoch": 15.2, |
|
"learning_rate": 0.0008474193548387097, |
|
"loss": 0.4049, |
|
"step": 950 |
|
}, |
|
{ |
|
"epoch": 15.36, |
|
"learning_rate": 0.0008458064516129033, |
|
"loss": 0.39, |
|
"step": 960 |
|
}, |
|
{ |
|
"epoch": 15.52, |
|
"learning_rate": 0.0008441935483870968, |
|
"loss": 0.4253, |
|
"step": 970 |
|
}, |
|
{ |
|
"epoch": 15.68, |
|
"learning_rate": 0.0008425806451612903, |
|
"loss": 0.3707, |
|
"step": 980 |
|
}, |
|
{ |
|
"epoch": 15.84, |
|
"learning_rate": 0.0008409677419354838, |
|
"loss": 0.389, |
|
"step": 990 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"learning_rate": 0.0008393548387096774, |
|
"loss": 0.4069, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"step": 1000, |
|
"train_accuracy": 0.8934636836498089, |
|
"train_f1": 0.8909693605701321, |
|
"train_loss": 0.2904220521450043, |
|
"train_precision": 0.893519044249712, |
|
"train_recall": 0.8934636836498089, |
|
"train_runtime": 254.2734, |
|
"train_samples_per_second": 62.755, |
|
"train_steps_per_second": 0.983 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"eval_accuracy": 0.8500563697857948, |
|
"eval_f1": 0.8452271271553625, |
|
"eval_loss": 0.4389975965023041, |
|
"eval_precision": 0.851487739267586, |
|
"eval_recall": 0.8500563697857948, |
|
"eval_runtime": 29.5522, |
|
"eval_samples_per_second": 60.029, |
|
"eval_steps_per_second": 0.947, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 16.16, |
|
"learning_rate": 0.0008377419354838711, |
|
"loss": 0.389, |
|
"step": 1010 |
|
}, |
|
{ |
|
"epoch": 16.32, |
|
"learning_rate": 0.0008361290322580646, |
|
"loss": 0.3682, |
|
"step": 1020 |
|
}, |
|
{ |
|
"epoch": 16.48, |
|
"learning_rate": 0.0008345161290322581, |
|
"loss": 0.3746, |
|
"step": 1030 |
|
}, |
|
{ |
|
"epoch": 16.64, |
|
"learning_rate": 0.0008329032258064516, |
|
"loss": 0.3817, |
|
"step": 1040 |
|
}, |
|
{ |
|
"epoch": 16.8, |
|
"learning_rate": 0.0008312903225806452, |
|
"loss": 0.3652, |
|
"step": 1050 |
|
}, |
|
{ |
|
"epoch": 16.96, |
|
"learning_rate": 0.0008296774193548387, |
|
"loss": 0.3774, |
|
"step": 1060 |
|
}, |
|
{ |
|
"epoch": 16.99, |
|
"step": 1062, |
|
"train_accuracy": 0.9058093626621545, |
|
"train_f1": 0.9046539806661633, |
|
"train_loss": 0.2608683109283447, |
|
"train_precision": 0.9049170910236276, |
|
"train_recall": 0.9058093626621545, |
|
"train_runtime": 253.2237, |
|
"train_samples_per_second": 63.015, |
|
"train_steps_per_second": 0.987 |
|
}, |
|
{ |
|
"epoch": 16.99, |
|
"eval_accuracy": 0.8579481397970687, |
|
"eval_f1": 0.8563523858127897, |
|
"eval_loss": 0.415022075176239, |
|
"eval_precision": 0.8576310002165511, |
|
"eval_recall": 0.8579481397970687, |
|
"eval_runtime": 29.5963, |
|
"eval_samples_per_second": 59.94, |
|
"eval_steps_per_second": 0.946, |
|
"step": 1062 |
|
}, |
|
{ |
|
"epoch": 17.12, |
|
"learning_rate": 0.0008280645161290323, |
|
"loss": 0.3537, |
|
"step": 1070 |
|
}, |
|
{ |
|
"epoch": 17.28, |
|
"learning_rate": 0.0008264516129032257, |
|
"loss": 0.3743, |
|
"step": 1080 |
|
}, |
|
{ |
|
"epoch": 17.44, |
|
"learning_rate": 0.0008248387096774194, |
|
"loss": 0.3648, |
|
"step": 1090 |
|
}, |
|
{ |
|
"epoch": 17.6, |
|
"learning_rate": 0.000823225806451613, |
|
"loss": 0.3659, |
|
"step": 1100 |
|
}, |
|
{ |
|
"epoch": 17.76, |
|
"learning_rate": 0.0008216129032258065, |
|
"loss": 0.3713, |
|
"step": 1110 |
|
}, |
|
{ |
|
"epoch": 17.92, |
|
"learning_rate": 0.00082, |
|
"loss": 0.3631, |
|
"step": 1120 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"step": 1125, |
|
"train_accuracy": 0.9117628626934887, |
|
"train_f1": 0.9111752276141204, |
|
"train_loss": 0.24888941645622253, |
|
"train_precision": 0.9116531142476182, |
|
"train_recall": 0.9117628626934887, |
|
"train_runtime": 253.2878, |
|
"train_samples_per_second": 62.999, |
|
"train_steps_per_second": 0.987 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"eval_accuracy": 0.85456595264938, |
|
"eval_f1": 0.8546917151279523, |
|
"eval_loss": 0.42011961340904236, |
|
"eval_precision": 0.858590913110437, |
|
"eval_recall": 0.85456595264938, |
|
"eval_runtime": 29.5881, |
|
"eval_samples_per_second": 59.956, |
|
"eval_steps_per_second": 0.946, |
|
"step": 1125 |
|
}, |
|
{ |
|
"epoch": 18.08, |
|
"learning_rate": 0.0008183870967741935, |
|
"loss": 0.3537, |
|
"step": 1130 |
|
}, |
|
{ |
|
"epoch": 18.24, |
|
"learning_rate": 0.0008167741935483871, |
|
"loss": 0.3214, |
|
"step": 1140 |
|
}, |
|
{ |
|
"epoch": 18.4, |
|
"learning_rate": 0.0008151612903225807, |
|
"loss": 0.3464, |
|
"step": 1150 |
|
}, |
|
{ |
|
"epoch": 18.56, |
|
"learning_rate": 0.0008135483870967742, |
|
"loss": 0.3503, |
|
"step": 1160 |
|
}, |
|
{ |
|
"epoch": 18.72, |
|
"learning_rate": 0.0008119354838709677, |
|
"loss": 0.3745, |
|
"step": 1170 |
|
}, |
|
{ |
|
"epoch": 18.88, |
|
"learning_rate": 0.0008103225806451613, |
|
"loss": 0.3458, |
|
"step": 1180 |
|
}, |
|
{ |
|
"epoch": 18.99, |
|
"step": 1187, |
|
"train_accuracy": 0.912326878485931, |
|
"train_f1": 0.9113314150149505, |
|
"train_loss": 0.24995951354503632, |
|
"train_precision": 0.9115719864017833, |
|
"train_recall": 0.912326878485931, |
|
"train_runtime": 254.6215, |
|
"train_samples_per_second": 62.669, |
|
"train_steps_per_second": 0.982 |
|
}, |
|
{ |
|
"epoch": 18.99, |
|
"eval_accuracy": 0.8562570462232244, |
|
"eval_f1": 0.8542249820828076, |
|
"eval_loss": 0.40477874875068665, |
|
"eval_precision": 0.8544614619611243, |
|
"eval_recall": 0.8562570462232244, |
|
"eval_runtime": 29.856, |
|
"eval_samples_per_second": 59.418, |
|
"eval_steps_per_second": 0.938, |
|
"step": 1187 |
|
}, |
|
{ |
|
"epoch": 19.04, |
|
"learning_rate": 0.0008087096774193549, |
|
"loss": 0.3953, |
|
"step": 1190 |
|
}, |
|
{ |
|
"epoch": 19.2, |
|
"learning_rate": 0.0008070967741935484, |
|
"loss": 0.3386, |
|
"step": 1200 |
|
}, |
|
{ |
|
"epoch": 19.36, |
|
"learning_rate": 0.000805483870967742, |
|
"loss": 0.3322, |
|
"step": 1210 |
|
}, |
|
{ |
|
"epoch": 19.52, |
|
"learning_rate": 0.0008038709677419355, |
|
"loss": 0.3425, |
|
"step": 1220 |
|
}, |
|
{ |
|
"epoch": 19.68, |
|
"learning_rate": 0.000802258064516129, |
|
"loss": 0.3448, |
|
"step": 1230 |
|
}, |
|
{ |
|
"epoch": 19.84, |
|
"learning_rate": 0.0008006451612903226, |
|
"loss": 0.3534, |
|
"step": 1240 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"learning_rate": 0.0007990322580645161, |
|
"loss": 0.3361, |
|
"step": 1250 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"step": 1250, |
|
"train_accuracy": 0.9059346995049194, |
|
"train_f1": 0.9033631776657957, |
|
"train_loss": 0.2528255581855774, |
|
"train_precision": 0.9064546977324616, |
|
"train_recall": 0.9059346995049194, |
|
"train_runtime": 252.7613, |
|
"train_samples_per_second": 63.131, |
|
"train_steps_per_second": 0.989 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"eval_accuracy": 0.8596392333709132, |
|
"eval_f1": 0.8566333454163209, |
|
"eval_loss": 0.4370974004268646, |
|
"eval_precision": 0.8585278408293291, |
|
"eval_recall": 0.8596392333709132, |
|
"eval_runtime": 29.8096, |
|
"eval_samples_per_second": 59.511, |
|
"eval_steps_per_second": 0.939, |
|
"step": 1250 |
|
}, |
|
{ |
|
"epoch": 20.16, |
|
"learning_rate": 0.0007974193548387097, |
|
"loss": 0.3154, |
|
"step": 1260 |
|
}, |
|
{ |
|
"epoch": 20.32, |
|
"learning_rate": 0.0007958064516129032, |
|
"loss": 0.3478, |
|
"step": 1270 |
|
}, |
|
{ |
|
"epoch": 20.48, |
|
"learning_rate": 0.0007941935483870968, |
|
"loss": 0.3385, |
|
"step": 1280 |
|
}, |
|
{ |
|
"epoch": 20.64, |
|
"learning_rate": 0.0007925806451612904, |
|
"loss": 0.3327, |
|
"step": 1290 |
|
}, |
|
{ |
|
"epoch": 20.8, |
|
"learning_rate": 0.0007909677419354839, |
|
"loss": 0.3398, |
|
"step": 1300 |
|
}, |
|
{ |
|
"epoch": 20.96, |
|
"learning_rate": 0.0007893548387096774, |
|
"loss": 0.3386, |
|
"step": 1310 |
|
}, |
|
{ |
|
"epoch": 20.99, |
|
"step": 1312, |
|
"train_accuracy": 0.9205991101084163, |
|
"train_f1": 0.9202297733826367, |
|
"train_loss": 0.22639435529708862, |
|
"train_precision": 0.9204915599848654, |
|
"train_recall": 0.9205991101084163, |
|
"train_runtime": 253.7128, |
|
"train_samples_per_second": 62.894, |
|
"train_steps_per_second": 0.985 |
|
}, |
|
{ |
|
"epoch": 20.99, |
|
"eval_accuracy": 0.8686583990980834, |
|
"eval_f1": 0.8680154821185954, |
|
"eval_loss": 0.39551448822021484, |
|
"eval_precision": 0.8689593382775722, |
|
"eval_recall": 0.8686583990980834, |
|
"eval_runtime": 29.773, |
|
"eval_samples_per_second": 59.584, |
|
"eval_steps_per_second": 0.94, |
|
"step": 1312 |
|
}, |
|
{ |
|
"epoch": 21.12, |
|
"learning_rate": 0.0007877419354838709, |
|
"loss": 0.3038, |
|
"step": 1320 |
|
}, |
|
{ |
|
"epoch": 21.28, |
|
"learning_rate": 0.0007861290322580645, |
|
"loss": 0.3157, |
|
"step": 1330 |
|
}, |
|
{ |
|
"epoch": 21.44, |
|
"learning_rate": 0.0007845161290322582, |
|
"loss": 0.318, |
|
"step": 1340 |
|
}, |
|
{ |
|
"epoch": 21.6, |
|
"learning_rate": 0.0007829032258064517, |
|
"loss": 0.2993, |
|
"step": 1350 |
|
}, |
|
{ |
|
"epoch": 21.76, |
|
"learning_rate": 0.0007812903225806452, |
|
"loss": 0.3185, |
|
"step": 1360 |
|
}, |
|
{ |
|
"epoch": 21.92, |
|
"learning_rate": 0.0007796774193548387, |
|
"loss": 0.3091, |
|
"step": 1370 |
|
}, |
|
{ |
|
"epoch": 22.0, |
|
"step": 1375, |
|
"train_accuracy": 0.9207871153725637, |
|
"train_f1": 0.919568201335574, |
|
"train_loss": 0.21673625707626343, |
|
"train_precision": 0.9203664780549666, |
|
"train_recall": 0.9207871153725637, |
|
"train_runtime": 249.1604, |
|
"train_samples_per_second": 64.043, |
|
"train_steps_per_second": 1.003 |
|
}, |
|
{ |
|
"epoch": 22.0, |
|
"eval_accuracy": 0.8680947012401353, |
|
"eval_f1": 0.8657724581221397, |
|
"eval_loss": 0.4277941584587097, |
|
"eval_precision": 0.8671942484944011, |
|
"eval_recall": 0.8680947012401353, |
|
"eval_runtime": 29.1495, |
|
"eval_samples_per_second": 60.859, |
|
"eval_steps_per_second": 0.961, |
|
"step": 1375 |
|
}, |
|
{ |
|
"epoch": 22.08, |
|
"learning_rate": 0.0007780645161290323, |
|
"loss": 0.3109, |
|
"step": 1380 |
|
}, |
|
{ |
|
"epoch": 22.24, |
|
"learning_rate": 0.0007764516129032258, |
|
"loss": 0.3082, |
|
"step": 1390 |
|
}, |
|
{ |
|
"epoch": 22.4, |
|
"learning_rate": 0.0007748387096774193, |
|
"loss": 0.3133, |
|
"step": 1400 |
|
}, |
|
{ |
|
"epoch": 22.56, |
|
"learning_rate": 0.0007732258064516128, |
|
"loss": 0.3217, |
|
"step": 1410 |
|
}, |
|
{ |
|
"epoch": 22.72, |
|
"learning_rate": 0.0007716129032258065, |
|
"loss": 0.3145, |
|
"step": 1420 |
|
}, |
|
{ |
|
"epoch": 22.88, |
|
"learning_rate": 0.0007700000000000001, |
|
"loss": 0.3081, |
|
"step": 1430 |
|
}, |
|
{ |
|
"epoch": 22.99, |
|
"step": 1437, |
|
"train_accuracy": 0.9301247101585511, |
|
"train_f1": 0.9298726796945993, |
|
"train_loss": 0.2020701915025711, |
|
"train_precision": 0.9301061473852973, |
|
"train_recall": 0.9301247101585511, |
|
"train_runtime": 248.5533, |
|
"train_samples_per_second": 64.2, |
|
"train_steps_per_second": 1.006 |
|
}, |
|
{ |
|
"epoch": 22.99, |
|
"eval_accuracy": 0.8675310033821871, |
|
"eval_f1": 0.8662116604826631, |
|
"eval_loss": 0.39544782042503357, |
|
"eval_precision": 0.866086748268126, |
|
"eval_recall": 0.8675310033821871, |
|
"eval_runtime": 29.2034, |
|
"eval_samples_per_second": 60.746, |
|
"eval_steps_per_second": 0.959, |
|
"step": 1437 |
|
}, |
|
{ |
|
"epoch": 23.04, |
|
"learning_rate": 0.0007683870967741936, |
|
"loss": 0.3357, |
|
"step": 1440 |
|
}, |
|
{ |
|
"epoch": 23.2, |
|
"learning_rate": 0.0007667741935483871, |
|
"loss": 0.2981, |
|
"step": 1450 |
|
}, |
|
{ |
|
"epoch": 23.36, |
|
"learning_rate": 0.0007651612903225806, |
|
"loss": 0.2823, |
|
"step": 1460 |
|
}, |
|
{ |
|
"epoch": 23.52, |
|
"learning_rate": 0.0007635483870967742, |
|
"loss": 0.3036, |
|
"step": 1470 |
|
}, |
|
{ |
|
"epoch": 23.68, |
|
"learning_rate": 0.0007619354838709678, |
|
"loss": 0.3097, |
|
"step": 1480 |
|
}, |
|
{ |
|
"epoch": 23.84, |
|
"learning_rate": 0.0007603225806451613, |
|
"loss": 0.3004, |
|
"step": 1490 |
|
}, |
|
{ |
|
"epoch": 24.0, |
|
"learning_rate": 0.0007587096774193549, |
|
"loss": 0.3031, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 24.0, |
|
"step": 1500, |
|
"train_accuracy": 0.9242965469699819, |
|
"train_f1": 0.9232184701149497, |
|
"train_loss": 0.20474377274513245, |
|
"train_precision": 0.9253522346156541, |
|
"train_recall": 0.9242965469699819, |
|
"train_runtime": 248.6452, |
|
"train_samples_per_second": 64.176, |
|
"train_steps_per_second": 1.005 |
|
}, |
|
{ |
|
"epoch": 24.0, |
|
"eval_accuracy": 0.8720405862457723, |
|
"eval_f1": 0.8716583234363133, |
|
"eval_loss": 0.42239370942115784, |
|
"eval_precision": 0.8734092383360484, |
|
"eval_recall": 0.8720405862457723, |
|
"eval_runtime": 29.0555, |
|
"eval_samples_per_second": 61.055, |
|
"eval_steps_per_second": 0.964, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 24.16, |
|
"learning_rate": 0.0007570967741935484, |
|
"loss": 0.2858, |
|
"step": 1510 |
|
}, |
|
{ |
|
"epoch": 24.32, |
|
"learning_rate": 0.000755483870967742, |
|
"loss": 0.2999, |
|
"step": 1520 |
|
}, |
|
{ |
|
"epoch": 24.48, |
|
"learning_rate": 0.0007538709677419355, |
|
"loss": 0.3135, |
|
"step": 1530 |
|
}, |
|
{ |
|
"epoch": 24.64, |
|
"learning_rate": 0.000752258064516129, |
|
"loss": 0.2951, |
|
"step": 1540 |
|
}, |
|
{ |
|
"epoch": 24.8, |
|
"learning_rate": 0.0007506451612903225, |
|
"loss": 0.3136, |
|
"step": 1550 |
|
}, |
|
{ |
|
"epoch": 24.96, |
|
"learning_rate": 0.0007490322580645161, |
|
"loss": 0.2918, |
|
"step": 1560 |
|
}, |
|
{ |
|
"epoch": 24.99, |
|
"step": 1562, |
|
"train_accuracy": 0.9315660838503478, |
|
"train_f1": 0.9309767971055543, |
|
"train_loss": 0.1887647807598114, |
|
"train_precision": 0.9311524146378474, |
|
"train_recall": 0.9315660838503478, |
|
"train_runtime": 249.2905, |
|
"train_samples_per_second": 64.01, |
|
"train_steps_per_second": 1.003 |
|
}, |
|
{ |
|
"epoch": 24.99, |
|
"eval_accuracy": 0.8680947012401353, |
|
"eval_f1": 0.8669054461224185, |
|
"eval_loss": 0.43037477135658264, |
|
"eval_precision": 0.8673301666844889, |
|
"eval_recall": 0.8680947012401353, |
|
"eval_runtime": 29.0965, |
|
"eval_samples_per_second": 60.97, |
|
"eval_steps_per_second": 0.962, |
|
"step": 1562 |
|
}, |
|
{ |
|
"epoch": 25.12, |
|
"learning_rate": 0.0007474193548387097, |
|
"loss": 0.2943, |
|
"step": 1570 |
|
}, |
|
{ |
|
"epoch": 25.28, |
|
"learning_rate": 0.0007458064516129033, |
|
"loss": 0.2796, |
|
"step": 1580 |
|
}, |
|
{ |
|
"epoch": 25.44, |
|
"learning_rate": 0.0007441935483870968, |
|
"loss": 0.2712, |
|
"step": 1590 |
|
}, |
|
{ |
|
"epoch": 25.6, |
|
"learning_rate": 0.0007425806451612903, |
|
"loss": 0.2862, |
|
"step": 1600 |
|
}, |
|
{ |
|
"epoch": 25.76, |
|
"learning_rate": 0.0007409677419354839, |
|
"loss": 0.2833, |
|
"step": 1610 |
|
}, |
|
{ |
|
"epoch": 25.92, |
|
"learning_rate": 0.0007393548387096775, |
|
"loss": 0.2594, |
|
"step": 1620 |
|
}, |
|
{ |
|
"epoch": 26.0, |
|
"step": 1625, |
|
"train_accuracy": 0.934824841762236, |
|
"train_f1": 0.9340766757397655, |
|
"train_loss": 0.18092262744903564, |
|
"train_precision": 0.9349816666427498, |
|
"train_recall": 0.934824841762236, |
|
"train_runtime": 249.0812, |
|
"train_samples_per_second": 64.063, |
|
"train_steps_per_second": 1.004 |
|
}, |
|
{ |
|
"epoch": 26.0, |
|
"eval_accuracy": 0.8776775648252536, |
|
"eval_f1": 0.8766912677805229, |
|
"eval_loss": 0.421634703874588, |
|
"eval_precision": 0.8774332235361698, |
|
"eval_recall": 0.8776775648252536, |
|
"eval_runtime": 30.0967, |
|
"eval_samples_per_second": 58.943, |
|
"eval_steps_per_second": 0.93, |
|
"step": 1625 |
|
}, |
|
{ |
|
"epoch": 26.08, |
|
"learning_rate": 0.000737741935483871, |
|
"loss": 0.2729, |
|
"step": 1630 |
|
}, |
|
{ |
|
"epoch": 26.24, |
|
"learning_rate": 0.0007361290322580645, |
|
"loss": 0.2801, |
|
"step": 1640 |
|
}, |
|
{ |
|
"epoch": 26.4, |
|
"learning_rate": 0.000734516129032258, |
|
"loss": 0.2653, |
|
"step": 1650 |
|
}, |
|
{ |
|
"epoch": 26.56, |
|
"learning_rate": 0.0007329032258064517, |
|
"loss": 0.3044, |
|
"step": 1660 |
|
}, |
|
{ |
|
"epoch": 26.72, |
|
"learning_rate": 0.0007312903225806452, |
|
"loss": 0.2751, |
|
"step": 1670 |
|
}, |
|
{ |
|
"epoch": 26.88, |
|
"learning_rate": 0.0007296774193548388, |
|
"loss": 0.3028, |
|
"step": 1680 |
|
}, |
|
{ |
|
"epoch": 26.99, |
|
"step": 1687, |
|
"train_accuracy": 0.93670489440371, |
|
"train_f1": 0.9361197667432394, |
|
"train_loss": 0.1785627156496048, |
|
"train_precision": 0.9365292015778245, |
|
"train_recall": 0.93670489440371, |
|
"train_runtime": 255.0897, |
|
"train_samples_per_second": 62.554, |
|
"train_steps_per_second": 0.98 |
|
}, |
|
{ |
|
"epoch": 26.99, |
|
"eval_accuracy": 0.8810597519729425, |
|
"eval_f1": 0.8793922695566861, |
|
"eval_loss": 0.40421751141548157, |
|
"eval_precision": 0.8798634255905717, |
|
"eval_recall": 0.8810597519729425, |
|
"eval_runtime": 45.5693, |
|
"eval_samples_per_second": 38.93, |
|
"eval_steps_per_second": 0.614, |
|
"step": 1687 |
|
}, |
|
{ |
|
"epoch": 27.04, |
|
"learning_rate": 0.0007280645161290323, |
|
"loss": 0.2499, |
|
"step": 1690 |
|
}, |
|
{ |
|
"epoch": 27.2, |
|
"learning_rate": 0.0007264516129032258, |
|
"loss": 0.2792, |
|
"step": 1700 |
|
}, |
|
{ |
|
"epoch": 27.36, |
|
"learning_rate": 0.0007248387096774194, |
|
"loss": 0.2792, |
|
"step": 1710 |
|
}, |
|
{ |
|
"epoch": 27.52, |
|
"learning_rate": 0.0007232258064516129, |
|
"loss": 0.2865, |
|
"step": 1720 |
|
}, |
|
{ |
|
"epoch": 27.68, |
|
"learning_rate": 0.0007216129032258064, |
|
"loss": 0.2845, |
|
"step": 1730 |
|
}, |
|
{ |
|
"epoch": 27.84, |
|
"learning_rate": 0.0007199999999999999, |
|
"loss": 0.2861, |
|
"step": 1740 |
|
}, |
|
{ |
|
"epoch": 28.0, |
|
"learning_rate": 0.0007183870967741936, |
|
"loss": 0.2758, |
|
"step": 1750 |
|
}, |
|
{ |
|
"epoch": 28.0, |
|
"step": 1750, |
|
"train_accuracy": 0.938459610202419, |
|
"train_f1": 0.9377525981628592, |
|
"train_loss": 0.1685272455215454, |
|
"train_precision": 0.9389554252034343, |
|
"train_recall": 0.938459610202419, |
|
"train_runtime": 253.2422, |
|
"train_samples_per_second": 63.011, |
|
"train_steps_per_second": 0.987 |
|
}, |
|
{ |
|
"epoch": 28.0, |
|
"eval_accuracy": 0.8680947012401353, |
|
"eval_f1": 0.8681614791663694, |
|
"eval_loss": 0.41954031586647034, |
|
"eval_precision": 0.8691594298818118, |
|
"eval_recall": 0.8680947012401353, |
|
"eval_runtime": 47.5593, |
|
"eval_samples_per_second": 37.301, |
|
"eval_steps_per_second": 0.589, |
|
"step": 1750 |
|
}, |
|
{ |
|
"epoch": 28.16, |
|
"learning_rate": 0.0007167741935483872, |
|
"loss": 0.2659, |
|
"step": 1760 |
|
}, |
|
{ |
|
"epoch": 28.32, |
|
"learning_rate": 0.0007151612903225807, |
|
"loss": 0.2522, |
|
"step": 1770 |
|
}, |
|
{ |
|
"epoch": 28.48, |
|
"learning_rate": 0.0007135483870967742, |
|
"loss": 0.2755, |
|
"step": 1780 |
|
}, |
|
{ |
|
"epoch": 28.64, |
|
"learning_rate": 0.0007119354838709677, |
|
"loss": 0.2736, |
|
"step": 1790 |
|
}, |
|
{ |
|
"epoch": 28.8, |
|
"learning_rate": 0.0007103225806451613, |
|
"loss": 0.2847, |
|
"step": 1800 |
|
}, |
|
{ |
|
"epoch": 28.96, |
|
"learning_rate": 0.0007087096774193548, |
|
"loss": 0.2833, |
|
"step": 1810 |
|
}, |
|
{ |
|
"epoch": 28.99, |
|
"step": 1812, |
|
"train_accuracy": 0.9406530049508053, |
|
"train_f1": 0.9397675181987466, |
|
"train_loss": 0.16751761734485626, |
|
"train_precision": 0.9410854777530413, |
|
"train_recall": 0.9406530049508053, |
|
"train_runtime": 254.9572, |
|
"train_samples_per_second": 62.587, |
|
"train_steps_per_second": 0.981 |
|
}, |
|
{ |
|
"epoch": 28.99, |
|
"eval_accuracy": 0.8759864712514093, |
|
"eval_f1": 0.872766620485809, |
|
"eval_loss": 0.37792226672172546, |
|
"eval_precision": 0.8741418008848874, |
|
"eval_recall": 0.8759864712514093, |
|
"eval_runtime": 41.0022, |
|
"eval_samples_per_second": 43.266, |
|
"eval_steps_per_second": 0.683, |
|
"step": 1812 |
|
}, |
|
{ |
|
"epoch": 29.12, |
|
"learning_rate": 0.0007070967741935484, |
|
"loss": 0.2487, |
|
"step": 1820 |
|
}, |
|
{ |
|
"epoch": 29.28, |
|
"learning_rate": 0.000705483870967742, |
|
"loss": 0.2712, |
|
"step": 1830 |
|
}, |
|
{ |
|
"epoch": 29.44, |
|
"learning_rate": 0.0007038709677419355, |
|
"loss": 0.243, |
|
"step": 1840 |
|
}, |
|
{ |
|
"epoch": 29.6, |
|
"learning_rate": 0.0007022580645161291, |
|
"loss": 0.2438, |
|
"step": 1850 |
|
}, |
|
{ |
|
"epoch": 29.76, |
|
"learning_rate": 0.0007006451612903226, |
|
"loss": 0.2834, |
|
"step": 1860 |
|
}, |
|
{ |
|
"epoch": 29.92, |
|
"learning_rate": 0.0006990322580645161, |
|
"loss": 0.2414, |
|
"step": 1870 |
|
}, |
|
{ |
|
"epoch": 30.0, |
|
"step": 1875, |
|
"train_accuracy": 0.9470451839318168, |
|
"train_f1": 0.9467087754155913, |
|
"train_loss": 0.15353631973266602, |
|
"train_precision": 0.9468910650190296, |
|
"train_recall": 0.9470451839318168, |
|
"train_runtime": 255.1175, |
|
"train_samples_per_second": 62.548, |
|
"train_steps_per_second": 0.98 |
|
}, |
|
{ |
|
"epoch": 30.0, |
|
"eval_accuracy": 0.8799323562570462, |
|
"eval_f1": 0.8785953814489085, |
|
"eval_loss": 0.4351659119129181, |
|
"eval_precision": 0.8796722516525893, |
|
"eval_recall": 0.8799323562570462, |
|
"eval_runtime": 38.7284, |
|
"eval_samples_per_second": 45.806, |
|
"eval_steps_per_second": 0.723, |
|
"step": 1875 |
|
}, |
|
{ |
|
"epoch": 30.08, |
|
"learning_rate": 0.0006974193548387096, |
|
"loss": 0.2458, |
|
"step": 1880 |
|
}, |
|
{ |
|
"epoch": 30.24, |
|
"learning_rate": 0.0006958064516129032, |
|
"loss": 0.2436, |
|
"step": 1890 |
|
}, |
|
{ |
|
"epoch": 30.4, |
|
"learning_rate": 0.0006941935483870968, |
|
"loss": 0.2279, |
|
"step": 1900 |
|
}, |
|
{ |
|
"epoch": 30.56, |
|
"learning_rate": 0.0006925806451612904, |
|
"loss": 0.2496, |
|
"step": 1910 |
|
}, |
|
{ |
|
"epoch": 30.72, |
|
"learning_rate": 0.0006909677419354839, |
|
"loss": 0.2527, |
|
"step": 1920 |
|
}, |
|
{ |
|
"epoch": 30.88, |
|
"learning_rate": 0.0006893548387096774, |
|
"loss": 0.2508, |
|
"step": 1930 |
|
}, |
|
{ |
|
"epoch": 30.99, |
|
"step": 1937, |
|
"train_accuracy": 0.945729147082785, |
|
"train_f1": 0.9452594948649355, |
|
"train_loss": 0.14930781722068787, |
|
"train_precision": 0.9455852542228912, |
|
"train_recall": 0.945729147082785, |
|
"train_runtime": 254.6951, |
|
"train_samples_per_second": 62.651, |
|
"train_steps_per_second": 0.982 |
|
}, |
|
{ |
|
"epoch": 30.99, |
|
"eval_accuracy": 0.887260428410372, |
|
"eval_f1": 0.8853880807732613, |
|
"eval_loss": 0.418369859457016, |
|
"eval_precision": 0.8856923487657594, |
|
"eval_recall": 0.887260428410372, |
|
"eval_runtime": 39.5926, |
|
"eval_samples_per_second": 44.806, |
|
"eval_steps_per_second": 0.707, |
|
"step": 1937 |
|
}, |
|
{ |
|
"epoch": 31.04, |
|
"learning_rate": 0.000687741935483871, |
|
"loss": 0.2344, |
|
"step": 1940 |
|
}, |
|
{ |
|
"epoch": 31.2, |
|
"learning_rate": 0.0006861290322580645, |
|
"loss": 0.2417, |
|
"step": 1950 |
|
}, |
|
{ |
|
"epoch": 31.36, |
|
"learning_rate": 0.0006845161290322581, |
|
"loss": 0.252, |
|
"step": 1960 |
|
}, |
|
{ |
|
"epoch": 31.52, |
|
"learning_rate": 0.0006829032258064516, |
|
"loss": 0.2465, |
|
"step": 1970 |
|
}, |
|
{ |
|
"epoch": 31.68, |
|
"learning_rate": 0.0006812903225806451, |
|
"loss": 0.2405, |
|
"step": 1980 |
|
}, |
|
{ |
|
"epoch": 31.84, |
|
"learning_rate": 0.0006796774193548388, |
|
"loss": 0.2275, |
|
"step": 1990 |
|
}, |
|
{ |
|
"epoch": 32.0, |
|
"learning_rate": 0.0006780645161290323, |
|
"loss": 0.2509, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 32.0, |
|
"step": 2000, |
|
"train_accuracy": 0.9509932944789121, |
|
"train_f1": 0.950617708879211, |
|
"train_loss": 0.14158745110034943, |
|
"train_precision": 0.9510854186462011, |
|
"train_recall": 0.9509932944789121, |
|
"train_runtime": 255.2742, |
|
"train_samples_per_second": 62.509, |
|
"train_steps_per_second": 0.979 |
|
}, |
|
{ |
|
"epoch": 32.0, |
|
"eval_accuracy": 0.8889515219842165, |
|
"eval_f1": 0.8871024769373068, |
|
"eval_loss": 0.41492128372192383, |
|
"eval_precision": 0.8891530304505318, |
|
"eval_recall": 0.8889515219842165, |
|
"eval_runtime": 35.6073, |
|
"eval_samples_per_second": 49.821, |
|
"eval_steps_per_second": 0.786, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 32.16, |
|
"learning_rate": 0.0006764516129032258, |
|
"loss": 0.22, |
|
"step": 2010 |
|
}, |
|
{ |
|
"epoch": 32.32, |
|
"learning_rate": 0.0006748387096774193, |
|
"loss": 0.243, |
|
"step": 2020 |
|
}, |
|
{ |
|
"epoch": 32.48, |
|
"learning_rate": 0.0006732258064516129, |
|
"loss": 0.2465, |
|
"step": 2030 |
|
}, |
|
{ |
|
"epoch": 32.64, |
|
"learning_rate": 0.0006716129032258065, |
|
"loss": 0.2352, |
|
"step": 2040 |
|
}, |
|
{ |
|
"epoch": 32.8, |
|
"learning_rate": 0.00067, |
|
"loss": 0.2314, |
|
"step": 2050 |
|
}, |
|
{ |
|
"epoch": 32.96, |
|
"learning_rate": 0.0006683870967741935, |
|
"loss": 0.2425, |
|
"step": 2060 |
|
}, |
|
{ |
|
"epoch": 32.99, |
|
"step": 2062, |
|
"train_accuracy": 0.9521839944851789, |
|
"train_f1": 0.9519406193802002, |
|
"train_loss": 0.13532106578350067, |
|
"train_precision": 0.9520376150741188, |
|
"train_recall": 0.9521839944851789, |
|
"train_runtime": 253.863, |
|
"train_samples_per_second": 62.857, |
|
"train_steps_per_second": 0.985 |
|
}, |
|
{ |
|
"epoch": 32.99, |
|
"eval_accuracy": 0.8900789177001127, |
|
"eval_f1": 0.8892207946311137, |
|
"eval_loss": 0.41321179270744324, |
|
"eval_precision": 0.889613661345136, |
|
"eval_recall": 0.8900789177001127, |
|
"eval_runtime": 34.1249, |
|
"eval_samples_per_second": 51.985, |
|
"eval_steps_per_second": 0.821, |
|
"step": 2062 |
|
}, |
|
{ |
|
"epoch": 33.12, |
|
"learning_rate": 0.0006667741935483871, |
|
"loss": 0.2533, |
|
"step": 2070 |
|
}, |
|
{ |
|
"epoch": 33.28, |
|
"learning_rate": 0.0006651612903225807, |
|
"loss": 0.2495, |
|
"step": 2080 |
|
}, |
|
{ |
|
"epoch": 33.44, |
|
"learning_rate": 0.0006635483870967743, |
|
"loss": 0.2216, |
|
"step": 2090 |
|
}, |
|
{ |
|
"epoch": 33.6, |
|
"learning_rate": 0.0006619354838709678, |
|
"loss": 0.2334, |
|
"step": 2100 |
|
}, |
|
{ |
|
"epoch": 33.76, |
|
"learning_rate": 0.0006603225806451613, |
|
"loss": 0.209, |
|
"step": 2110 |
|
}, |
|
{ |
|
"epoch": 33.92, |
|
"learning_rate": 0.0006587096774193548, |
|
"loss": 0.2319, |
|
"step": 2120 |
|
}, |
|
{ |
|
"epoch": 34.0, |
|
"step": 2125, |
|
"train_accuracy": 0.9527480102776211, |
|
"train_f1": 0.9523272165039456, |
|
"train_loss": 0.13454996049404144, |
|
"train_precision": 0.9527286937272258, |
|
"train_recall": 0.9527480102776211, |
|
"train_runtime": 253.9192, |
|
"train_samples_per_second": 62.843, |
|
"train_steps_per_second": 0.985 |
|
}, |
|
{ |
|
"epoch": 34.0, |
|
"eval_accuracy": 0.8906426155580609, |
|
"eval_f1": 0.8896475365939425, |
|
"eval_loss": 0.3986554443836212, |
|
"eval_precision": 0.889369678049395, |
|
"eval_recall": 0.8906426155580609, |
|
"eval_runtime": 32.2322, |
|
"eval_samples_per_second": 55.038, |
|
"eval_steps_per_second": 0.869, |
|
"step": 2125 |
|
}, |
|
{ |
|
"epoch": 34.08, |
|
"learning_rate": 0.0006570967741935484, |
|
"loss": 0.2142, |
|
"step": 2130 |
|
}, |
|
{ |
|
"epoch": 34.24, |
|
"learning_rate": 0.0006554838709677419, |
|
"loss": 0.195, |
|
"step": 2140 |
|
}, |
|
{ |
|
"epoch": 34.4, |
|
"learning_rate": 0.0006538709677419356, |
|
"loss": 0.2257, |
|
"step": 2150 |
|
}, |
|
{ |
|
"epoch": 34.56, |
|
"learning_rate": 0.000652258064516129, |
|
"loss": 0.2191, |
|
"step": 2160 |
|
}, |
|
{ |
|
"epoch": 34.72, |
|
"learning_rate": 0.0006506451612903226, |
|
"loss": 0.2472, |
|
"step": 2170 |
|
}, |
|
{ |
|
"epoch": 34.88, |
|
"learning_rate": 0.0006490322580645162, |
|
"loss": 0.256, |
|
"step": 2180 |
|
}, |
|
{ |
|
"epoch": 34.99, |
|
"step": 2187, |
|
"train_accuracy": 0.956633452403334, |
|
"train_f1": 0.9563227521739598, |
|
"train_loss": 0.13102850317955017, |
|
"train_precision": 0.9566100366343153, |
|
"train_recall": 0.956633452403334, |
|
"train_runtime": 255.8713, |
|
"train_samples_per_second": 62.363, |
|
"train_steps_per_second": 0.977 |
|
}, |
|
{ |
|
"epoch": 34.99, |
|
"eval_accuracy": 0.8878241262683202, |
|
"eval_f1": 0.8863562863477997, |
|
"eval_loss": 0.40525099635124207, |
|
"eval_precision": 0.8863594064224781, |
|
"eval_recall": 0.8878241262683202, |
|
"eval_runtime": 29.2139, |
|
"eval_samples_per_second": 60.725, |
|
"eval_steps_per_second": 0.958, |
|
"step": 2187 |
|
}, |
|
{ |
|
"epoch": 35.04, |
|
"learning_rate": 0.0006474193548387097, |
|
"loss": 0.2196, |
|
"step": 2190 |
|
}, |
|
{ |
|
"epoch": 35.2, |
|
"learning_rate": 0.0006458064516129032, |
|
"loss": 0.208, |
|
"step": 2200 |
|
}, |
|
{ |
|
"epoch": 35.36, |
|
"learning_rate": 0.0006441935483870967, |
|
"loss": 0.2125, |
|
"step": 2210 |
|
}, |
|
{ |
|
"epoch": 35.52, |
|
"learning_rate": 0.0006425806451612903, |
|
"loss": 0.234, |
|
"step": 2220 |
|
}, |
|
{ |
|
"epoch": 35.68, |
|
"learning_rate": 0.0006409677419354839, |
|
"loss": 0.2161, |
|
"step": 2230 |
|
}, |
|
{ |
|
"epoch": 35.84, |
|
"learning_rate": 0.0006393548387096775, |
|
"loss": 0.2384, |
|
"step": 2240 |
|
}, |
|
{ |
|
"epoch": 36.0, |
|
"learning_rate": 0.000637741935483871, |
|
"loss": 0.2005, |
|
"step": 2250 |
|
}, |
|
{ |
|
"epoch": 36.0, |
|
"step": 2250, |
|
"train_accuracy": 0.9563201102964216, |
|
"train_f1": 0.9559487475587907, |
|
"train_loss": 0.1280374825000763, |
|
"train_precision": 0.95649817681943, |
|
"train_recall": 0.9563201102964216, |
|
"train_runtime": 249.7425, |
|
"train_samples_per_second": 63.894, |
|
"train_steps_per_second": 1.001 |
|
}, |
|
{ |
|
"epoch": 36.0, |
|
"eval_accuracy": 0.8906426155580609, |
|
"eval_f1": 0.8889303745678712, |
|
"eval_loss": 0.42412662506103516, |
|
"eval_precision": 0.8905735232548874, |
|
"eval_recall": 0.8906426155580609, |
|
"eval_runtime": 29.236, |
|
"eval_samples_per_second": 60.679, |
|
"eval_steps_per_second": 0.958, |
|
"step": 2250 |
|
}, |
|
{ |
|
"epoch": 36.16, |
|
"learning_rate": 0.0006361290322580645, |
|
"loss": 0.2062, |
|
"step": 2260 |
|
}, |
|
{ |
|
"epoch": 36.32, |
|
"learning_rate": 0.0006345161290322581, |
|
"loss": 0.2251, |
|
"step": 2270 |
|
}, |
|
{ |
|
"epoch": 36.48, |
|
"learning_rate": 0.0006329032258064516, |
|
"loss": 0.2086, |
|
"step": 2280 |
|
}, |
|
{ |
|
"epoch": 36.64, |
|
"learning_rate": 0.0006312903225806452, |
|
"loss": 0.2239, |
|
"step": 2290 |
|
}, |
|
{ |
|
"epoch": 36.8, |
|
"learning_rate": 0.0006296774193548387, |
|
"loss": 0.2053, |
|
"step": 2300 |
|
}, |
|
{ |
|
"epoch": 36.96, |
|
"learning_rate": 0.0006280645161290322, |
|
"loss": 0.2151, |
|
"step": 2310 |
|
}, |
|
{ |
|
"epoch": 36.99, |
|
"step": 2312, |
|
"train_accuracy": 0.9576361471454534, |
|
"train_f1": 0.9574828276125282, |
|
"train_loss": 0.12214481085538864, |
|
"train_precision": 0.9575674620543635, |
|
"train_recall": 0.9576361471454534, |
|
"train_runtime": 250.154, |
|
"train_samples_per_second": 63.789, |
|
"train_steps_per_second": 0.999 |
|
}, |
|
{ |
|
"epoch": 36.99, |
|
"eval_accuracy": 0.8928974069898534, |
|
"eval_f1": 0.8924893933635943, |
|
"eval_loss": 0.44935598969459534, |
|
"eval_precision": 0.89342937260661, |
|
"eval_recall": 0.8928974069898534, |
|
"eval_runtime": 28.948, |
|
"eval_samples_per_second": 61.282, |
|
"eval_steps_per_second": 0.967, |
|
"step": 2312 |
|
}, |
|
{ |
|
"epoch": 37.12, |
|
"learning_rate": 0.0006264516129032259, |
|
"loss": 0.2049, |
|
"step": 2320 |
|
}, |
|
{ |
|
"epoch": 37.28, |
|
"learning_rate": 0.0006248387096774194, |
|
"loss": 0.2165, |
|
"step": 2330 |
|
}, |
|
{ |
|
"epoch": 37.44, |
|
"learning_rate": 0.0006232258064516129, |
|
"loss": 0.2106, |
|
"step": 2340 |
|
}, |
|
{ |
|
"epoch": 37.6, |
|
"learning_rate": 0.0006216129032258064, |
|
"loss": 0.211, |
|
"step": 2350 |
|
}, |
|
{ |
|
"epoch": 37.76, |
|
"learning_rate": 0.00062, |
|
"loss": 0.1914, |
|
"step": 2360 |
|
}, |
|
{ |
|
"epoch": 37.92, |
|
"learning_rate": 0.0006183870967741936, |
|
"loss": 0.2264, |
|
"step": 2370 |
|
}, |
|
{ |
|
"epoch": 38.0, |
|
"step": 2375, |
|
"train_accuracy": 0.9594535313655449, |
|
"train_f1": 0.9591420123249457, |
|
"train_loss": 0.11748312413692474, |
|
"train_precision": 0.9594846416905936, |
|
"train_recall": 0.9594535313655449, |
|
"train_runtime": 250.2463, |
|
"train_samples_per_second": 63.765, |
|
"train_steps_per_second": 0.999 |
|
}, |
|
{ |
|
"epoch": 38.0, |
|
"eval_accuracy": 0.8889515219842165, |
|
"eval_f1": 0.8874516370478664, |
|
"eval_loss": 0.39475908875465393, |
|
"eval_precision": 0.8871997983000491, |
|
"eval_recall": 0.8889515219842165, |
|
"eval_runtime": 29.3223, |
|
"eval_samples_per_second": 60.5, |
|
"eval_steps_per_second": 0.955, |
|
"step": 2375 |
|
}, |
|
{ |
|
"epoch": 38.08, |
|
"learning_rate": 0.0006167741935483871, |
|
"loss": 0.2018, |
|
"step": 2380 |
|
}, |
|
{ |
|
"epoch": 38.24, |
|
"learning_rate": 0.0006151612903225806, |
|
"loss": 0.2047, |
|
"step": 2390 |
|
}, |
|
{ |
|
"epoch": 38.4, |
|
"learning_rate": 0.0006135483870967742, |
|
"loss": 0.1931, |
|
"step": 2400 |
|
}, |
|
{ |
|
"epoch": 38.56, |
|
"learning_rate": 0.0006119354838709678, |
|
"loss": 0.1973, |
|
"step": 2410 |
|
}, |
|
{ |
|
"epoch": 38.72, |
|
"learning_rate": 0.0006103225806451613, |
|
"loss": 0.1901, |
|
"step": 2420 |
|
}, |
|
{ |
|
"epoch": 38.88, |
|
"learning_rate": 0.0006087096774193549, |
|
"loss": 0.2128, |
|
"step": 2430 |
|
}, |
|
{ |
|
"epoch": 38.99, |
|
"step": 2437, |
|
"train_accuracy": 0.9598295418938397, |
|
"train_f1": 0.959583924650842, |
|
"train_loss": 0.12042330950498581, |
|
"train_precision": 0.9599378088639902, |
|
"train_recall": 0.9598295418938397, |
|
"train_runtime": 250.3192, |
|
"train_samples_per_second": 63.747, |
|
"train_steps_per_second": 0.999 |
|
}, |
|
{ |
|
"epoch": 38.99, |
|
"eval_accuracy": 0.8934611048478016, |
|
"eval_f1": 0.8921610181685623, |
|
"eval_loss": 0.4096975028514862, |
|
"eval_precision": 0.8925841926833548, |
|
"eval_recall": 0.8934611048478016, |
|
"eval_runtime": 29.0714, |
|
"eval_samples_per_second": 61.022, |
|
"eval_steps_per_second": 0.963, |
|
"step": 2437 |
|
}, |
|
{ |
|
"epoch": 39.04, |
|
"learning_rate": 0.0006070967741935484, |
|
"loss": 0.2022, |
|
"step": 2440 |
|
}, |
|
{ |
|
"epoch": 39.2, |
|
"learning_rate": 0.0006054838709677419, |
|
"loss": 0.2015, |
|
"step": 2450 |
|
}, |
|
{ |
|
"epoch": 39.36, |
|
"learning_rate": 0.0006038709677419355, |
|
"loss": 0.1906, |
|
"step": 2460 |
|
}, |
|
{ |
|
"epoch": 39.52, |
|
"learning_rate": 0.000602258064516129, |
|
"loss": 0.2003, |
|
"step": 2470 |
|
}, |
|
{ |
|
"epoch": 39.68, |
|
"learning_rate": 0.0006006451612903226, |
|
"loss": 0.2248, |
|
"step": 2480 |
|
}, |
|
{ |
|
"epoch": 39.84, |
|
"learning_rate": 0.0005990322580645161, |
|
"loss": 0.1946, |
|
"step": 2490 |
|
}, |
|
{ |
|
"epoch": 40.0, |
|
"learning_rate": 0.0005974193548387097, |
|
"loss": 0.2025, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 40.0, |
|
"step": 2500, |
|
"train_accuracy": 0.9597668734724573, |
|
"train_f1": 0.9596223430089906, |
|
"train_loss": 0.11334564536809921, |
|
"train_precision": 0.9597271475233058, |
|
"train_recall": 0.9597668734724573, |
|
"train_runtime": 249.5517, |
|
"train_samples_per_second": 63.943, |
|
"train_steps_per_second": 1.002 |
|
}, |
|
{ |
|
"epoch": 40.0, |
|
"eval_accuracy": 0.8906426155580609, |
|
"eval_f1": 0.8896192336703185, |
|
"eval_loss": 0.4116363823413849, |
|
"eval_precision": 0.8906240785065708, |
|
"eval_recall": 0.8906426155580609, |
|
"eval_runtime": 29.0689, |
|
"eval_samples_per_second": 61.027, |
|
"eval_steps_per_second": 0.963, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 40.16, |
|
"learning_rate": 0.0005958064516129033, |
|
"loss": 0.1783, |
|
"step": 2510 |
|
}, |
|
{ |
|
"epoch": 40.32, |
|
"learning_rate": 0.0005941935483870968, |
|
"loss": 0.1915, |
|
"step": 2520 |
|
}, |
|
{ |
|
"epoch": 40.48, |
|
"learning_rate": 0.0005925806451612903, |
|
"loss": 0.2113, |
|
"step": 2530 |
|
}, |
|
{ |
|
"epoch": 40.64, |
|
"learning_rate": 0.0005909677419354838, |
|
"loss": 0.1906, |
|
"step": 2540 |
|
}, |
|
{ |
|
"epoch": 40.8, |
|
"learning_rate": 0.0005893548387096774, |
|
"loss": 0.1835, |
|
"step": 2550 |
|
}, |
|
{ |
|
"epoch": 40.96, |
|
"learning_rate": 0.0005877419354838711, |
|
"loss": 0.2171, |
|
"step": 2560 |
|
}, |
|
{ |
|
"epoch": 40.99, |
|
"step": 2562, |
|
"train_accuracy": 0.9614589208497838, |
|
"train_f1": 0.9612864417727561, |
|
"train_loss": 0.11530015617609024, |
|
"train_precision": 0.9614218707043837, |
|
"train_recall": 0.9614589208497838, |
|
"train_runtime": 250.011, |
|
"train_samples_per_second": 63.825, |
|
"train_steps_per_second": 1.0 |
|
}, |
|
{ |
|
"epoch": 40.99, |
|
"eval_accuracy": 0.8917700112739572, |
|
"eval_f1": 0.890807210174242, |
|
"eval_loss": 0.39598962664604187, |
|
"eval_precision": 0.8908114942653367, |
|
"eval_recall": 0.8917700112739572, |
|
"eval_runtime": 29.1379, |
|
"eval_samples_per_second": 60.883, |
|
"eval_steps_per_second": 0.961, |
|
"step": 2562 |
|
}, |
|
{ |
|
"epoch": 41.12, |
|
"learning_rate": 0.0005861290322580646, |
|
"loss": 0.1964, |
|
"step": 2570 |
|
}, |
|
{ |
|
"epoch": 41.28, |
|
"learning_rate": 0.0005845161290322581, |
|
"loss": 0.1827, |
|
"step": 2580 |
|
}, |
|
{ |
|
"epoch": 41.44, |
|
"learning_rate": 0.0005829032258064516, |
|
"loss": 0.2079, |
|
"step": 2590 |
|
}, |
|
{ |
|
"epoch": 41.6, |
|
"learning_rate": 0.0005812903225806452, |
|
"loss": 0.2013, |
|
"step": 2600 |
|
}, |
|
{ |
|
"epoch": 41.76, |
|
"learning_rate": 0.0005796774193548387, |
|
"loss": 0.2037, |
|
"step": 2610 |
|
}, |
|
{ |
|
"epoch": 41.92, |
|
"learning_rate": 0.0005780645161290323, |
|
"loss": 0.2036, |
|
"step": 2620 |
|
}, |
|
{ |
|
"epoch": 42.0, |
|
"step": 2625, |
|
"train_accuracy": 0.9622736103277558, |
|
"train_f1": 0.9620354688265563, |
|
"train_loss": 0.10922261327505112, |
|
"train_precision": 0.9625027768138478, |
|
"train_recall": 0.9622736103277558, |
|
"train_runtime": 249.7106, |
|
"train_samples_per_second": 63.902, |
|
"train_steps_per_second": 1.001 |
|
}, |
|
{ |
|
"epoch": 42.0, |
|
"eval_accuracy": 0.8928974069898534, |
|
"eval_f1": 0.891600694267099, |
|
"eval_loss": 0.3954656422138214, |
|
"eval_precision": 0.8932440084981708, |
|
"eval_recall": 0.8928974069898534, |
|
"eval_runtime": 29.1604, |
|
"eval_samples_per_second": 60.836, |
|
"eval_steps_per_second": 0.96, |
|
"step": 2625 |
|
}, |
|
{ |
|
"epoch": 42.08, |
|
"learning_rate": 0.0005764516129032257, |
|
"loss": 0.1971, |
|
"step": 2630 |
|
}, |
|
{ |
|
"epoch": 42.24, |
|
"learning_rate": 0.0005748387096774194, |
|
"loss": 0.1976, |
|
"step": 2640 |
|
}, |
|
{ |
|
"epoch": 42.4, |
|
"learning_rate": 0.000573225806451613, |
|
"loss": 0.2098, |
|
"step": 2650 |
|
}, |
|
{ |
|
"epoch": 42.56, |
|
"learning_rate": 0.0005716129032258065, |
|
"loss": 0.1833, |
|
"step": 2660 |
|
}, |
|
{ |
|
"epoch": 42.72, |
|
"learning_rate": 0.00057, |
|
"loss": 0.1936, |
|
"step": 2670 |
|
}, |
|
{ |
|
"epoch": 42.88, |
|
"learning_rate": 0.0005683870967741935, |
|
"loss": 0.1849, |
|
"step": 2680 |
|
}, |
|
{ |
|
"epoch": 42.99, |
|
"step": 2687, |
|
"train_accuracy": 0.9676004261452654, |
|
"train_f1": 0.9675534222659815, |
|
"train_loss": 0.10426949709653854, |
|
"train_precision": 0.9676367935294685, |
|
"train_recall": 0.9676004261452654, |
|
"train_runtime": 251.7545, |
|
"train_samples_per_second": 63.383, |
|
"train_steps_per_second": 0.993 |
|
}, |
|
{ |
|
"epoch": 42.99, |
|
"eval_accuracy": 0.8996617812852311, |
|
"eval_f1": 0.8986036298251875, |
|
"eval_loss": 0.3904741108417511, |
|
"eval_precision": 0.8992691335353804, |
|
"eval_recall": 0.8996617812852311, |
|
"eval_runtime": 29.0995, |
|
"eval_samples_per_second": 60.963, |
|
"eval_steps_per_second": 0.962, |
|
"step": 2687 |
|
}, |
|
{ |
|
"epoch": 43.04, |
|
"learning_rate": 0.0005667741935483871, |
|
"loss": 0.2041, |
|
"step": 2690 |
|
}, |
|
{ |
|
"epoch": 43.2, |
|
"learning_rate": 0.0005651612903225807, |
|
"loss": 0.174, |
|
"step": 2700 |
|
}, |
|
{ |
|
"epoch": 43.36, |
|
"learning_rate": 0.0005635483870967742, |
|
"loss": 0.1792, |
|
"step": 2710 |
|
}, |
|
{ |
|
"epoch": 43.52, |
|
"learning_rate": 0.0005619354838709677, |
|
"loss": 0.1688, |
|
"step": 2720 |
|
}, |
|
{ |
|
"epoch": 43.68, |
|
"learning_rate": 0.0005603225806451613, |
|
"loss": 0.1741, |
|
"step": 2730 |
|
}, |
|
{ |
|
"epoch": 43.84, |
|
"learning_rate": 0.0005587096774193549, |
|
"loss": 0.2102, |
|
"step": 2740 |
|
}, |
|
{ |
|
"epoch": 44.0, |
|
"learning_rate": 0.0005570967741935484, |
|
"loss": 0.1852, |
|
"step": 2750 |
|
}, |
|
{ |
|
"epoch": 44.0, |
|
"step": 2750, |
|
"train_accuracy": 0.964843015604437, |
|
"train_f1": 0.9647050151290405, |
|
"train_loss": 0.10291223973035812, |
|
"train_precision": 0.9649053412080801, |
|
"train_recall": 0.964843015604437, |
|
"train_runtime": 250.3464, |
|
"train_samples_per_second": 63.74, |
|
"train_steps_per_second": 0.999 |
|
}, |
|
{ |
|
"epoch": 44.0, |
|
"eval_accuracy": 0.891206313416009, |
|
"eval_f1": 0.8900612906872463, |
|
"eval_loss": 0.42409268021583557, |
|
"eval_precision": 0.891982003380522, |
|
"eval_recall": 0.891206313416009, |
|
"eval_runtime": 29.1706, |
|
"eval_samples_per_second": 60.815, |
|
"eval_steps_per_second": 0.96, |
|
"step": 2750 |
|
}, |
|
{ |
|
"epoch": 44.16, |
|
"learning_rate": 0.000555483870967742, |
|
"loss": 0.1816, |
|
"step": 2760 |
|
}, |
|
{ |
|
"epoch": 44.32, |
|
"learning_rate": 0.0005538709677419355, |
|
"loss": 0.1765, |
|
"step": 2770 |
|
}, |
|
{ |
|
"epoch": 44.48, |
|
"learning_rate": 0.000552258064516129, |
|
"loss": 0.1748, |
|
"step": 2780 |
|
}, |
|
{ |
|
"epoch": 44.64, |
|
"learning_rate": 0.0005506451612903226, |
|
"loss": 0.2168, |
|
"step": 2790 |
|
}, |
|
{ |
|
"epoch": 44.8, |
|
"learning_rate": 0.0005490322580645161, |
|
"loss": 0.215, |
|
"step": 2800 |
|
}, |
|
{ |
|
"epoch": 44.96, |
|
"learning_rate": 0.0005474193548387097, |
|
"loss": 0.1721, |
|
"step": 2810 |
|
}, |
|
{ |
|
"epoch": 44.99, |
|
"step": 2812, |
|
"train_accuracy": 0.9665350629817635, |
|
"train_f1": 0.9664032195703065, |
|
"train_loss": 0.09303626418113708, |
|
"train_precision": 0.9665823467276443, |
|
"train_recall": 0.9665350629817635, |
|
"train_runtime": 250.871, |
|
"train_samples_per_second": 63.606, |
|
"train_steps_per_second": 0.997 |
|
}, |
|
{ |
|
"epoch": 44.99, |
|
"eval_accuracy": 0.8962795941375423, |
|
"eval_f1": 0.8948599549258702, |
|
"eval_loss": 0.4103808104991913, |
|
"eval_precision": 0.8955637765539853, |
|
"eval_recall": 0.8962795941375423, |
|
"eval_runtime": 29.0827, |
|
"eval_samples_per_second": 60.998, |
|
"eval_steps_per_second": 0.963, |
|
"step": 2812 |
|
}, |
|
{ |
|
"epoch": 45.12, |
|
"learning_rate": 0.0005458064516129032, |
|
"loss": 0.1553, |
|
"step": 2820 |
|
}, |
|
{ |
|
"epoch": 45.28, |
|
"learning_rate": 0.0005441935483870968, |
|
"loss": 0.1801, |
|
"step": 2830 |
|
}, |
|
{ |
|
"epoch": 45.44, |
|
"learning_rate": 0.0005425806451612904, |
|
"loss": 0.1815, |
|
"step": 2840 |
|
}, |
|
{ |
|
"epoch": 45.6, |
|
"learning_rate": 0.0005409677419354839, |
|
"loss": 0.2039, |
|
"step": 2850 |
|
}, |
|
{ |
|
"epoch": 45.76, |
|
"learning_rate": 0.0005393548387096774, |
|
"loss": 0.1867, |
|
"step": 2860 |
|
}, |
|
{ |
|
"epoch": 45.92, |
|
"learning_rate": 0.0005377419354838709, |
|
"loss": 0.186, |
|
"step": 2870 |
|
}, |
|
{ |
|
"epoch": 46.0, |
|
"step": 2875, |
|
"train_accuracy": 0.9643416682333772, |
|
"train_f1": 0.9642012339068207, |
|
"train_loss": 0.09887776523828506, |
|
"train_precision": 0.9644991194334305, |
|
"train_recall": 0.9643416682333772, |
|
"train_runtime": 254.5578, |
|
"train_samples_per_second": 62.685, |
|
"train_steps_per_second": 0.982 |
|
}, |
|
{ |
|
"epoch": 46.0, |
|
"eval_accuracy": 0.8917700112739572, |
|
"eval_f1": 0.8901319153136237, |
|
"eval_loss": 0.4248127341270447, |
|
"eval_precision": 0.8912530636364911, |
|
"eval_recall": 0.8917700112739572, |
|
"eval_runtime": 29.5608, |
|
"eval_samples_per_second": 60.012, |
|
"eval_steps_per_second": 0.947, |
|
"step": 2875 |
|
}, |
|
{ |
|
"epoch": 46.08, |
|
"learning_rate": 0.0005361290322580645, |
|
"loss": 0.1569, |
|
"step": 2880 |
|
}, |
|
{ |
|
"epoch": 46.24, |
|
"learning_rate": 0.0005345161290322581, |
|
"loss": 0.1876, |
|
"step": 2890 |
|
}, |
|
{ |
|
"epoch": 46.4, |
|
"learning_rate": 0.0005329032258064517, |
|
"loss": 0.1667, |
|
"step": 2900 |
|
}, |
|
{ |
|
"epoch": 46.56, |
|
"learning_rate": 0.0005312903225806452, |
|
"loss": 0.169, |
|
"step": 2910 |
|
}, |
|
{ |
|
"epoch": 46.72, |
|
"learning_rate": 0.0005296774193548387, |
|
"loss": 0.1803, |
|
"step": 2920 |
|
}, |
|
{ |
|
"epoch": 46.88, |
|
"learning_rate": 0.0005280645161290323, |
|
"loss": 0.1811, |
|
"step": 2930 |
|
}, |
|
{ |
|
"epoch": 46.99, |
|
"step": 2937, |
|
"train_accuracy": 0.9637149840195526, |
|
"train_f1": 0.9634798755891425, |
|
"train_loss": 0.10527843236923218, |
|
"train_precision": 0.9638723537275108, |
|
"train_recall": 0.9637149840195526, |
|
"train_runtime": 254.7727, |
|
"train_samples_per_second": 62.632, |
|
"train_steps_per_second": 0.981 |
|
}, |
|
{ |
|
"epoch": 46.99, |
|
"eval_accuracy": 0.9013528748590756, |
|
"eval_f1": 0.8999103289546431, |
|
"eval_loss": 0.42358672618865967, |
|
"eval_precision": 0.9005857132412932, |
|
"eval_recall": 0.9013528748590756, |
|
"eval_runtime": 29.8042, |
|
"eval_samples_per_second": 59.522, |
|
"eval_steps_per_second": 0.939, |
|
"step": 2937 |
|
}, |
|
{ |
|
"epoch": 47.04, |
|
"learning_rate": 0.0005264516129032258, |
|
"loss": 0.1698, |
|
"step": 2940 |
|
}, |
|
{ |
|
"epoch": 47.2, |
|
"learning_rate": 0.0005248387096774193, |
|
"loss": 0.1744, |
|
"step": 2950 |
|
}, |
|
{ |
|
"epoch": 47.36, |
|
"learning_rate": 0.0005232258064516128, |
|
"loss": 0.1718, |
|
"step": 2960 |
|
}, |
|
{ |
|
"epoch": 47.52, |
|
"learning_rate": 0.0005216129032258065, |
|
"loss": 0.1777, |
|
"step": 2970 |
|
}, |
|
{ |
|
"epoch": 47.68, |
|
"learning_rate": 0.0005200000000000001, |
|
"loss": 0.1872, |
|
"step": 2980 |
|
}, |
|
{ |
|
"epoch": 47.84, |
|
"learning_rate": 0.0005183870967741936, |
|
"loss": 0.1586, |
|
"step": 2990 |
|
}, |
|
{ |
|
"epoch": 48.0, |
|
"learning_rate": 0.0005167741935483871, |
|
"loss": 0.1891, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 48.0, |
|
"step": 3000, |
|
"train_accuracy": 0.9668484050886759, |
|
"train_f1": 0.966687633803237, |
|
"train_loss": 0.09668122977018356, |
|
"train_precision": 0.9668284956038484, |
|
"train_recall": 0.9668484050886759, |
|
"train_runtime": 255.4386, |
|
"train_samples_per_second": 62.469, |
|
"train_steps_per_second": 0.979 |
|
}, |
|
{ |
|
"epoch": 48.0, |
|
"eval_accuracy": 0.90304396843292, |
|
"eval_f1": 0.9023176970973613, |
|
"eval_loss": 0.40747305750846863, |
|
"eval_precision": 0.902276892363872, |
|
"eval_recall": 0.90304396843292, |
|
"eval_runtime": 29.6296, |
|
"eval_samples_per_second": 59.873, |
|
"eval_steps_per_second": 0.945, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 48.16, |
|
"learning_rate": 0.0005151612903225806, |
|
"loss": 0.1566, |
|
"step": 3010 |
|
}, |
|
{ |
|
"epoch": 48.32, |
|
"learning_rate": 0.0005135483870967742, |
|
"loss": 0.1511, |
|
"step": 3020 |
|
}, |
|
{ |
|
"epoch": 48.48, |
|
"learning_rate": 0.0005119354838709677, |
|
"loss": 0.1914, |
|
"step": 3030 |
|
}, |
|
{ |
|
"epoch": 48.64, |
|
"learning_rate": 0.0005103225806451613, |
|
"loss": 0.1828, |
|
"step": 3040 |
|
}, |
|
{ |
|
"epoch": 48.8, |
|
"learning_rate": 0.0005087096774193549, |
|
"loss": 0.1749, |
|
"step": 3050 |
|
}, |
|
{ |
|
"epoch": 48.96, |
|
"learning_rate": 0.0005070967741935484, |
|
"loss": 0.1791, |
|
"step": 3060 |
|
}, |
|
{ |
|
"epoch": 48.99, |
|
"step": 3062, |
|
"train_accuracy": 0.9676630945666479, |
|
"train_f1": 0.9675103889274802, |
|
"train_loss": 0.09363168478012085, |
|
"train_precision": 0.9676662039614543, |
|
"train_recall": 0.9676630945666479, |
|
"train_runtime": 255.9566, |
|
"train_samples_per_second": 62.343, |
|
"train_steps_per_second": 0.977 |
|
}, |
|
{ |
|
"epoch": 48.99, |
|
"eval_accuracy": 0.8996617812852311, |
|
"eval_f1": 0.8987006309929039, |
|
"eval_loss": 0.4219958186149597, |
|
"eval_precision": 0.8986787206496698, |
|
"eval_recall": 0.8996617812852311, |
|
"eval_runtime": 29.8773, |
|
"eval_samples_per_second": 59.376, |
|
"eval_steps_per_second": 0.937, |
|
"step": 3062 |
|
}, |
|
{ |
|
"epoch": 49.12, |
|
"learning_rate": 0.000505483870967742, |
|
"loss": 0.1666, |
|
"step": 3070 |
|
}, |
|
{ |
|
"epoch": 49.28, |
|
"learning_rate": 0.0005038709677419355, |
|
"loss": 0.1626, |
|
"step": 3080 |
|
}, |
|
{ |
|
"epoch": 49.44, |
|
"learning_rate": 0.000502258064516129, |
|
"loss": 0.1771, |
|
"step": 3090 |
|
}, |
|
{ |
|
"epoch": 49.6, |
|
"learning_rate": 0.0005006451612903225, |
|
"loss": 0.179, |
|
"step": 3100 |
|
}, |
|
{ |
|
"epoch": 49.76, |
|
"learning_rate": 0.0004990322580645161, |
|
"loss": 0.1634, |
|
"step": 3110 |
|
}, |
|
{ |
|
"epoch": 49.92, |
|
"learning_rate": 0.0004974193548387097, |
|
"loss": 0.1702, |
|
"step": 3120 |
|
}, |
|
{ |
|
"epoch": 50.0, |
|
"step": 3125, |
|
"train_accuracy": 0.9695431472081218, |
|
"train_f1": 0.9694274832881341, |
|
"train_loss": 0.09215661138296127, |
|
"train_precision": 0.9695025177310069, |
|
"train_recall": 0.9695431472081218, |
|
"train_runtime": 257.2202, |
|
"train_samples_per_second": 62.036, |
|
"train_steps_per_second": 0.972 |
|
}, |
|
{ |
|
"epoch": 50.0, |
|
"eval_accuracy": 0.8928974069898534, |
|
"eval_f1": 0.8922038394852897, |
|
"eval_loss": 0.4357841908931732, |
|
"eval_precision": 0.8922256622710033, |
|
"eval_recall": 0.8928974069898534, |
|
"eval_runtime": 30.2592, |
|
"eval_samples_per_second": 58.627, |
|
"eval_steps_per_second": 0.925, |
|
"step": 3125 |
|
}, |
|
{ |
|
"epoch": 50.08, |
|
"learning_rate": 0.0004958064516129032, |
|
"loss": 0.1738, |
|
"step": 3130 |
|
}, |
|
{ |
|
"epoch": 50.24, |
|
"learning_rate": 0.0004941935483870968, |
|
"loss": 0.1781, |
|
"step": 3140 |
|
}, |
|
{ |
|
"epoch": 50.4, |
|
"learning_rate": 0.0004925806451612903, |
|
"loss": 0.1814, |
|
"step": 3150 |
|
}, |
|
{ |
|
"epoch": 50.56, |
|
"learning_rate": 0.0004909677419354839, |
|
"loss": 0.1766, |
|
"step": 3160 |
|
}, |
|
{ |
|
"epoch": 50.72, |
|
"learning_rate": 0.0004893548387096775, |
|
"loss": 0.1689, |
|
"step": 3170 |
|
}, |
|
{ |
|
"epoch": 50.88, |
|
"learning_rate": 0.00048774193548387095, |
|
"loss": 0.1667, |
|
"step": 3180 |
|
}, |
|
{ |
|
"epoch": 50.99, |
|
"step": 3187, |
|
"train_accuracy": 0.9679137682521777, |
|
"train_f1": 0.9678451858925848, |
|
"train_loss": 0.08850996196269989, |
|
"train_precision": 0.9680124054185439, |
|
"train_recall": 0.9679137682521777, |
|
"train_runtime": 259.9309, |
|
"train_samples_per_second": 61.389, |
|
"train_steps_per_second": 0.962 |
|
}, |
|
{ |
|
"epoch": 50.99, |
|
"eval_accuracy": 0.8957158962795941, |
|
"eval_f1": 0.8947220269155864, |
|
"eval_loss": 0.4486236274242401, |
|
"eval_precision": 0.8959867186310805, |
|
"eval_recall": 0.8957158962795941, |
|
"eval_runtime": 30.0872, |
|
"eval_samples_per_second": 58.962, |
|
"eval_steps_per_second": 0.931, |
|
"step": 3187 |
|
}, |
|
{ |
|
"epoch": 51.04, |
|
"learning_rate": 0.00048612903225806457, |
|
"loss": 0.1506, |
|
"step": 3190 |
|
}, |
|
{ |
|
"epoch": 51.2, |
|
"learning_rate": 0.00048451612903225807, |
|
"loss": 0.1555, |
|
"step": 3200 |
|
}, |
|
{ |
|
"epoch": 51.36, |
|
"learning_rate": 0.00048290322580645163, |
|
"loss": 0.164, |
|
"step": 3210 |
|
}, |
|
{ |
|
"epoch": 51.52, |
|
"learning_rate": 0.00048129032258064513, |
|
"loss": 0.1574, |
|
"step": 3220 |
|
}, |
|
{ |
|
"epoch": 51.68, |
|
"learning_rate": 0.0004796774193548387, |
|
"loss": 0.1554, |
|
"step": 3230 |
|
}, |
|
{ |
|
"epoch": 51.84, |
|
"learning_rate": 0.0004780645161290323, |
|
"loss": 0.1653, |
|
"step": 3240 |
|
}, |
|
{ |
|
"epoch": 52.0, |
|
"learning_rate": 0.0004764516129032258, |
|
"loss": 0.1733, |
|
"step": 3250 |
|
}, |
|
{ |
|
"epoch": 52.0, |
|
"step": 3250, |
|
"train_accuracy": 0.9680391050949426, |
|
"train_f1": 0.9679543842076324, |
|
"train_loss": 0.09445594996213913, |
|
"train_precision": 0.9681396256853804, |
|
"train_recall": 0.9680391050949426, |
|
"train_runtime": 256.4705, |
|
"train_samples_per_second": 62.218, |
|
"train_steps_per_second": 0.975 |
|
}, |
|
{ |
|
"epoch": 52.0, |
|
"eval_accuracy": 0.8990980834272829, |
|
"eval_f1": 0.8984372111101244, |
|
"eval_loss": 0.43172532320022583, |
|
"eval_precision": 0.8994814917612028, |
|
"eval_recall": 0.8990980834272829, |
|
"eval_runtime": 29.5992, |
|
"eval_samples_per_second": 59.934, |
|
"eval_steps_per_second": 0.946, |
|
"step": 3250 |
|
}, |
|
{ |
|
"epoch": 52.16, |
|
"learning_rate": 0.00047483870967741937, |
|
"loss": 0.1639, |
|
"step": 3260 |
|
}, |
|
{ |
|
"epoch": 52.32, |
|
"learning_rate": 0.00047322580645161287, |
|
"loss": 0.1541, |
|
"step": 3270 |
|
}, |
|
{ |
|
"epoch": 52.48, |
|
"learning_rate": 0.0004716129032258065, |
|
"loss": 0.1554, |
|
"step": 3280 |
|
}, |
|
{ |
|
"epoch": 52.64, |
|
"learning_rate": 0.00047, |
|
"loss": 0.175, |
|
"step": 3290 |
|
}, |
|
{ |
|
"epoch": 52.8, |
|
"learning_rate": 0.00046838709677419354, |
|
"loss": 0.1697, |
|
"step": 3300 |
|
}, |
|
{ |
|
"epoch": 52.96, |
|
"learning_rate": 0.0004667741935483871, |
|
"loss": 0.1704, |
|
"step": 3310 |
|
}, |
|
{ |
|
"epoch": 52.99, |
|
"step": 3312, |
|
"train_accuracy": 0.9716112051137432, |
|
"train_f1": 0.9715237218187844, |
|
"train_loss": 0.08361362665891647, |
|
"train_precision": 0.9715640137675557, |
|
"train_recall": 0.9716112051137432, |
|
"train_runtime": 251.4627, |
|
"train_samples_per_second": 63.457, |
|
"train_steps_per_second": 0.994 |
|
}, |
|
{ |
|
"epoch": 52.99, |
|
"eval_accuracy": 0.9052987598647125, |
|
"eval_f1": 0.9044568554057598, |
|
"eval_loss": 0.41901707649230957, |
|
"eval_precision": 0.9045753701091548, |
|
"eval_recall": 0.9052987598647125, |
|
"eval_runtime": 29.1923, |
|
"eval_samples_per_second": 60.769, |
|
"eval_steps_per_second": 0.959, |
|
"step": 3312 |
|
}, |
|
{ |
|
"epoch": 53.12, |
|
"learning_rate": 0.00046516129032258066, |
|
"loss": 0.1537, |
|
"step": 3320 |
|
}, |
|
{ |
|
"epoch": 53.28, |
|
"learning_rate": 0.0004635483870967742, |
|
"loss": 0.158, |
|
"step": 3330 |
|
}, |
|
{ |
|
"epoch": 53.44, |
|
"learning_rate": 0.0004619354838709677, |
|
"loss": 0.1493, |
|
"step": 3340 |
|
}, |
|
{ |
|
"epoch": 53.6, |
|
"learning_rate": 0.0004603225806451613, |
|
"loss": 0.1429, |
|
"step": 3350 |
|
}, |
|
{ |
|
"epoch": 53.76, |
|
"learning_rate": 0.00045870967741935484, |
|
"loss": 0.1628, |
|
"step": 3360 |
|
}, |
|
{ |
|
"epoch": 53.92, |
|
"learning_rate": 0.0004570967741935484, |
|
"loss": 0.1584, |
|
"step": 3370 |
|
}, |
|
{ |
|
"epoch": 54.0, |
|
"step": 3375, |
|
"train_accuracy": 0.9703578366860939, |
|
"train_f1": 0.970311857800694, |
|
"train_loss": 0.08544992655515671, |
|
"train_precision": 0.9704579277168014, |
|
"train_recall": 0.9703578366860939, |
|
"train_runtime": 251.0811, |
|
"train_samples_per_second": 63.553, |
|
"train_steps_per_second": 0.996 |
|
}, |
|
{ |
|
"epoch": 54.0, |
|
"eval_accuracy": 0.9052987598647125, |
|
"eval_f1": 0.904599065142192, |
|
"eval_loss": 0.4305163323879242, |
|
"eval_precision": 0.9055272931459877, |
|
"eval_recall": 0.9052987598647125, |
|
"eval_runtime": 29.1269, |
|
"eval_samples_per_second": 60.906, |
|
"eval_steps_per_second": 0.961, |
|
"step": 3375 |
|
}, |
|
{ |
|
"epoch": 54.08, |
|
"learning_rate": 0.00045548387096774196, |
|
"loss": 0.1577, |
|
"step": 3380 |
|
}, |
|
{ |
|
"epoch": 54.24, |
|
"learning_rate": 0.00045387096774193546, |
|
"loss": 0.168, |
|
"step": 3390 |
|
}, |
|
{ |
|
"epoch": 54.4, |
|
"learning_rate": 0.00045225806451612907, |
|
"loss": 0.1541, |
|
"step": 3400 |
|
}, |
|
{ |
|
"epoch": 54.56, |
|
"learning_rate": 0.0004506451612903226, |
|
"loss": 0.1443, |
|
"step": 3410 |
|
}, |
|
{ |
|
"epoch": 54.72, |
|
"learning_rate": 0.00044903225806451613, |
|
"loss": 0.1363, |
|
"step": 3420 |
|
}, |
|
{ |
|
"epoch": 54.88, |
|
"learning_rate": 0.0004474193548387097, |
|
"loss": 0.1763, |
|
"step": 3430 |
|
}, |
|
{ |
|
"epoch": 54.99, |
|
"step": 3437, |
|
"train_accuracy": 0.9722378893275678, |
|
"train_f1": 0.9722304845282628, |
|
"train_loss": 0.08548293262720108, |
|
"train_precision": 0.9724014188580902, |
|
"train_recall": 0.9722378893275678, |
|
"train_runtime": 250.8193, |
|
"train_samples_per_second": 63.62, |
|
"train_steps_per_second": 0.997 |
|
}, |
|
{ |
|
"epoch": 54.99, |
|
"eval_accuracy": 0.8940248027057497, |
|
"eval_f1": 0.8945776482571843, |
|
"eval_loss": 0.4349919259548187, |
|
"eval_precision": 0.896683319174708, |
|
"eval_recall": 0.8940248027057497, |
|
"eval_runtime": 29.0389, |
|
"eval_samples_per_second": 61.09, |
|
"eval_steps_per_second": 0.964, |
|
"step": 3437 |
|
}, |
|
{ |
|
"epoch": 55.04, |
|
"learning_rate": 0.00044580645161290325, |
|
"loss": 0.163, |
|
"step": 3440 |
|
}, |
|
{ |
|
"epoch": 55.2, |
|
"learning_rate": 0.0004441935483870968, |
|
"loss": 0.1468, |
|
"step": 3450 |
|
}, |
|
{ |
|
"epoch": 55.36, |
|
"learning_rate": 0.0004425806451612903, |
|
"loss": 0.1356, |
|
"step": 3460 |
|
}, |
|
{ |
|
"epoch": 55.52, |
|
"learning_rate": 0.00044096774193548387, |
|
"loss": 0.1485, |
|
"step": 3470 |
|
}, |
|
{ |
|
"epoch": 55.68, |
|
"learning_rate": 0.00043935483870967743, |
|
"loss": 0.1444, |
|
"step": 3480 |
|
}, |
|
{ |
|
"epoch": 55.84, |
|
"learning_rate": 0.000437741935483871, |
|
"loss": 0.1463, |
|
"step": 3490 |
|
}, |
|
{ |
|
"epoch": 56.0, |
|
"learning_rate": 0.00043612903225806454, |
|
"loss": 0.1609, |
|
"step": 3500 |
|
}, |
|
{ |
|
"epoch": 56.0, |
|
"step": 3500, |
|
"train_accuracy": 0.9711725261640659, |
|
"train_f1": 0.9710418724528065, |
|
"train_loss": 0.08499421924352646, |
|
"train_precision": 0.9711871907063745, |
|
"train_recall": 0.9711725261640659, |
|
"train_runtime": 251.6401, |
|
"train_samples_per_second": 63.412, |
|
"train_steps_per_second": 0.993 |
|
}, |
|
{ |
|
"epoch": 56.0, |
|
"eval_accuracy": 0.90304396843292, |
|
"eval_f1": 0.901618221901619, |
|
"eval_loss": 0.4472709894180298, |
|
"eval_precision": 0.9023465256016576, |
|
"eval_recall": 0.90304396843292, |
|
"eval_runtime": 29.9118, |
|
"eval_samples_per_second": 59.308, |
|
"eval_steps_per_second": 0.936, |
|
"step": 3500 |
|
}, |
|
{ |
|
"epoch": 56.16, |
|
"learning_rate": 0.00043451612903225805, |
|
"loss": 0.1393, |
|
"step": 3510 |
|
}, |
|
{ |
|
"epoch": 56.32, |
|
"learning_rate": 0.00043290322580645166, |
|
"loss": 0.1481, |
|
"step": 3520 |
|
}, |
|
{ |
|
"epoch": 56.48, |
|
"learning_rate": 0.00043129032258064516, |
|
"loss": 0.1449, |
|
"step": 3530 |
|
}, |
|
{ |
|
"epoch": 56.64, |
|
"learning_rate": 0.0004296774193548387, |
|
"loss": 0.168, |
|
"step": 3540 |
|
}, |
|
{ |
|
"epoch": 56.8, |
|
"learning_rate": 0.0004280645161290322, |
|
"loss": 0.1722, |
|
"step": 3550 |
|
}, |
|
{ |
|
"epoch": 56.96, |
|
"learning_rate": 0.00042645161290322584, |
|
"loss": 0.1549, |
|
"step": 3560 |
|
}, |
|
{ |
|
"epoch": 56.99, |
|
"step": 3562, |
|
"train_accuracy": 0.9697311524722693, |
|
"train_f1": 0.96954160239289, |
|
"train_loss": 0.0850997045636177, |
|
"train_precision": 0.9698850921890346, |
|
"train_recall": 0.9697311524722693, |
|
"train_runtime": 250.5824, |
|
"train_samples_per_second": 63.68, |
|
"train_steps_per_second": 0.998 |
|
}, |
|
{ |
|
"epoch": 56.99, |
|
"eval_accuracy": 0.9041713641488163, |
|
"eval_f1": 0.9027359585690536, |
|
"eval_loss": 0.4477776885032654, |
|
"eval_precision": 0.9037863994127037, |
|
"eval_recall": 0.9041713641488163, |
|
"eval_runtime": 29.1274, |
|
"eval_samples_per_second": 60.905, |
|
"eval_steps_per_second": 0.961, |
|
"step": 3562 |
|
}, |
|
{ |
|
"epoch": 57.12, |
|
"learning_rate": 0.0004248387096774194, |
|
"loss": 0.1415, |
|
"step": 3570 |
|
}, |
|
{ |
|
"epoch": 57.28, |
|
"learning_rate": 0.0004232258064516129, |
|
"loss": 0.1557, |
|
"step": 3580 |
|
}, |
|
{ |
|
"epoch": 57.44, |
|
"learning_rate": 0.00042161290322580646, |
|
"loss": 0.143, |
|
"step": 3590 |
|
}, |
|
{ |
|
"epoch": 57.6, |
|
"learning_rate": 0.00042, |
|
"loss": 0.154, |
|
"step": 3600 |
|
}, |
|
{ |
|
"epoch": 57.76, |
|
"learning_rate": 0.0004183870967741936, |
|
"loss": 0.1325, |
|
"step": 3610 |
|
}, |
|
{ |
|
"epoch": 57.92, |
|
"learning_rate": 0.0004167741935483871, |
|
"loss": 0.1586, |
|
"step": 3620 |
|
}, |
|
{ |
|
"epoch": 58.0, |
|
"step": 3625, |
|
"train_accuracy": 0.9711098577426834, |
|
"train_f1": 0.9710190406318763, |
|
"train_loss": 0.08111045509576797, |
|
"train_precision": 0.971108783894692, |
|
"train_recall": 0.9711098577426834, |
|
"train_runtime": 252.5322, |
|
"train_samples_per_second": 63.188, |
|
"train_steps_per_second": 0.99 |
|
}, |
|
{ |
|
"epoch": 58.0, |
|
"eval_accuracy": 0.9024802705749718, |
|
"eval_f1": 0.9011546163080018, |
|
"eval_loss": 0.4446905255317688, |
|
"eval_precision": 0.9024443209930092, |
|
"eval_recall": 0.9024802705749718, |
|
"eval_runtime": 29.4234, |
|
"eval_samples_per_second": 60.292, |
|
"eval_steps_per_second": 0.952, |
|
"step": 3625 |
|
}, |
|
{ |
|
"epoch": 58.08, |
|
"learning_rate": 0.00041516129032258064, |
|
"loss": 0.1589, |
|
"step": 3630 |
|
}, |
|
{ |
|
"epoch": 58.24, |
|
"learning_rate": 0.00041354838709677425, |
|
"loss": 0.1368, |
|
"step": 3640 |
|
}, |
|
{ |
|
"epoch": 58.4, |
|
"learning_rate": 0.00041193548387096775, |
|
"loss": 0.135, |
|
"step": 3650 |
|
}, |
|
{ |
|
"epoch": 58.56, |
|
"learning_rate": 0.0004103225806451613, |
|
"loss": 0.1393, |
|
"step": 3660 |
|
}, |
|
{ |
|
"epoch": 58.72, |
|
"learning_rate": 0.0004087096774193548, |
|
"loss": 0.1414, |
|
"step": 3670 |
|
}, |
|
{ |
|
"epoch": 58.88, |
|
"learning_rate": 0.00040709677419354843, |
|
"loss": 0.1476, |
|
"step": 3680 |
|
}, |
|
{ |
|
"epoch": 58.99, |
|
"step": 3687, |
|
"train_accuracy": 0.9716738735351257, |
|
"train_f1": 0.9716109081205196, |
|
"train_loss": 0.08109210431575775, |
|
"train_precision": 0.971619589233349, |
|
"train_recall": 0.9716738735351257, |
|
"train_runtime": 251.3717, |
|
"train_samples_per_second": 63.48, |
|
"train_steps_per_second": 0.995 |
|
}, |
|
{ |
|
"epoch": 58.99, |
|
"eval_accuracy": 0.9007891770011274, |
|
"eval_f1": 0.8998310286529279, |
|
"eval_loss": 0.46749255061149597, |
|
"eval_precision": 0.9005611855026796, |
|
"eval_recall": 0.9007891770011274, |
|
"eval_runtime": 29.4648, |
|
"eval_samples_per_second": 60.207, |
|
"eval_steps_per_second": 0.95, |
|
"step": 3687 |
|
}, |
|
{ |
|
"epoch": 59.04, |
|
"learning_rate": 0.00040548387096774193, |
|
"loss": 0.1469, |
|
"step": 3690 |
|
}, |
|
{ |
|
"epoch": 59.2, |
|
"learning_rate": 0.0004038709677419355, |
|
"loss": 0.1285, |
|
"step": 3700 |
|
}, |
|
{ |
|
"epoch": 59.36, |
|
"learning_rate": 0.00040225806451612905, |
|
"loss": 0.1543, |
|
"step": 3710 |
|
}, |
|
{ |
|
"epoch": 59.52, |
|
"learning_rate": 0.00040064516129032255, |
|
"loss": 0.1576, |
|
"step": 3720 |
|
}, |
|
{ |
|
"epoch": 59.68, |
|
"learning_rate": 0.00039903225806451616, |
|
"loss": 0.1639, |
|
"step": 3730 |
|
}, |
|
{ |
|
"epoch": 59.84, |
|
"learning_rate": 0.00039741935483870967, |
|
"loss": 0.1602, |
|
"step": 3740 |
|
}, |
|
{ |
|
"epoch": 60.0, |
|
"learning_rate": 0.0003958064516129032, |
|
"loss": 0.1308, |
|
"step": 3750 |
|
}, |
|
{ |
|
"epoch": 60.0, |
|
"step": 3750, |
|
"train_accuracy": 0.9714231998495958, |
|
"train_f1": 0.9713301650863866, |
|
"train_loss": 0.08129285275936127, |
|
"train_precision": 0.9713703959271734, |
|
"train_recall": 0.9714231998495958, |
|
"train_runtime": 251.5017, |
|
"train_samples_per_second": 63.447, |
|
"train_steps_per_second": 0.994 |
|
}, |
|
{ |
|
"epoch": 60.0, |
|
"eval_accuracy": 0.9047350620067643, |
|
"eval_f1": 0.9038436882672473, |
|
"eval_loss": 0.4706019163131714, |
|
"eval_precision": 0.9044402371933982, |
|
"eval_recall": 0.9047350620067643, |
|
"eval_runtime": 30.419, |
|
"eval_samples_per_second": 58.319, |
|
"eval_steps_per_second": 0.92, |
|
"step": 3750 |
|
}, |
|
{ |
|
"epoch": 60.16, |
|
"learning_rate": 0.00039419354838709673, |
|
"loss": 0.1425, |
|
"step": 3760 |
|
}, |
|
{ |
|
"epoch": 60.32, |
|
"learning_rate": 0.00039258064516129034, |
|
"loss": 0.1372, |
|
"step": 3770 |
|
}, |
|
{ |
|
"epoch": 60.48, |
|
"learning_rate": 0.0003909677419354839, |
|
"loss": 0.1429, |
|
"step": 3780 |
|
}, |
|
{ |
|
"epoch": 60.64, |
|
"learning_rate": 0.0003893548387096774, |
|
"loss": 0.1366, |
|
"step": 3790 |
|
}, |
|
{ |
|
"epoch": 60.8, |
|
"learning_rate": 0.00038774193548387096, |
|
"loss": 0.1503, |
|
"step": 3800 |
|
}, |
|
{ |
|
"epoch": 60.96, |
|
"learning_rate": 0.0003861290322580645, |
|
"loss": 0.1558, |
|
"step": 3810 |
|
}, |
|
{ |
|
"epoch": 60.99, |
|
"step": 3812, |
|
"train_accuracy": 0.9736165945979821, |
|
"train_f1": 0.9735015663251901, |
|
"train_loss": 0.07483678311109543, |
|
"train_precision": 0.9736053164344912, |
|
"train_recall": 0.9736165945979821, |
|
"train_runtime": 250.9181, |
|
"train_samples_per_second": 63.594, |
|
"train_steps_per_second": 0.996 |
|
}, |
|
{ |
|
"epoch": 60.99, |
|
"eval_accuracy": 0.9024802705749718, |
|
"eval_f1": 0.9010669627888577, |
|
"eval_loss": 0.45878297090530396, |
|
"eval_precision": 0.9016661622070999, |
|
"eval_recall": 0.9024802705749718, |
|
"eval_runtime": 30.1022, |
|
"eval_samples_per_second": 58.933, |
|
"eval_steps_per_second": 0.93, |
|
"step": 3812 |
|
}, |
|
{ |
|
"epoch": 61.12, |
|
"learning_rate": 0.0003845161290322581, |
|
"loss": 0.1222, |
|
"step": 3820 |
|
}, |
|
{ |
|
"epoch": 61.28, |
|
"learning_rate": 0.0003829032258064516, |
|
"loss": 0.1555, |
|
"step": 3830 |
|
}, |
|
{ |
|
"epoch": 61.44, |
|
"learning_rate": 0.00038129032258064514, |
|
"loss": 0.1306, |
|
"step": 3840 |
|
}, |
|
{ |
|
"epoch": 61.6, |
|
"learning_rate": 0.00037967741935483875, |
|
"loss": 0.1618, |
|
"step": 3850 |
|
}, |
|
{ |
|
"epoch": 61.76, |
|
"learning_rate": 0.00037806451612903226, |
|
"loss": 0.1436, |
|
"step": 3860 |
|
}, |
|
{ |
|
"epoch": 61.92, |
|
"learning_rate": 0.0003764516129032258, |
|
"loss": 0.1418, |
|
"step": 3870 |
|
}, |
|
{ |
|
"epoch": 62.0, |
|
"step": 3875, |
|
"train_accuracy": 0.9729899103841574, |
|
"train_f1": 0.9729148616100128, |
|
"train_loss": 0.07707332819700241, |
|
"train_precision": 0.9730221901785945, |
|
"train_recall": 0.9729899103841574, |
|
"train_runtime": 254.0917, |
|
"train_samples_per_second": 62.8, |
|
"train_steps_per_second": 0.984 |
|
}, |
|
{ |
|
"epoch": 62.0, |
|
"eval_accuracy": 0.9013528748590756, |
|
"eval_f1": 0.9008617353869077, |
|
"eval_loss": 0.4513218104839325, |
|
"eval_precision": 0.9012600116180024, |
|
"eval_recall": 0.9013528748590756, |
|
"eval_runtime": 29.9385, |
|
"eval_samples_per_second": 59.255, |
|
"eval_steps_per_second": 0.935, |
|
"step": 3875 |
|
}, |
|
{ |
|
"epoch": 62.08, |
|
"learning_rate": 0.0003748387096774193, |
|
"loss": 0.173, |
|
"step": 3880 |
|
}, |
|
{ |
|
"epoch": 62.24, |
|
"learning_rate": 0.00037322580645161293, |
|
"loss": 0.1304, |
|
"step": 3890 |
|
}, |
|
{ |
|
"epoch": 62.4, |
|
"learning_rate": 0.0003716129032258065, |
|
"loss": 0.1579, |
|
"step": 3900 |
|
}, |
|
{ |
|
"epoch": 62.56, |
|
"learning_rate": 0.00037, |
|
"loss": 0.1388, |
|
"step": 3910 |
|
}, |
|
{ |
|
"epoch": 62.72, |
|
"learning_rate": 0.00036838709677419355, |
|
"loss": 0.152, |
|
"step": 3920 |
|
}, |
|
{ |
|
"epoch": 62.88, |
|
"learning_rate": 0.0003667741935483871, |
|
"loss": 0.1283, |
|
"step": 3930 |
|
}, |
|
{ |
|
"epoch": 62.99, |
|
"step": 3937, |
|
"train_accuracy": 0.9760606630318982, |
|
"train_f1": 0.9759960239064865, |
|
"train_loss": 0.07244587689638138, |
|
"train_precision": 0.9760629730336429, |
|
"train_recall": 0.9760606630318982, |
|
"train_runtime": 252.7156, |
|
"train_samples_per_second": 63.142, |
|
"train_steps_per_second": 0.989 |
|
}, |
|
{ |
|
"epoch": 62.99, |
|
"eval_accuracy": 0.8990980834272829, |
|
"eval_f1": 0.8976577160373229, |
|
"eval_loss": 0.46622931957244873, |
|
"eval_precision": 0.8981920636717567, |
|
"eval_recall": 0.8990980834272829, |
|
"eval_runtime": 30.0055, |
|
"eval_samples_per_second": 59.122, |
|
"eval_steps_per_second": 0.933, |
|
"step": 3937 |
|
}, |
|
{ |
|
"epoch": 63.04, |
|
"learning_rate": 0.00036516129032258067, |
|
"loss": 0.1423, |
|
"step": 3940 |
|
}, |
|
{ |
|
"epoch": 63.2, |
|
"learning_rate": 0.0003635483870967742, |
|
"loss": 0.1345, |
|
"step": 3950 |
|
}, |
|
{ |
|
"epoch": 63.36, |
|
"learning_rate": 0.00036193548387096773, |
|
"loss": 0.1225, |
|
"step": 3960 |
|
}, |
|
{ |
|
"epoch": 63.52, |
|
"learning_rate": 0.00036032258064516134, |
|
"loss": 0.1399, |
|
"step": 3970 |
|
}, |
|
{ |
|
"epoch": 63.68, |
|
"learning_rate": 0.00035870967741935485, |
|
"loss": 0.1409, |
|
"step": 3980 |
|
}, |
|
{ |
|
"epoch": 63.84, |
|
"learning_rate": 0.0003570967741935484, |
|
"loss": 0.1431, |
|
"step": 3990 |
|
}, |
|
{ |
|
"epoch": 64.0, |
|
"learning_rate": 0.0003554838709677419, |
|
"loss": 0.1375, |
|
"step": 4000 |
|
}, |
|
{ |
|
"epoch": 64.0, |
|
"step": 4000, |
|
"train_accuracy": 0.9777527104092248, |
|
"train_f1": 0.9776952189068061, |
|
"train_loss": 0.07026933133602142, |
|
"train_precision": 0.9777982624530956, |
|
"train_recall": 0.9777527104092248, |
|
"train_runtime": 254.2798, |
|
"train_samples_per_second": 62.754, |
|
"train_steps_per_second": 0.983 |
|
}, |
|
{ |
|
"epoch": 64.0, |
|
"eval_accuracy": 0.90304396843292, |
|
"eval_f1": 0.9018013838304384, |
|
"eval_loss": 0.43738722801208496, |
|
"eval_precision": 0.9018869567596777, |
|
"eval_recall": 0.90304396843292, |
|
"eval_runtime": 30.384, |
|
"eval_samples_per_second": 58.386, |
|
"eval_steps_per_second": 0.922, |
|
"step": 4000 |
|
}, |
|
{ |
|
"epoch": 64.16, |
|
"learning_rate": 0.0003538709677419355, |
|
"loss": 0.121, |
|
"step": 4010 |
|
}, |
|
{ |
|
"epoch": 64.32, |
|
"learning_rate": 0.000352258064516129, |
|
"loss": 0.1532, |
|
"step": 4020 |
|
}, |
|
{ |
|
"epoch": 64.48, |
|
"learning_rate": 0.0003506451612903226, |
|
"loss": 0.1307, |
|
"step": 4030 |
|
}, |
|
{ |
|
"epoch": 64.64, |
|
"learning_rate": 0.00034903225806451614, |
|
"loss": 0.1403, |
|
"step": 4040 |
|
}, |
|
{ |
|
"epoch": 64.8, |
|
"learning_rate": 0.0003474193548387097, |
|
"loss": 0.1467, |
|
"step": 4050 |
|
}, |
|
{ |
|
"epoch": 64.96, |
|
"learning_rate": 0.00034580645161290326, |
|
"loss": 0.1255, |
|
"step": 4060 |
|
}, |
|
{ |
|
"epoch": 64.99, |
|
"step": 4062, |
|
"train_accuracy": 0.9758099893463683, |
|
"train_f1": 0.9757450720707583, |
|
"train_loss": 0.0738762691617012, |
|
"train_precision": 0.9758253961539621, |
|
"train_recall": 0.9758099893463683, |
|
"train_runtime": 270.7799, |
|
"train_samples_per_second": 58.93, |
|
"train_steps_per_second": 0.923 |
|
}, |
|
{ |
|
"epoch": 64.99, |
|
"eval_accuracy": 0.9041713641488163, |
|
"eval_f1": 0.9027682806702938, |
|
"eval_loss": 0.43671032786369324, |
|
"eval_precision": 0.9029520225388282, |
|
"eval_recall": 0.9041713641488163, |
|
"eval_runtime": 46.2, |
|
"eval_samples_per_second": 38.398, |
|
"eval_steps_per_second": 0.606, |
|
"step": 4062 |
|
}, |
|
{ |
|
"epoch": 65.12, |
|
"learning_rate": 0.00034419354838709676, |
|
"loss": 0.1398, |
|
"step": 4070 |
|
}, |
|
{ |
|
"epoch": 65.28, |
|
"learning_rate": 0.0003425806451612903, |
|
"loss": 0.1294, |
|
"step": 4080 |
|
}, |
|
{ |
|
"epoch": 65.44, |
|
"learning_rate": 0.0003409677419354839, |
|
"loss": 0.1192, |
|
"step": 4090 |
|
}, |
|
{ |
|
"epoch": 65.6, |
|
"learning_rate": 0.00033935483870967744, |
|
"loss": 0.1274, |
|
"step": 4100 |
|
}, |
|
{ |
|
"epoch": 65.76, |
|
"learning_rate": 0.000337741935483871, |
|
"loss": 0.1332, |
|
"step": 4110 |
|
}, |
|
{ |
|
"epoch": 65.92, |
|
"learning_rate": 0.0003361290322580645, |
|
"loss": 0.1356, |
|
"step": 4120 |
|
}, |
|
{ |
|
"epoch": 66.0, |
|
"step": 4125, |
|
"train_accuracy": 0.9761233314532807, |
|
"train_f1": 0.9759950169974181, |
|
"train_loss": 0.07223277539014816, |
|
"train_precision": 0.9761999631640097, |
|
"train_recall": 0.9761233314532807, |
|
"train_runtime": 254.9857, |
|
"train_samples_per_second": 62.58, |
|
"train_steps_per_second": 0.98 |
|
}, |
|
{ |
|
"epoch": 66.0, |
|
"eval_accuracy": 0.9002254791431793, |
|
"eval_f1": 0.8985023992882097, |
|
"eval_loss": 0.47199180722236633, |
|
"eval_precision": 0.8998740225780659, |
|
"eval_recall": 0.9002254791431793, |
|
"eval_runtime": 46.4259, |
|
"eval_samples_per_second": 38.211, |
|
"eval_steps_per_second": 0.603, |
|
"step": 4125 |
|
}, |
|
{ |
|
"epoch": 66.08, |
|
"learning_rate": 0.0003345161290322581, |
|
"loss": 0.1288, |
|
"step": 4130 |
|
}, |
|
{ |
|
"epoch": 66.24, |
|
"learning_rate": 0.0003329032258064516, |
|
"loss": 0.1373, |
|
"step": 4140 |
|
}, |
|
{ |
|
"epoch": 66.4, |
|
"learning_rate": 0.0003312903225806452, |
|
"loss": 0.1424, |
|
"step": 4150 |
|
}, |
|
{ |
|
"epoch": 66.56, |
|
"learning_rate": 0.0003296774193548387, |
|
"loss": 0.1369, |
|
"step": 4160 |
|
}, |
|
{ |
|
"epoch": 66.72, |
|
"learning_rate": 0.0003280645161290323, |
|
"loss": 0.1366, |
|
"step": 4170 |
|
}, |
|
{ |
|
"epoch": 66.88, |
|
"learning_rate": 0.00032645161290322585, |
|
"loss": 0.1363, |
|
"step": 4180 |
|
}, |
|
{ |
|
"epoch": 66.99, |
|
"step": 4187, |
|
"train_accuracy": 0.9745566209187191, |
|
"train_f1": 0.9744197447101088, |
|
"train_loss": 0.07206864655017853, |
|
"train_precision": 0.9746863463745119, |
|
"train_recall": 0.9745566209187191, |
|
"train_runtime": 255.3323, |
|
"train_samples_per_second": 62.495, |
|
"train_steps_per_second": 0.979 |
|
}, |
|
{ |
|
"epoch": 66.99, |
|
"eval_accuracy": 0.8974069898534386, |
|
"eval_f1": 0.8958287812129277, |
|
"eval_loss": 0.4912644624710083, |
|
"eval_precision": 0.897064496045103, |
|
"eval_recall": 0.8974069898534386, |
|
"eval_runtime": 42.5384, |
|
"eval_samples_per_second": 41.703, |
|
"eval_steps_per_second": 0.658, |
|
"step": 4187 |
|
}, |
|
{ |
|
"epoch": 67.04, |
|
"learning_rate": 0.00032483870967741935, |
|
"loss": 0.1427, |
|
"step": 4190 |
|
}, |
|
{ |
|
"epoch": 67.2, |
|
"learning_rate": 0.0003232258064516129, |
|
"loss": 0.1423, |
|
"step": 4200 |
|
}, |
|
{ |
|
"epoch": 67.36, |
|
"learning_rate": 0.00032161290322580647, |
|
"loss": 0.1346, |
|
"step": 4210 |
|
}, |
|
{ |
|
"epoch": 67.52, |
|
"learning_rate": 0.00032, |
|
"loss": 0.1349, |
|
"step": 4220 |
|
}, |
|
{ |
|
"epoch": 67.68, |
|
"learning_rate": 0.00031838709677419353, |
|
"loss": 0.1222, |
|
"step": 4230 |
|
}, |
|
{ |
|
"epoch": 67.84, |
|
"learning_rate": 0.0003167741935483871, |
|
"loss": 0.1332, |
|
"step": 4240 |
|
}, |
|
{ |
|
"epoch": 68.0, |
|
"learning_rate": 0.0003151612903225807, |
|
"loss": 0.1307, |
|
"step": 4250 |
|
}, |
|
{ |
|
"epoch": 68.0, |
|
"step": 4250, |
|
"train_accuracy": 0.9771260261954001, |
|
"train_f1": 0.9770837683590446, |
|
"train_loss": 0.06861759722232819, |
|
"train_precision": 0.9771261688994373, |
|
"train_recall": 0.9771260261954001, |
|
"train_runtime": 258.9242, |
|
"train_samples_per_second": 61.628, |
|
"train_steps_per_second": 0.966 |
|
}, |
|
{ |
|
"epoch": 68.0, |
|
"eval_accuracy": 0.9041713641488163, |
|
"eval_f1": 0.9032565731221586, |
|
"eval_loss": 0.440946489572525, |
|
"eval_precision": 0.9031641144165843, |
|
"eval_recall": 0.9041713641488163, |
|
"eval_runtime": 39.476, |
|
"eval_samples_per_second": 44.939, |
|
"eval_steps_per_second": 0.709, |
|
"step": 4250 |
|
}, |
|
{ |
|
"epoch": 68.16, |
|
"learning_rate": 0.0003135483870967742, |
|
"loss": 0.1264, |
|
"step": 4260 |
|
}, |
|
{ |
|
"epoch": 68.32, |
|
"learning_rate": 0.00031193548387096776, |
|
"loss": 0.1441, |
|
"step": 4270 |
|
}, |
|
{ |
|
"epoch": 68.48, |
|
"learning_rate": 0.00031032258064516127, |
|
"loss": 0.127, |
|
"step": 4280 |
|
}, |
|
{ |
|
"epoch": 68.64, |
|
"learning_rate": 0.0003087096774193548, |
|
"loss": 0.1392, |
|
"step": 4290 |
|
}, |
|
{ |
|
"epoch": 68.8, |
|
"learning_rate": 0.0003070967741935484, |
|
"loss": 0.143, |
|
"step": 4300 |
|
}, |
|
{ |
|
"epoch": 68.96, |
|
"learning_rate": 0.00030548387096774194, |
|
"loss": 0.1209, |
|
"step": 4310 |
|
}, |
|
{ |
|
"epoch": 68.99, |
|
"step": 4312, |
|
"train_accuracy": 0.975621984082221, |
|
"train_f1": 0.9755696733303983, |
|
"train_loss": 0.07073085755109787, |
|
"train_precision": 0.9756366046304416, |
|
"train_recall": 0.975621984082221, |
|
"train_runtime": 256.8947, |
|
"train_samples_per_second": 62.115, |
|
"train_steps_per_second": 0.973 |
|
}, |
|
{ |
|
"epoch": 68.99, |
|
"eval_accuracy": 0.9075535512965051, |
|
"eval_f1": 0.9068001649833212, |
|
"eval_loss": 0.4593234956264496, |
|
"eval_precision": 0.9074473642395492, |
|
"eval_recall": 0.9075535512965051, |
|
"eval_runtime": 44.7864, |
|
"eval_samples_per_second": 39.61, |
|
"eval_steps_per_second": 0.625, |
|
"step": 4312 |
|
}, |
|
{ |
|
"epoch": 69.12, |
|
"learning_rate": 0.0003038709677419355, |
|
"loss": 0.1404, |
|
"step": 4320 |
|
}, |
|
{ |
|
"epoch": 69.28, |
|
"learning_rate": 0.000302258064516129, |
|
"loss": 0.1417, |
|
"step": 4330 |
|
}, |
|
{ |
|
"epoch": 69.44, |
|
"learning_rate": 0.0003006451612903226, |
|
"loss": 0.1137, |
|
"step": 4340 |
|
}, |
|
{ |
|
"epoch": 69.6, |
|
"learning_rate": 0.0002990322580645161, |
|
"loss": 0.118, |
|
"step": 4350 |
|
}, |
|
{ |
|
"epoch": 69.76, |
|
"learning_rate": 0.0002974193548387097, |
|
"loss": 0.1159, |
|
"step": 4360 |
|
}, |
|
{ |
|
"epoch": 69.92, |
|
"learning_rate": 0.0002958064516129032, |
|
"loss": 0.1463, |
|
"step": 4370 |
|
}, |
|
{ |
|
"epoch": 70.0, |
|
"step": 4375, |
|
"train_accuracy": 0.9780660525161371, |
|
"train_f1": 0.9780045954132663, |
|
"train_loss": 0.06600172072649002, |
|
"train_precision": 0.9780539223141508, |
|
"train_recall": 0.9780660525161371, |
|
"train_runtime": 257.4363, |
|
"train_samples_per_second": 61.984, |
|
"train_steps_per_second": 0.971 |
|
}, |
|
{ |
|
"epoch": 70.0, |
|
"eval_accuracy": 0.9036076662908681, |
|
"eval_f1": 0.9023949767425765, |
|
"eval_loss": 0.4772753119468689, |
|
"eval_precision": 0.9028653821326578, |
|
"eval_recall": 0.9036076662908681, |
|
"eval_runtime": 40.3083, |
|
"eval_samples_per_second": 44.011, |
|
"eval_steps_per_second": 0.695, |
|
"step": 4375 |
|
}, |
|
{ |
|
"epoch": 70.08, |
|
"learning_rate": 0.0002941935483870968, |
|
"loss": 0.1154, |
|
"step": 4380 |
|
}, |
|
{ |
|
"epoch": 70.24, |
|
"learning_rate": 0.00029258064516129035, |
|
"loss": 0.1401, |
|
"step": 4390 |
|
}, |
|
{ |
|
"epoch": 70.4, |
|
"learning_rate": 0.00029096774193548386, |
|
"loss": 0.1348, |
|
"step": 4400 |
|
}, |
|
{ |
|
"epoch": 70.56, |
|
"learning_rate": 0.0002893548387096774, |
|
"loss": 0.1333, |
|
"step": 4410 |
|
}, |
|
{ |
|
"epoch": 70.72, |
|
"learning_rate": 0.00028774193548387097, |
|
"loss": 0.1292, |
|
"step": 4420 |
|
}, |
|
{ |
|
"epoch": 70.88, |
|
"learning_rate": 0.00028612903225806453, |
|
"loss": 0.1217, |
|
"step": 4430 |
|
}, |
|
{ |
|
"epoch": 70.99, |
|
"step": 4437, |
|
"train_accuracy": 0.976562010402958, |
|
"train_f1": 0.976489238828708, |
|
"train_loss": 0.0662013366818428, |
|
"train_precision": 0.9765934380829007, |
|
"train_recall": 0.976562010402958, |
|
"train_runtime": 257.6318, |
|
"train_samples_per_second": 61.937, |
|
"train_steps_per_second": 0.97 |
|
}, |
|
{ |
|
"epoch": 70.99, |
|
"eval_accuracy": 0.9098083427282976, |
|
"eval_f1": 0.9089720394690067, |
|
"eval_loss": 0.44329407811164856, |
|
"eval_precision": 0.9092946695808038, |
|
"eval_recall": 0.9098083427282976, |
|
"eval_runtime": 34.2569, |
|
"eval_samples_per_second": 51.785, |
|
"eval_steps_per_second": 0.817, |
|
"step": 4437 |
|
}, |
|
{ |
|
"epoch": 71.04, |
|
"learning_rate": 0.0002845161290322581, |
|
"loss": 0.1271, |
|
"step": 4440 |
|
}, |
|
{ |
|
"epoch": 71.2, |
|
"learning_rate": 0.0002829032258064516, |
|
"loss": 0.1108, |
|
"step": 4450 |
|
}, |
|
{ |
|
"epoch": 71.36, |
|
"learning_rate": 0.0002812903225806452, |
|
"loss": 0.1156, |
|
"step": 4460 |
|
}, |
|
{ |
|
"epoch": 71.52, |
|
"learning_rate": 0.0002796774193548387, |
|
"loss": 0.1385, |
|
"step": 4470 |
|
}, |
|
{ |
|
"epoch": 71.68, |
|
"learning_rate": 0.00027806451612903227, |
|
"loss": 0.1333, |
|
"step": 4480 |
|
}, |
|
{ |
|
"epoch": 71.84, |
|
"learning_rate": 0.00027645161290322577, |
|
"loss": 0.107, |
|
"step": 4490 |
|
}, |
|
{ |
|
"epoch": 72.0, |
|
"learning_rate": 0.0002748387096774194, |
|
"loss": 0.1361, |
|
"step": 4500 |
|
}, |
|
{ |
|
"epoch": 72.0, |
|
"step": 4500, |
|
"train_accuracy": 0.9758726577677508, |
|
"train_f1": 0.9758377736683368, |
|
"train_loss": 0.0710226520895958, |
|
"train_precision": 0.9758628894264394, |
|
"train_recall": 0.9758726577677508, |
|
"train_runtime": 260.0539, |
|
"train_samples_per_second": 61.36, |
|
"train_steps_per_second": 0.961 |
|
}, |
|
{ |
|
"epoch": 72.0, |
|
"eval_accuracy": 0.9075535512965051, |
|
"eval_f1": 0.9071424091130842, |
|
"eval_loss": 0.43427780270576477, |
|
"eval_precision": 0.907402566021774, |
|
"eval_recall": 0.9075535512965051, |
|
"eval_runtime": 30.9428, |
|
"eval_samples_per_second": 57.332, |
|
"eval_steps_per_second": 0.905, |
|
"step": 4500 |
|
}, |
|
{ |
|
"epoch": 72.16, |
|
"learning_rate": 0.00027322580645161294, |
|
"loss": 0.1166, |
|
"step": 4510 |
|
}, |
|
{ |
|
"epoch": 72.32, |
|
"learning_rate": 0.00027161290322580645, |
|
"loss": 0.1422, |
|
"step": 4520 |
|
}, |
|
{ |
|
"epoch": 72.48, |
|
"learning_rate": 0.00027, |
|
"loss": 0.1253, |
|
"step": 4530 |
|
}, |
|
{ |
|
"epoch": 72.64, |
|
"learning_rate": 0.00026838709677419356, |
|
"loss": 0.1287, |
|
"step": 4540 |
|
}, |
|
{ |
|
"epoch": 72.8, |
|
"learning_rate": 0.0002667741935483871, |
|
"loss": 0.1257, |
|
"step": 4550 |
|
}, |
|
{ |
|
"epoch": 72.96, |
|
"learning_rate": 0.0002651612903225806, |
|
"loss": 0.1164, |
|
"step": 4560 |
|
}, |
|
{ |
|
"epoch": 72.99, |
|
"step": 4562, |
|
"train_accuracy": 0.9780660525161371, |
|
"train_f1": 0.9780243494069962, |
|
"train_loss": 0.0632663145661354, |
|
"train_precision": 0.978042686088855, |
|
"train_recall": 0.9780660525161371, |
|
"train_runtime": 253.9785, |
|
"train_samples_per_second": 62.828, |
|
"train_steps_per_second": 0.984 |
|
}, |
|
{ |
|
"epoch": 72.99, |
|
"eval_accuracy": 0.9013528748590756, |
|
"eval_f1": 0.90025705081473, |
|
"eval_loss": 0.4536808431148529, |
|
"eval_precision": 0.9003205156911865, |
|
"eval_recall": 0.9013528748590756, |
|
"eval_runtime": 30.6887, |
|
"eval_samples_per_second": 57.806, |
|
"eval_steps_per_second": 0.912, |
|
"step": 4562 |
|
}, |
|
{ |
|
"epoch": 73.12, |
|
"learning_rate": 0.0002635483870967742, |
|
"loss": 0.1255, |
|
"step": 4570 |
|
}, |
|
{ |
|
"epoch": 73.28, |
|
"learning_rate": 0.0002619354838709678, |
|
"loss": 0.1278, |
|
"step": 4580 |
|
}, |
|
{ |
|
"epoch": 73.44, |
|
"learning_rate": 0.0002603225806451613, |
|
"loss": 0.1296, |
|
"step": 4590 |
|
}, |
|
{ |
|
"epoch": 73.6, |
|
"learning_rate": 0.00025870967741935486, |
|
"loss": 0.1337, |
|
"step": 4600 |
|
}, |
|
{ |
|
"epoch": 73.76, |
|
"learning_rate": 0.00025709677419354836, |
|
"loss": 0.1215, |
|
"step": 4610 |
|
}, |
|
{ |
|
"epoch": 73.92, |
|
"learning_rate": 0.00025548387096774197, |
|
"loss": 0.1313, |
|
"step": 4620 |
|
}, |
|
{ |
|
"epoch": 74.0, |
|
"step": 4625, |
|
"train_accuracy": 0.9766246788243405, |
|
"train_f1": 0.9765319317829301, |
|
"train_loss": 0.06763936579227448, |
|
"train_precision": 0.976670123477298, |
|
"train_recall": 0.9766246788243405, |
|
"train_runtime": 252.1633, |
|
"train_samples_per_second": 63.28, |
|
"train_steps_per_second": 0.991 |
|
}, |
|
{ |
|
"epoch": 74.0, |
|
"eval_accuracy": 0.90304396843292, |
|
"eval_f1": 0.9020628517400072, |
|
"eval_loss": 0.44354888796806335, |
|
"eval_precision": 0.9022087129927616, |
|
"eval_recall": 0.90304396843292, |
|
"eval_runtime": 29.2384, |
|
"eval_samples_per_second": 60.674, |
|
"eval_steps_per_second": 0.958, |
|
"step": 4625 |
|
}, |
|
{ |
|
"epoch": 74.08, |
|
"learning_rate": 0.0002538709677419355, |
|
"loss": 0.1295, |
|
"step": 4630 |
|
}, |
|
{ |
|
"epoch": 74.24, |
|
"learning_rate": 0.00025225806451612903, |
|
"loss": 0.1257, |
|
"step": 4640 |
|
}, |
|
{ |
|
"epoch": 74.4, |
|
"learning_rate": 0.0002506451612903226, |
|
"loss": 0.1009, |
|
"step": 4650 |
|
}, |
|
{ |
|
"epoch": 74.56, |
|
"learning_rate": 0.00024903225806451615, |
|
"loss": 0.1254, |
|
"step": 4660 |
|
}, |
|
{ |
|
"epoch": 74.72, |
|
"learning_rate": 0.00024741935483870965, |
|
"loss": 0.1291, |
|
"step": 4670 |
|
}, |
|
{ |
|
"epoch": 74.88, |
|
"learning_rate": 0.00024580645161290327, |
|
"loss": 0.1291, |
|
"step": 4680 |
|
}, |
|
{ |
|
"epoch": 74.99, |
|
"step": 4687, |
|
"train_accuracy": 0.97737669988093, |
|
"train_f1": 0.9773174710084362, |
|
"train_loss": 0.06480351090431213, |
|
"train_precision": 0.9773832839286731, |
|
"train_recall": 0.97737669988093, |
|
"train_runtime": 266.3469, |
|
"train_samples_per_second": 59.911, |
|
"train_steps_per_second": 0.939 |
|
}, |
|
{ |
|
"epoch": 74.99, |
|
"eval_accuracy": 0.9052987598647125, |
|
"eval_f1": 0.9045329930179677, |
|
"eval_loss": 0.44802290201187134, |
|
"eval_precision": 0.9044815010640291, |
|
"eval_recall": 0.9052987598647125, |
|
"eval_runtime": 46.7594, |
|
"eval_samples_per_second": 37.939, |
|
"eval_steps_per_second": 0.599, |
|
"step": 4687 |
|
}, |
|
{ |
|
"epoch": 75.04, |
|
"learning_rate": 0.00024419354838709677, |
|
"loss": 0.1316, |
|
"step": 4690 |
|
}, |
|
{ |
|
"epoch": 75.2, |
|
"learning_rate": 0.00024258064516129033, |
|
"loss": 0.1315, |
|
"step": 4700 |
|
}, |
|
{ |
|
"epoch": 75.36, |
|
"learning_rate": 0.0002409677419354839, |
|
"loss": 0.11, |
|
"step": 4710 |
|
}, |
|
{ |
|
"epoch": 75.52, |
|
"learning_rate": 0.00023935483870967742, |
|
"loss": 0.1253, |
|
"step": 4720 |
|
}, |
|
{ |
|
"epoch": 75.68, |
|
"learning_rate": 0.00023774193548387098, |
|
"loss": 0.1193, |
|
"step": 4730 |
|
}, |
|
{ |
|
"epoch": 75.84, |
|
"learning_rate": 0.0002361290322580645, |
|
"loss": 0.1122, |
|
"step": 4740 |
|
}, |
|
{ |
|
"epoch": 76.0, |
|
"learning_rate": 0.0002345161290322581, |
|
"loss": 0.132, |
|
"step": 4750 |
|
}, |
|
{ |
|
"epoch": 76.0, |
|
"step": 4750, |
|
"train_accuracy": 0.9790060788368741, |
|
"train_f1": 0.9789581823313721, |
|
"train_loss": 0.060503240674734116, |
|
"train_precision": 0.9790325316940118, |
|
"train_recall": 0.9790060788368741, |
|
"train_runtime": 258.2855, |
|
"train_samples_per_second": 61.78, |
|
"train_steps_per_second": 0.968 |
|
}, |
|
{ |
|
"epoch": 76.0, |
|
"eval_accuracy": 0.9058624577226606, |
|
"eval_f1": 0.904482480434317, |
|
"eval_loss": 0.46171513199806213, |
|
"eval_precision": 0.9050040535484158, |
|
"eval_recall": 0.9058624577226606, |
|
"eval_runtime": 42.9199, |
|
"eval_samples_per_second": 41.333, |
|
"eval_steps_per_second": 0.652, |
|
"step": 4750 |
|
}, |
|
{ |
|
"epoch": 76.16, |
|
"learning_rate": 0.00023290322580645162, |
|
"loss": 0.1141, |
|
"step": 4760 |
|
}, |
|
{ |
|
"epoch": 76.32, |
|
"learning_rate": 0.00023129032258064516, |
|
"loss": 0.111, |
|
"step": 4770 |
|
}, |
|
{ |
|
"epoch": 76.48, |
|
"learning_rate": 0.0002296774193548387, |
|
"loss": 0.1362, |
|
"step": 4780 |
|
}, |
|
{ |
|
"epoch": 76.64, |
|
"learning_rate": 0.00022806451612903224, |
|
"loss": 0.1303, |
|
"step": 4790 |
|
}, |
|
{ |
|
"epoch": 76.8, |
|
"learning_rate": 0.0002264516129032258, |
|
"loss": 0.1128, |
|
"step": 4800 |
|
}, |
|
{ |
|
"epoch": 76.96, |
|
"learning_rate": 0.00022483870967741936, |
|
"loss": 0.1197, |
|
"step": 4810 |
|
}, |
|
{ |
|
"epoch": 76.99, |
|
"step": 4812, |
|
"train_accuracy": 0.9780033840947546, |
|
"train_f1": 0.9779246149243382, |
|
"train_loss": 0.06653548032045364, |
|
"train_precision": 0.9780194906548296, |
|
"train_recall": 0.9780033840947546, |
|
"train_runtime": 255.9446, |
|
"train_samples_per_second": 62.346, |
|
"train_steps_per_second": 0.977 |
|
}, |
|
{ |
|
"epoch": 76.99, |
|
"eval_accuracy": 0.9058624577226606, |
|
"eval_f1": 0.904136777153852, |
|
"eval_loss": 0.45922645926475525, |
|
"eval_precision": 0.9042117586049208, |
|
"eval_recall": 0.9058624577226606, |
|
"eval_runtime": 37.615, |
|
"eval_samples_per_second": 47.162, |
|
"eval_steps_per_second": 0.744, |
|
"step": 4812 |
|
}, |
|
{ |
|
"epoch": 77.12, |
|
"learning_rate": 0.00022322580645161292, |
|
"loss": 0.1185, |
|
"step": 4820 |
|
}, |
|
{ |
|
"epoch": 77.28, |
|
"learning_rate": 0.00022161290322580645, |
|
"loss": 0.1297, |
|
"step": 4830 |
|
}, |
|
{ |
|
"epoch": 77.44, |
|
"learning_rate": 0.00022, |
|
"loss": 0.1167, |
|
"step": 4840 |
|
}, |
|
{ |
|
"epoch": 77.6, |
|
"learning_rate": 0.00021838709677419354, |
|
"loss": 0.1185, |
|
"step": 4850 |
|
}, |
|
{ |
|
"epoch": 77.76, |
|
"learning_rate": 0.0002167741935483871, |
|
"loss": 0.1095, |
|
"step": 4860 |
|
}, |
|
{ |
|
"epoch": 77.92, |
|
"learning_rate": 0.00021516129032258063, |
|
"loss": 0.1199, |
|
"step": 4870 |
|
}, |
|
{ |
|
"epoch": 78.0, |
|
"step": 4875, |
|
"train_accuracy": 0.9789434104154916, |
|
"train_f1": 0.9789055395945256, |
|
"train_loss": 0.06331050395965576, |
|
"train_precision": 0.9789060427186901, |
|
"train_recall": 0.9789434104154916, |
|
"train_runtime": 255.8602, |
|
"train_samples_per_second": 62.366, |
|
"train_steps_per_second": 0.977 |
|
}, |
|
{ |
|
"epoch": 78.0, |
|
"eval_accuracy": 0.9160090191657272, |
|
"eval_f1": 0.9156304372279399, |
|
"eval_loss": 0.4329167902469635, |
|
"eval_precision": 0.9156707582414666, |
|
"eval_recall": 0.9160090191657272, |
|
"eval_runtime": 36.868, |
|
"eval_samples_per_second": 48.118, |
|
"eval_steps_per_second": 0.759, |
|
"step": 4875 |
|
}, |
|
{ |
|
"epoch": 78.08, |
|
"learning_rate": 0.0002135483870967742, |
|
"loss": 0.1098, |
|
"step": 4880 |
|
}, |
|
{ |
|
"epoch": 78.24, |
|
"learning_rate": 0.00021193548387096774, |
|
"loss": 0.1134, |
|
"step": 4890 |
|
}, |
|
{ |
|
"epoch": 78.4, |
|
"learning_rate": 0.0002103225806451613, |
|
"loss": 0.1103, |
|
"step": 4900 |
|
}, |
|
{ |
|
"epoch": 78.56, |
|
"learning_rate": 0.00020870967741935483, |
|
"loss": 0.1266, |
|
"step": 4910 |
|
}, |
|
{ |
|
"epoch": 78.72, |
|
"learning_rate": 0.0002070967741935484, |
|
"loss": 0.1083, |
|
"step": 4920 |
|
}, |
|
{ |
|
"epoch": 78.88, |
|
"learning_rate": 0.00020548387096774192, |
|
"loss": 0.124, |
|
"step": 4930 |
|
}, |
|
{ |
|
"epoch": 78.99, |
|
"step": 4937, |
|
"train_accuracy": 0.978191389358902, |
|
"train_f1": 0.9781684943478942, |
|
"train_loss": 0.06074240058660507, |
|
"train_precision": 0.9782183084448501, |
|
"train_recall": 0.978191389358902, |
|
"train_runtime": 255.7407, |
|
"train_samples_per_second": 62.395, |
|
"train_steps_per_second": 0.978 |
|
}, |
|
{ |
|
"epoch": 78.99, |
|
"eval_accuracy": 0.9148816234498309, |
|
"eval_f1": 0.914220821168919, |
|
"eval_loss": 0.4336497485637665, |
|
"eval_precision": 0.9142236947687447, |
|
"eval_recall": 0.9148816234498309, |
|
"eval_runtime": 31.4364, |
|
"eval_samples_per_second": 56.431, |
|
"eval_steps_per_second": 0.891, |
|
"step": 4937 |
|
}, |
|
{ |
|
"epoch": 79.04, |
|
"learning_rate": 0.00020387096774193548, |
|
"loss": 0.13, |
|
"step": 4940 |
|
}, |
|
{ |
|
"epoch": 79.2, |
|
"learning_rate": 0.00020225806451612904, |
|
"loss": 0.1212, |
|
"step": 4950 |
|
}, |
|
{ |
|
"epoch": 79.36, |
|
"learning_rate": 0.0002006451612903226, |
|
"loss": 0.0928, |
|
"step": 4960 |
|
}, |
|
{ |
|
"epoch": 79.52, |
|
"learning_rate": 0.00019903225806451613, |
|
"loss": 0.1227, |
|
"step": 4970 |
|
}, |
|
{ |
|
"epoch": 79.68, |
|
"learning_rate": 0.00019741935483870969, |
|
"loss": 0.1283, |
|
"step": 4980 |
|
}, |
|
{ |
|
"epoch": 79.84, |
|
"learning_rate": 0.00019580645161290322, |
|
"loss": 0.1174, |
|
"step": 4990 |
|
}, |
|
{ |
|
"epoch": 80.0, |
|
"learning_rate": 0.00019419354838709678, |
|
"loss": 0.118, |
|
"step": 5000 |
|
}, |
|
{ |
|
"epoch": 80.0, |
|
"step": 5000, |
|
"train_accuracy": 0.9766246788243405, |
|
"train_f1": 0.9765541131510495, |
|
"train_loss": 0.0666293278336525, |
|
"train_precision": 0.9766229850859756, |
|
"train_recall": 0.9766246788243405, |
|
"train_runtime": 259.1008, |
|
"train_samples_per_second": 61.586, |
|
"train_steps_per_second": 0.965 |
|
}, |
|
{ |
|
"epoch": 80.0, |
|
"eval_accuracy": 0.9086809470124013, |
|
"eval_f1": 0.90750875812957, |
|
"eval_loss": 0.45560184121131897, |
|
"eval_precision": 0.9079785564126395, |
|
"eval_recall": 0.9086809470124013, |
|
"eval_runtime": 31.9115, |
|
"eval_samples_per_second": 55.591, |
|
"eval_steps_per_second": 0.877, |
|
"step": 5000 |
|
}, |
|
{ |
|
"epoch": 80.16, |
|
"learning_rate": 0.0001925806451612903, |
|
"loss": 0.0913, |
|
"step": 5010 |
|
}, |
|
{ |
|
"epoch": 80.32, |
|
"learning_rate": 0.0001909677419354839, |
|
"loss": 0.124, |
|
"step": 5020 |
|
}, |
|
{ |
|
"epoch": 80.48, |
|
"learning_rate": 0.00018935483870967742, |
|
"loss": 0.1009, |
|
"step": 5030 |
|
}, |
|
{ |
|
"epoch": 80.64, |
|
"learning_rate": 0.00018774193548387098, |
|
"loss": 0.1101, |
|
"step": 5040 |
|
}, |
|
{ |
|
"epoch": 80.8, |
|
"learning_rate": 0.0001861290322580645, |
|
"loss": 0.1066, |
|
"step": 5050 |
|
}, |
|
{ |
|
"epoch": 80.96, |
|
"learning_rate": 0.00018451612903225807, |
|
"loss": 0.1135, |
|
"step": 5060 |
|
}, |
|
{ |
|
"epoch": 80.99, |
|
"step": 5062, |
|
"train_accuracy": 0.9778153788306072, |
|
"train_f1": 0.9777754434919425, |
|
"train_loss": 0.0617908276617527, |
|
"train_precision": 0.9778452684709104, |
|
"train_recall": 0.9778153788306072, |
|
"train_runtime": 256.2036, |
|
"train_samples_per_second": 62.282, |
|
"train_steps_per_second": 0.976 |
|
}, |
|
{ |
|
"epoch": 80.99, |
|
"eval_accuracy": 0.9098083427282976, |
|
"eval_f1": 0.9089912962963755, |
|
"eval_loss": 0.4518835246562958, |
|
"eval_precision": 0.9089474065575852, |
|
"eval_recall": 0.9098083427282976, |
|
"eval_runtime": 30.3175, |
|
"eval_samples_per_second": 58.514, |
|
"eval_steps_per_second": 0.924, |
|
"step": 5062 |
|
}, |
|
{ |
|
"epoch": 81.12, |
|
"learning_rate": 0.0001829032258064516, |
|
"loss": 0.1126, |
|
"step": 5070 |
|
}, |
|
{ |
|
"epoch": 81.28, |
|
"learning_rate": 0.0001812903225806452, |
|
"loss": 0.1193, |
|
"step": 5080 |
|
}, |
|
{ |
|
"epoch": 81.44, |
|
"learning_rate": 0.00017967741935483872, |
|
"loss": 0.1, |
|
"step": 5090 |
|
}, |
|
{ |
|
"epoch": 81.6, |
|
"learning_rate": 0.00017806451612903228, |
|
"loss": 0.1133, |
|
"step": 5100 |
|
}, |
|
{ |
|
"epoch": 81.76, |
|
"learning_rate": 0.0001764516129032258, |
|
"loss": 0.1108, |
|
"step": 5110 |
|
}, |
|
{ |
|
"epoch": 81.92, |
|
"learning_rate": 0.00017483870967741936, |
|
"loss": 0.1047, |
|
"step": 5120 |
|
}, |
|
{ |
|
"epoch": 82.0, |
|
"step": 5125, |
|
"train_accuracy": 0.9804474525286708, |
|
"train_f1": 0.9803932668866718, |
|
"train_loss": 0.05864088237285614, |
|
"train_precision": 0.9804524158920493, |
|
"train_recall": 0.9804474525286708, |
|
"train_runtime": 255.5222, |
|
"train_samples_per_second": 62.449, |
|
"train_steps_per_second": 0.978 |
|
}, |
|
{ |
|
"epoch": 82.0, |
|
"eval_accuracy": 0.9086809470124013, |
|
"eval_f1": 0.9077573719855858, |
|
"eval_loss": 0.46281760931015015, |
|
"eval_precision": 0.9078136987288633, |
|
"eval_recall": 0.9086809470124013, |
|
"eval_runtime": 29.6004, |
|
"eval_samples_per_second": 59.932, |
|
"eval_steps_per_second": 0.946, |
|
"step": 5125 |
|
}, |
|
{ |
|
"epoch": 82.08, |
|
"learning_rate": 0.0001732258064516129, |
|
"loss": 0.1049, |
|
"step": 5130 |
|
}, |
|
{ |
|
"epoch": 82.24, |
|
"learning_rate": 0.00017161290322580645, |
|
"loss": 0.1198, |
|
"step": 5140 |
|
}, |
|
{ |
|
"epoch": 82.4, |
|
"learning_rate": 0.00017, |
|
"loss": 0.1013, |
|
"step": 5150 |
|
}, |
|
{ |
|
"epoch": 82.56, |
|
"learning_rate": 0.00016838709677419357, |
|
"loss": 0.1196, |
|
"step": 5160 |
|
}, |
|
{ |
|
"epoch": 82.72, |
|
"learning_rate": 0.0001667741935483871, |
|
"loss": 0.1076, |
|
"step": 5170 |
|
}, |
|
{ |
|
"epoch": 82.88, |
|
"learning_rate": 0.00016516129032258066, |
|
"loss": 0.0977, |
|
"step": 5180 |
|
}, |
|
{ |
|
"epoch": 82.99, |
|
"step": 5187, |
|
"train_accuracy": 0.9785047314658144, |
|
"train_f1": 0.9784666340134569, |
|
"train_loss": 0.061825916171073914, |
|
"train_precision": 0.9784978840692157, |
|
"train_recall": 0.9785047314658144, |
|
"train_runtime": 254.0139, |
|
"train_samples_per_second": 62.819, |
|
"train_steps_per_second": 0.984 |
|
}, |
|
{ |
|
"epoch": 82.99, |
|
"eval_accuracy": 0.9098083427282976, |
|
"eval_f1": 0.9089103848523707, |
|
"eval_loss": 0.4576462209224701, |
|
"eval_precision": 0.9088881743285697, |
|
"eval_recall": 0.9098083427282976, |
|
"eval_runtime": 29.6463, |
|
"eval_samples_per_second": 59.839, |
|
"eval_steps_per_second": 0.944, |
|
"step": 5187 |
|
}, |
|
{ |
|
"epoch": 83.04, |
|
"learning_rate": 0.0001635483870967742, |
|
"loss": 0.0983, |
|
"step": 5190 |
|
}, |
|
{ |
|
"epoch": 83.2, |
|
"learning_rate": 0.00016193548387096775, |
|
"loss": 0.1126, |
|
"step": 5200 |
|
}, |
|
{ |
|
"epoch": 83.36, |
|
"learning_rate": 0.00016032258064516128, |
|
"loss": 0.1362, |
|
"step": 5210 |
|
}, |
|
{ |
|
"epoch": 83.52, |
|
"learning_rate": 0.00015870967741935487, |
|
"loss": 0.1073, |
|
"step": 5220 |
|
}, |
|
{ |
|
"epoch": 83.68, |
|
"learning_rate": 0.0001570967741935484, |
|
"loss": 0.111, |
|
"step": 5230 |
|
}, |
|
{ |
|
"epoch": 83.84, |
|
"learning_rate": 0.00015548387096774195, |
|
"loss": 0.1125, |
|
"step": 5240 |
|
}, |
|
{ |
|
"epoch": 84.0, |
|
"learning_rate": 0.00015387096774193549, |
|
"loss": 0.1149, |
|
"step": 5250 |
|
}, |
|
{ |
|
"epoch": 84.0, |
|
"step": 5250, |
|
"train_accuracy": 0.980886131478348, |
|
"train_f1": 0.9808510090193131, |
|
"train_loss": 0.05500573664903641, |
|
"train_precision": 0.9808883134493344, |
|
"train_recall": 0.980886131478348, |
|
"train_runtime": 260.1325, |
|
"train_samples_per_second": 61.342, |
|
"train_steps_per_second": 0.961 |
|
}, |
|
{ |
|
"epoch": 84.0, |
|
"eval_accuracy": 0.9120631341600902, |
|
"eval_f1": 0.911138462348306, |
|
"eval_loss": 0.4605374038219452, |
|
"eval_precision": 0.9110930924781012, |
|
"eval_recall": 0.9120631341600902, |
|
"eval_runtime": 29.9251, |
|
"eval_samples_per_second": 59.281, |
|
"eval_steps_per_second": 0.936, |
|
"step": 5250 |
|
}, |
|
{ |
|
"epoch": 84.16, |
|
"learning_rate": 0.00015225806451612904, |
|
"loss": 0.0955, |
|
"step": 5260 |
|
}, |
|
{ |
|
"epoch": 84.32, |
|
"learning_rate": 0.00015064516129032257, |
|
"loss": 0.1187, |
|
"step": 5270 |
|
}, |
|
{ |
|
"epoch": 84.48, |
|
"learning_rate": 0.0001490322580645161, |
|
"loss": 0.1101, |
|
"step": 5280 |
|
}, |
|
{ |
|
"epoch": 84.64, |
|
"learning_rate": 0.0001474193548387097, |
|
"loss": 0.106, |
|
"step": 5290 |
|
}, |
|
{ |
|
"epoch": 84.8, |
|
"learning_rate": 0.00014580645161290322, |
|
"loss": 0.099, |
|
"step": 5300 |
|
}, |
|
{ |
|
"epoch": 84.96, |
|
"learning_rate": 0.00014419354838709678, |
|
"loss": 0.1241, |
|
"step": 5310 |
|
}, |
|
{ |
|
"epoch": 84.99, |
|
"step": 5312, |
|
"train_accuracy": 0.9786927367299618, |
|
"train_f1": 0.9786376256812076, |
|
"train_loss": 0.0632563978433609, |
|
"train_precision": 0.9786888233858622, |
|
"train_recall": 0.9786927367299618, |
|
"train_runtime": 253.1029, |
|
"train_samples_per_second": 63.046, |
|
"train_steps_per_second": 0.988 |
|
}, |
|
{ |
|
"epoch": 84.99, |
|
"eval_accuracy": 0.9131905298759865, |
|
"eval_f1": 0.9126492909049198, |
|
"eval_loss": 0.4541684687137604, |
|
"eval_precision": 0.9125019654104216, |
|
"eval_recall": 0.9131905298759865, |
|
"eval_runtime": 36.7528, |
|
"eval_samples_per_second": 48.268, |
|
"eval_steps_per_second": 0.762, |
|
"step": 5312 |
|
}, |
|
{ |
|
"epoch": 85.12, |
|
"learning_rate": 0.0001425806451612903, |
|
"loss": 0.1174, |
|
"step": 5320 |
|
}, |
|
{ |
|
"epoch": 85.28, |
|
"learning_rate": 0.00014096774193548387, |
|
"loss": 0.1129, |
|
"step": 5330 |
|
}, |
|
{ |
|
"epoch": 85.44, |
|
"learning_rate": 0.0001393548387096774, |
|
"loss": 0.0965, |
|
"step": 5340 |
|
}, |
|
{ |
|
"epoch": 85.6, |
|
"learning_rate": 0.00013774193548387099, |
|
"loss": 0.0996, |
|
"step": 5350 |
|
}, |
|
{ |
|
"epoch": 85.76, |
|
"learning_rate": 0.00013612903225806452, |
|
"loss": 0.1188, |
|
"step": 5360 |
|
}, |
|
{ |
|
"epoch": 85.92, |
|
"learning_rate": 0.00013451612903225807, |
|
"loss": 0.1262, |
|
"step": 5370 |
|
}, |
|
{ |
|
"epoch": 86.0, |
|
"step": 5375, |
|
"train_accuracy": 0.9786927367299618, |
|
"train_f1": 0.9786430332999637, |
|
"train_loss": 0.06230182945728302, |
|
"train_precision": 0.9787228334576183, |
|
"train_recall": 0.9786927367299618, |
|
"train_runtime": 254.0805, |
|
"train_samples_per_second": 62.803, |
|
"train_steps_per_second": 0.984 |
|
}, |
|
{ |
|
"epoch": 86.0, |
|
"eval_accuracy": 0.9081172491544532, |
|
"eval_f1": 0.9073973897547527, |
|
"eval_loss": 0.45515382289886475, |
|
"eval_precision": 0.9074033025441, |
|
"eval_recall": 0.9081172491544532, |
|
"eval_runtime": 29.4676, |
|
"eval_samples_per_second": 60.202, |
|
"eval_steps_per_second": 0.95, |
|
"step": 5375 |
|
}, |
|
{ |
|
"epoch": 86.08, |
|
"learning_rate": 0.0001329032258064516, |
|
"loss": 0.1058, |
|
"step": 5380 |
|
}, |
|
{ |
|
"epoch": 86.24, |
|
"learning_rate": 0.00013129032258064516, |
|
"loss": 0.1131, |
|
"step": 5390 |
|
}, |
|
{ |
|
"epoch": 86.4, |
|
"learning_rate": 0.0001296774193548387, |
|
"loss": 0.1009, |
|
"step": 5400 |
|
}, |
|
{ |
|
"epoch": 86.56, |
|
"learning_rate": 0.00012806451612903225, |
|
"loss": 0.1047, |
|
"step": 5410 |
|
}, |
|
{ |
|
"epoch": 86.72, |
|
"learning_rate": 0.0001264516129032258, |
|
"loss": 0.1055, |
|
"step": 5420 |
|
}, |
|
{ |
|
"epoch": 86.88, |
|
"learning_rate": 0.00012483870967741934, |
|
"loss": 0.1114, |
|
"step": 5430 |
|
}, |
|
{ |
|
"epoch": 86.99, |
|
"step": 5437, |
|
"train_accuracy": 0.9789434104154916, |
|
"train_f1": 0.9788727186488501, |
|
"train_loss": 0.05873732641339302, |
|
"train_precision": 0.9789898516890257, |
|
"train_recall": 0.9789434104154916, |
|
"train_runtime": 252.3787, |
|
"train_samples_per_second": 63.226, |
|
"train_steps_per_second": 0.991 |
|
}, |
|
{ |
|
"epoch": 86.99, |
|
"eval_accuracy": 0.9081172491544532, |
|
"eval_f1": 0.907050844291005, |
|
"eval_loss": 0.46865400671958923, |
|
"eval_precision": 0.9071698989671065, |
|
"eval_recall": 0.9081172491544532, |
|
"eval_runtime": 29.1201, |
|
"eval_samples_per_second": 60.92, |
|
"eval_steps_per_second": 0.962, |
|
"step": 5437 |
|
}, |
|
{ |
|
"epoch": 87.04, |
|
"learning_rate": 0.0001232258064516129, |
|
"loss": 0.0953, |
|
"step": 5440 |
|
}, |
|
{ |
|
"epoch": 87.2, |
|
"learning_rate": 0.00012161290322580646, |
|
"loss": 0.0895, |
|
"step": 5450 |
|
}, |
|
{ |
|
"epoch": 87.36, |
|
"learning_rate": 0.00012, |
|
"loss": 0.1122, |
|
"step": 5460 |
|
}, |
|
{ |
|
"epoch": 87.52, |
|
"learning_rate": 0.00011838709677419356, |
|
"loss": 0.1169, |
|
"step": 5470 |
|
}, |
|
{ |
|
"epoch": 87.68, |
|
"learning_rate": 0.0001167741935483871, |
|
"loss": 0.1031, |
|
"step": 5480 |
|
}, |
|
{ |
|
"epoch": 87.84, |
|
"learning_rate": 0.00011516129032258065, |
|
"loss": 0.1052, |
|
"step": 5490 |
|
}, |
|
{ |
|
"epoch": 88.0, |
|
"learning_rate": 0.00011354838709677421, |
|
"loss": 0.0835, |
|
"step": 5500 |
|
}, |
|
{ |
|
"epoch": 88.0, |
|
"step": 5500, |
|
"train_accuracy": 0.9811994735852604, |
|
"train_f1": 0.9811537862655559, |
|
"train_loss": 0.05588332563638687, |
|
"train_precision": 0.9812213014473542, |
|
"train_recall": 0.9811994735852604, |
|
"train_runtime": 251.2614, |
|
"train_samples_per_second": 63.508, |
|
"train_steps_per_second": 0.995 |
|
}, |
|
{ |
|
"epoch": 88.0, |
|
"eval_accuracy": 0.9098083427282976, |
|
"eval_f1": 0.908811337868185, |
|
"eval_loss": 0.4702069163322449, |
|
"eval_precision": 0.9089224577124531, |
|
"eval_recall": 0.9098083427282976, |
|
"eval_runtime": 29.3425, |
|
"eval_samples_per_second": 60.458, |
|
"eval_steps_per_second": 0.954, |
|
"step": 5500 |
|
}, |
|
{ |
|
"epoch": 88.16, |
|
"learning_rate": 0.00011193548387096775, |
|
"loss": 0.1158, |
|
"step": 5510 |
|
}, |
|
{ |
|
"epoch": 88.32, |
|
"learning_rate": 0.0001103225806451613, |
|
"loss": 0.1029, |
|
"step": 5520 |
|
}, |
|
{ |
|
"epoch": 88.48, |
|
"learning_rate": 0.00010870967741935483, |
|
"loss": 0.0978, |
|
"step": 5530 |
|
}, |
|
{ |
|
"epoch": 88.64, |
|
"learning_rate": 0.00010709677419354839, |
|
"loss": 0.1028, |
|
"step": 5540 |
|
}, |
|
{ |
|
"epoch": 88.8, |
|
"learning_rate": 0.00010548387096774193, |
|
"loss": 0.1053, |
|
"step": 5550 |
|
}, |
|
{ |
|
"epoch": 88.96, |
|
"learning_rate": 0.00010387096774193548, |
|
"loss": 0.1174, |
|
"step": 5560 |
|
}, |
|
{ |
|
"epoch": 88.99, |
|
"step": 5562, |
|
"train_accuracy": 0.9806981262142007, |
|
"train_f1": 0.980651790063678, |
|
"train_loss": 0.05491610988974571, |
|
"train_precision": 0.9806996834447476, |
|
"train_recall": 0.9806981262142007, |
|
"train_runtime": 252.31, |
|
"train_samples_per_second": 63.244, |
|
"train_steps_per_second": 0.991 |
|
}, |
|
{ |
|
"epoch": 88.99, |
|
"eval_accuracy": 0.9058624577226606, |
|
"eval_f1": 0.9047448567468519, |
|
"eval_loss": 0.4772195518016815, |
|
"eval_precision": 0.9049010825589036, |
|
"eval_recall": 0.9058624577226606, |
|
"eval_runtime": 29.443, |
|
"eval_samples_per_second": 60.252, |
|
"eval_steps_per_second": 0.951, |
|
"step": 5562 |
|
}, |
|
{ |
|
"epoch": 89.12, |
|
"learning_rate": 0.00010225806451612903, |
|
"loss": 0.1106, |
|
"step": 5570 |
|
}, |
|
{ |
|
"epoch": 89.28, |
|
"learning_rate": 0.00010064516129032258, |
|
"loss": 0.0965, |
|
"step": 5580 |
|
}, |
|
{ |
|
"epoch": 89.44, |
|
"learning_rate": 9.903225806451612e-05, |
|
"loss": 0.1145, |
|
"step": 5590 |
|
}, |
|
{ |
|
"epoch": 89.6, |
|
"learning_rate": 9.741935483870967e-05, |
|
"loss": 0.1069, |
|
"step": 5600 |
|
}, |
|
{ |
|
"epoch": 89.76, |
|
"learning_rate": 9.580645161290323e-05, |
|
"loss": 0.1008, |
|
"step": 5610 |
|
}, |
|
{ |
|
"epoch": 89.92, |
|
"learning_rate": 9.419354838709677e-05, |
|
"loss": 0.103, |
|
"step": 5620 |
|
}, |
|
{ |
|
"epoch": 90.0, |
|
"step": 5625, |
|
"train_accuracy": 0.9815754841135552, |
|
"train_f1": 0.9815346716904167, |
|
"train_loss": 0.05348266288638115, |
|
"train_precision": 0.9815797384790222, |
|
"train_recall": 0.9815754841135552, |
|
"train_runtime": 252.062, |
|
"train_samples_per_second": 63.306, |
|
"train_steps_per_second": 0.992 |
|
}, |
|
{ |
|
"epoch": 90.0, |
|
"eval_accuracy": 0.9075535512965051, |
|
"eval_f1": 0.9065308517183118, |
|
"eval_loss": 0.4701833724975586, |
|
"eval_precision": 0.9065469838144254, |
|
"eval_recall": 0.9075535512965051, |
|
"eval_runtime": 29.5689, |
|
"eval_samples_per_second": 59.995, |
|
"eval_steps_per_second": 0.947, |
|
"step": 5625 |
|
}, |
|
{ |
|
"epoch": 90.08, |
|
"learning_rate": 9.258064516129032e-05, |
|
"loss": 0.0977, |
|
"step": 5630 |
|
}, |
|
{ |
|
"epoch": 90.24, |
|
"learning_rate": 9.096774193548387e-05, |
|
"loss": 0.0948, |
|
"step": 5640 |
|
}, |
|
{ |
|
"epoch": 90.4, |
|
"learning_rate": 8.935483870967742e-05, |
|
"loss": 0.0803, |
|
"step": 5650 |
|
}, |
|
{ |
|
"epoch": 90.56, |
|
"learning_rate": 8.774193548387096e-05, |
|
"loss": 0.1025, |
|
"step": 5660 |
|
}, |
|
{ |
|
"epoch": 90.72, |
|
"learning_rate": 8.612903225806452e-05, |
|
"loss": 0.1056, |
|
"step": 5670 |
|
}, |
|
{ |
|
"epoch": 90.88, |
|
"learning_rate": 8.451612903225807e-05, |
|
"loss": 0.1086, |
|
"step": 5680 |
|
}, |
|
{ |
|
"epoch": 90.99, |
|
"step": 5687, |
|
"train_accuracy": 0.9794447577865514, |
|
"train_f1": 0.9794042503142155, |
|
"train_loss": 0.05922425910830498, |
|
"train_precision": 0.979461044879249, |
|
"train_recall": 0.9794447577865514, |
|
"train_runtime": 253.2112, |
|
"train_samples_per_second": 63.019, |
|
"train_steps_per_second": 0.987 |
|
}, |
|
{ |
|
"epoch": 90.99, |
|
"eval_accuracy": 0.9081172491544532, |
|
"eval_f1": 0.9074336656449804, |
|
"eval_loss": 0.4727869927883148, |
|
"eval_precision": 0.9075490421138191, |
|
"eval_recall": 0.9081172491544532, |
|
"eval_runtime": 29.3104, |
|
"eval_samples_per_second": 60.525, |
|
"eval_steps_per_second": 0.955, |
|
"step": 5687 |
|
}, |
|
{ |
|
"epoch": 91.04, |
|
"learning_rate": 8.290322580645161e-05, |
|
"loss": 0.1074, |
|
"step": 5690 |
|
}, |
|
{ |
|
"epoch": 91.2, |
|
"learning_rate": 8.129032258064515e-05, |
|
"loss": 0.1017, |
|
"step": 5700 |
|
}, |
|
{ |
|
"epoch": 91.36, |
|
"learning_rate": 7.967741935483871e-05, |
|
"loss": 0.0971, |
|
"step": 5710 |
|
}, |
|
{ |
|
"epoch": 91.52, |
|
"learning_rate": 7.806451612903226e-05, |
|
"loss": 0.1191, |
|
"step": 5720 |
|
}, |
|
{ |
|
"epoch": 91.68, |
|
"learning_rate": 7.64516129032258e-05, |
|
"loss": 0.0995, |
|
"step": 5730 |
|
}, |
|
{ |
|
"epoch": 91.84, |
|
"learning_rate": 7.483870967741936e-05, |
|
"loss": 0.1142, |
|
"step": 5740 |
|
}, |
|
{ |
|
"epoch": 92.0, |
|
"learning_rate": 7.32258064516129e-05, |
|
"loss": 0.1087, |
|
"step": 5750 |
|
}, |
|
{ |
|
"epoch": 92.0, |
|
"step": 5750, |
|
"train_accuracy": 0.9796954314720813, |
|
"train_f1": 0.9796272548376432, |
|
"train_loss": 0.05848938599228859, |
|
"train_precision": 0.9797640627474504, |
|
"train_recall": 0.9796954314720813, |
|
"train_runtime": 254.0646, |
|
"train_samples_per_second": 62.807, |
|
"train_steps_per_second": 0.984 |
|
}, |
|
{ |
|
"epoch": 92.0, |
|
"eval_accuracy": 0.9075535512965051, |
|
"eval_f1": 0.9065640932569152, |
|
"eval_loss": 0.4691586196422577, |
|
"eval_precision": 0.9068629961295476, |
|
"eval_recall": 0.9075535512965051, |
|
"eval_runtime": 29.6211, |
|
"eval_samples_per_second": 59.89, |
|
"eval_steps_per_second": 0.945, |
|
"step": 5750 |
|
}, |
|
{ |
|
"epoch": 92.16, |
|
"learning_rate": 7.161290322580645e-05, |
|
"loss": 0.1036, |
|
"step": 5760 |
|
}, |
|
{ |
|
"epoch": 92.32, |
|
"learning_rate": 7.000000000000001e-05, |
|
"loss": 0.0991, |
|
"step": 5770 |
|
}, |
|
{ |
|
"epoch": 92.48, |
|
"learning_rate": 6.838709677419355e-05, |
|
"loss": 0.1042, |
|
"step": 5780 |
|
}, |
|
{ |
|
"epoch": 92.64, |
|
"learning_rate": 6.67741935483871e-05, |
|
"loss": 0.0997, |
|
"step": 5790 |
|
}, |
|
{ |
|
"epoch": 92.8, |
|
"learning_rate": 6.516129032258064e-05, |
|
"loss": 0.0921, |
|
"step": 5800 |
|
}, |
|
{ |
|
"epoch": 92.96, |
|
"learning_rate": 6.35483870967742e-05, |
|
"loss": 0.1041, |
|
"step": 5810 |
|
}, |
|
{ |
|
"epoch": 92.99, |
|
"step": 5812, |
|
"train_accuracy": 0.979131415679639, |
|
"train_f1": 0.9790799084691278, |
|
"train_loss": 0.0558781623840332, |
|
"train_precision": 0.9791236279775183, |
|
"train_recall": 0.979131415679639, |
|
"train_runtime": 253.4519, |
|
"train_samples_per_second": 62.959, |
|
"train_steps_per_second": 0.986 |
|
}, |
|
{ |
|
"epoch": 92.99, |
|
"eval_accuracy": 0.9086809470124013, |
|
"eval_f1": 0.9078901238987158, |
|
"eval_loss": 0.45839613676071167, |
|
"eval_precision": 0.9079266988153948, |
|
"eval_recall": 0.9086809470124013, |
|
"eval_runtime": 29.4342, |
|
"eval_samples_per_second": 60.27, |
|
"eval_steps_per_second": 0.951, |
|
"step": 5812 |
|
}, |
|
{ |
|
"epoch": 93.12, |
|
"learning_rate": 6.193548387096774e-05, |
|
"loss": 0.116, |
|
"step": 5820 |
|
}, |
|
{ |
|
"epoch": 93.28, |
|
"learning_rate": 6.0322580645161295e-05, |
|
"loss": 0.103, |
|
"step": 5830 |
|
}, |
|
{ |
|
"epoch": 93.44, |
|
"learning_rate": 5.870967741935484e-05, |
|
"loss": 0.1129, |
|
"step": 5840 |
|
}, |
|
{ |
|
"epoch": 93.6, |
|
"learning_rate": 5.709677419354839e-05, |
|
"loss": 0.1034, |
|
"step": 5850 |
|
}, |
|
{ |
|
"epoch": 93.76, |
|
"learning_rate": 5.5483870967741936e-05, |
|
"loss": 0.1134, |
|
"step": 5860 |
|
}, |
|
{ |
|
"epoch": 93.92, |
|
"learning_rate": 5.387096774193549e-05, |
|
"loss": 0.1109, |
|
"step": 5870 |
|
}, |
|
{ |
|
"epoch": 94.0, |
|
"step": 5875, |
|
"train_accuracy": 0.9796327630506988, |
|
"train_f1": 0.9795750790681897, |
|
"train_loss": 0.05882110819220543, |
|
"train_precision": 0.9796458578935032, |
|
"train_recall": 0.9796327630506988, |
|
"train_runtime": 253.4567, |
|
"train_samples_per_second": 62.957, |
|
"train_steps_per_second": 0.986 |
|
}, |
|
{ |
|
"epoch": 94.0, |
|
"eval_accuracy": 0.9092446448703495, |
|
"eval_f1": 0.9084684905580462, |
|
"eval_loss": 0.45630526542663574, |
|
"eval_precision": 0.9085750924367912, |
|
"eval_recall": 0.9092446448703495, |
|
"eval_runtime": 29.3382, |
|
"eval_samples_per_second": 60.467, |
|
"eval_steps_per_second": 0.954, |
|
"step": 5875 |
|
}, |
|
{ |
|
"epoch": 94.08, |
|
"learning_rate": 5.225806451612904e-05, |
|
"loss": 0.0848, |
|
"step": 5880 |
|
}, |
|
{ |
|
"epoch": 94.24, |
|
"learning_rate": 5.064516129032258e-05, |
|
"loss": 0.1063, |
|
"step": 5890 |
|
}, |
|
{ |
|
"epoch": 94.4, |
|
"learning_rate": 4.9032258064516135e-05, |
|
"loss": 0.0929, |
|
"step": 5900 |
|
}, |
|
{ |
|
"epoch": 94.56, |
|
"learning_rate": 4.741935483870968e-05, |
|
"loss": 0.1039, |
|
"step": 5910 |
|
}, |
|
{ |
|
"epoch": 94.72, |
|
"learning_rate": 4.580645161290323e-05, |
|
"loss": 0.099, |
|
"step": 5920 |
|
}, |
|
{ |
|
"epoch": 94.88, |
|
"learning_rate": 4.4193548387096775e-05, |
|
"loss": 0.1026, |
|
"step": 5930 |
|
}, |
|
{ |
|
"epoch": 94.99, |
|
"step": 5937, |
|
"train_accuracy": 0.9824528420129097, |
|
"train_f1": 0.9824112060096897, |
|
"train_loss": 0.05392773821949959, |
|
"train_precision": 0.9824786275566851, |
|
"train_recall": 0.9824528420129097, |
|
"train_runtime": 252.5661, |
|
"train_samples_per_second": 63.179, |
|
"train_steps_per_second": 0.99 |
|
}, |
|
{ |
|
"epoch": 94.99, |
|
"eval_accuracy": 0.9126268320180383, |
|
"eval_f1": 0.9117417948122799, |
|
"eval_loss": 0.4614848494529724, |
|
"eval_precision": 0.911808467672524, |
|
"eval_recall": 0.9126268320180383, |
|
"eval_runtime": 29.3223, |
|
"eval_samples_per_second": 60.5, |
|
"eval_steps_per_second": 0.955, |
|
"step": 5937 |
|
}, |
|
{ |
|
"epoch": 95.04, |
|
"learning_rate": 4.258064516129032e-05, |
|
"loss": 0.1026, |
|
"step": 5940 |
|
}, |
|
{ |
|
"epoch": 95.2, |
|
"learning_rate": 4.096774193548387e-05, |
|
"loss": 0.0942, |
|
"step": 5950 |
|
}, |
|
{ |
|
"epoch": 95.36, |
|
"learning_rate": 3.9354838709677416e-05, |
|
"loss": 0.0936, |
|
"step": 5960 |
|
}, |
|
{ |
|
"epoch": 95.52, |
|
"learning_rate": 3.774193548387097e-05, |
|
"loss": 0.0833, |
|
"step": 5970 |
|
}, |
|
{ |
|
"epoch": 95.68, |
|
"learning_rate": 3.612903225806452e-05, |
|
"loss": 0.096, |
|
"step": 5980 |
|
}, |
|
{ |
|
"epoch": 95.84, |
|
"learning_rate": 3.451612903225806e-05, |
|
"loss": 0.106, |
|
"step": 5990 |
|
}, |
|
{ |
|
"epoch": 96.0, |
|
"learning_rate": 3.2903225806451614e-05, |
|
"loss": 0.0895, |
|
"step": 6000 |
|
}, |
|
{ |
|
"epoch": 96.0, |
|
"step": 6000, |
|
"train_accuracy": 0.9817634893777025, |
|
"train_f1": 0.9817217910538368, |
|
"train_loss": 0.053316567093133926, |
|
"train_precision": 0.981748670799393, |
|
"train_recall": 0.9817634893777025, |
|
"train_runtime": 254.5693, |
|
"train_samples_per_second": 62.682, |
|
"train_steps_per_second": 0.982 |
|
}, |
|
{ |
|
"epoch": 96.0, |
|
"eval_accuracy": 0.9092446448703495, |
|
"eval_f1": 0.908628347766777, |
|
"eval_loss": 0.4585205316543579, |
|
"eval_precision": 0.9086756206676724, |
|
"eval_recall": 0.9092446448703495, |
|
"eval_runtime": 29.7078, |
|
"eval_samples_per_second": 59.715, |
|
"eval_steps_per_second": 0.943, |
|
"step": 6000 |
|
}, |
|
{ |
|
"epoch": 96.16, |
|
"learning_rate": 3.129032258064516e-05, |
|
"loss": 0.1019, |
|
"step": 6010 |
|
}, |
|
{ |
|
"epoch": 96.32, |
|
"learning_rate": 2.967741935483871e-05, |
|
"loss": 0.1046, |
|
"step": 6020 |
|
}, |
|
{ |
|
"epoch": 96.48, |
|
"learning_rate": 2.806451612903226e-05, |
|
"loss": 0.125, |
|
"step": 6030 |
|
}, |
|
{ |
|
"epoch": 96.64, |
|
"learning_rate": 2.6451612903225806e-05, |
|
"loss": 0.0977, |
|
"step": 6040 |
|
}, |
|
{ |
|
"epoch": 96.8, |
|
"learning_rate": 2.4838709677419354e-05, |
|
"loss": 0.104, |
|
"step": 6050 |
|
}, |
|
{ |
|
"epoch": 96.96, |
|
"learning_rate": 2.3225806451612906e-05, |
|
"loss": 0.1045, |
|
"step": 6060 |
|
}, |
|
{ |
|
"epoch": 96.99, |
|
"step": 6062, |
|
"train_accuracy": 0.9817008209563202, |
|
"train_f1": 0.9816508134314273, |
|
"train_loss": 0.05279777571558952, |
|
"train_precision": 0.9816910608821193, |
|
"train_recall": 0.9817008209563202, |
|
"train_runtime": 252.7534, |
|
"train_samples_per_second": 63.133, |
|
"train_steps_per_second": 0.989 |
|
}, |
|
{ |
|
"epoch": 96.99, |
|
"eval_accuracy": 0.9098083427282976, |
|
"eval_f1": 0.909112926020381, |
|
"eval_loss": 0.45533671975135803, |
|
"eval_precision": 0.9090721377215957, |
|
"eval_recall": 0.9098083427282976, |
|
"eval_runtime": 33.0675, |
|
"eval_samples_per_second": 53.648, |
|
"eval_steps_per_second": 0.847, |
|
"step": 6062 |
|
}, |
|
{ |
|
"epoch": 97.12, |
|
"learning_rate": 2.1612903225806454e-05, |
|
"loss": 0.0862, |
|
"step": 6070 |
|
}, |
|
{ |
|
"epoch": 97.28, |
|
"learning_rate": 2e-05, |
|
"loss": 0.1078, |
|
"step": 6080 |
|
}, |
|
{ |
|
"epoch": 97.44, |
|
"learning_rate": 1.838709677419355e-05, |
|
"loss": 0.1078, |
|
"step": 6090 |
|
}, |
|
{ |
|
"epoch": 97.6, |
|
"learning_rate": 1.6774193548387098e-05, |
|
"loss": 0.107, |
|
"step": 6100 |
|
}, |
|
{ |
|
"epoch": 97.76, |
|
"learning_rate": 1.5161290322580646e-05, |
|
"loss": 0.1139, |
|
"step": 6110 |
|
}, |
|
{ |
|
"epoch": 97.92, |
|
"learning_rate": 1.3548387096774194e-05, |
|
"loss": 0.1081, |
|
"step": 6120 |
|
}, |
|
{ |
|
"epoch": 98.0, |
|
"step": 6125, |
|
"train_accuracy": 0.9812621420066429, |
|
"train_f1": 0.9812114737389049, |
|
"train_loss": 0.054921120405197144, |
|
"train_precision": 0.9812508070970374, |
|
"train_recall": 0.9812621420066429, |
|
"train_runtime": 252.6106, |
|
"train_samples_per_second": 63.168, |
|
"train_steps_per_second": 0.99 |
|
}, |
|
{ |
|
"epoch": 98.0, |
|
"eval_accuracy": 0.9103720405862458, |
|
"eval_f1": 0.9096321309054232, |
|
"eval_loss": 0.4532192647457123, |
|
"eval_precision": 0.9096536769299824, |
|
"eval_recall": 0.9103720405862458, |
|
"eval_runtime": 29.6384, |
|
"eval_samples_per_second": 59.855, |
|
"eval_steps_per_second": 0.945, |
|
"step": 6125 |
|
}, |
|
{ |
|
"epoch": 98.08, |
|
"learning_rate": 1.1935483870967743e-05, |
|
"loss": 0.1011, |
|
"step": 6130 |
|
}, |
|
{ |
|
"epoch": 98.24, |
|
"learning_rate": 1.0322580645161291e-05, |
|
"loss": 0.1031, |
|
"step": 6140 |
|
}, |
|
{ |
|
"epoch": 98.4, |
|
"learning_rate": 8.709677419354838e-06, |
|
"loss": 0.0821, |
|
"step": 6150 |
|
}, |
|
{ |
|
"epoch": 98.56, |
|
"learning_rate": 7.096774193548388e-06, |
|
"loss": 0.0901, |
|
"step": 6160 |
|
}, |
|
{ |
|
"epoch": 98.72, |
|
"learning_rate": 5.483870967741935e-06, |
|
"loss": 0.0809, |
|
"step": 6170 |
|
}, |
|
{ |
|
"epoch": 98.88, |
|
"learning_rate": 3.870967741935484e-06, |
|
"loss": 0.0932, |
|
"step": 6180 |
|
}, |
|
{ |
|
"epoch": 98.99, |
|
"step": 6187, |
|
"train_accuracy": 0.9805101209500533, |
|
"train_f1": 0.9804742522228167, |
|
"train_loss": 0.055186156183481216, |
|
"train_precision": 0.980498073403408, |
|
"train_recall": 0.9805101209500533, |
|
"train_runtime": 254.3736, |
|
"train_samples_per_second": 62.731, |
|
"train_steps_per_second": 0.983 |
|
}, |
|
{ |
|
"epoch": 98.99, |
|
"eval_accuracy": 0.9098083427282976, |
|
"eval_f1": 0.9090900239365977, |
|
"eval_loss": 0.4536750614643097, |
|
"eval_precision": 0.9091114953941556, |
|
"eval_recall": 0.9098083427282976, |
|
"eval_runtime": 29.5537, |
|
"eval_samples_per_second": 60.026, |
|
"eval_steps_per_second": 0.947, |
|
"step": 6187 |
|
}, |
|
{ |
|
"epoch": 99.04, |
|
"learning_rate": 2.2580645161290324e-06, |
|
"loss": 0.1136, |
|
"step": 6190 |
|
}, |
|
{ |
|
"epoch": 99.2, |
|
"learning_rate": 6.451612903225807e-07, |
|
"loss": 0.0934, |
|
"step": 6200 |
|
}, |
|
{ |
|
"epoch": 99.2, |
|
"step": 6200, |
|
"train_accuracy": 0.9809487998997305, |
|
"train_f1": 0.9809066394306372, |
|
"train_loss": 0.05620851740241051, |
|
"train_precision": 0.9809434303564252, |
|
"train_recall": 0.9809487998997305, |
|
"train_runtime": 257.0414, |
|
"train_samples_per_second": 62.08, |
|
"train_steps_per_second": 0.973 |
|
}, |
|
{ |
|
"epoch": 99.2, |
|
"eval_accuracy": 0.9098083427282976, |
|
"eval_f1": 0.9090900239365977, |
|
"eval_loss": 0.4539656639099121, |
|
"eval_precision": 0.9091114953941556, |
|
"eval_recall": 0.9098083427282976, |
|
"eval_runtime": 29.6217, |
|
"eval_samples_per_second": 59.889, |
|
"eval_steps_per_second": 0.945, |
|
"step": 6200 |
|
}, |
|
{ |
|
"epoch": 99.2, |
|
"step": 6200, |
|
"total_flos": 9.4522774317222e+19, |
|
"train_loss": 0.2388173005080992, |
|
"train_runtime": 58791.9316, |
|
"train_samples_per_second": 27.141, |
|
"train_steps_per_second": 0.105 |
|
} |
|
], |
|
"logging_steps": 10, |
|
"max_steps": 6200, |
|
"num_train_epochs": 100, |
|
"save_steps": 500, |
|
"total_flos": 9.4522774317222e+19, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|