wav2vec2-xls-r-300m-italian / trainer_state.json
g8a9's picture
End of training
85f14aa
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 5.0,
"global_step": 11395,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.04,
"eval_loss": Infinity,
"eval_runtime": 762.0088,
"eval_samples_per_second": 19.376,
"eval_steps_per_second": 2.423,
"eval_wer": 1.0,
"step": 100
},
{
"epoch": 0.09,
"eval_loss": Infinity,
"eval_runtime": 760.7665,
"eval_samples_per_second": 19.408,
"eval_steps_per_second": 2.427,
"eval_wer": 0.9983381717130623,
"step": 200
},
{
"epoch": 0.13,
"eval_loss": Infinity,
"eval_runtime": 758.492,
"eval_samples_per_second": 19.466,
"eval_steps_per_second": 2.434,
"eval_wer": 0.7671578598961529,
"step": 300
},
{
"epoch": 0.18,
"eval_loss": Infinity,
"eval_runtime": 763.9298,
"eval_samples_per_second": 19.328,
"eval_steps_per_second": 2.416,
"eval_wer": 0.6919342715882527,
"step": 400
},
{
"epoch": 0.22,
"learning_rate": 0.000996,
"loss": 2.9929,
"step": 500
},
{
"epoch": 0.22,
"eval_loss": Infinity,
"eval_runtime": 771.5199,
"eval_samples_per_second": 19.138,
"eval_steps_per_second": 2.393,
"eval_wer": 0.6265920108122272,
"step": 500
},
{
"epoch": 0.26,
"eval_loss": Infinity,
"eval_runtime": 768.8673,
"eval_samples_per_second": 19.204,
"eval_steps_per_second": 2.401,
"eval_wer": 0.5512649892084595,
"step": 600
},
{
"epoch": 0.31,
"eval_loss": Infinity,
"eval_runtime": 774.562,
"eval_samples_per_second": 19.062,
"eval_steps_per_second": 2.383,
"eval_wer": 0.508133304831714,
"step": 700
},
{
"epoch": 0.35,
"eval_loss": Infinity,
"eval_runtime": 770.4155,
"eval_samples_per_second": 19.165,
"eval_steps_per_second": 2.396,
"eval_wer": 0.4944870053302625,
"step": 800
},
{
"epoch": 0.39,
"eval_loss": Infinity,
"eval_runtime": 769.5888,
"eval_samples_per_second": 19.186,
"eval_steps_per_second": 2.399,
"eval_wer": 0.4720419801270161,
"step": 900
},
{
"epoch": 0.44,
"learning_rate": 0.0009542909591555759,
"loss": 0.5311,
"step": 1000
},
{
"epoch": 0.44,
"eval_loss": Infinity,
"eval_runtime": 772.8626,
"eval_samples_per_second": 19.104,
"eval_steps_per_second": 2.389,
"eval_wer": 0.4387433544107405,
"step": 1000
},
{
"epoch": 0.48,
"eval_loss": Infinity,
"eval_runtime": 769.5289,
"eval_samples_per_second": 19.187,
"eval_steps_per_second": 2.399,
"eval_wer": 0.4410533646851146,
"step": 1100
},
{
"epoch": 0.53,
"eval_loss": Infinity,
"eval_runtime": 780.8054,
"eval_samples_per_second": 18.91,
"eval_steps_per_second": 2.364,
"eval_wer": 0.44290826845767167,
"step": 1200
},
{
"epoch": 0.57,
"eval_loss": Infinity,
"eval_runtime": 774.2302,
"eval_samples_per_second": 19.071,
"eval_steps_per_second": 2.384,
"eval_wer": 0.43216499679356785,
"step": 1300
},
{
"epoch": 0.61,
"eval_loss": Infinity,
"eval_runtime": 768.9729,
"eval_samples_per_second": 19.201,
"eval_steps_per_second": 2.401,
"eval_wer": 0.4531826425138428,
"step": 1400
},
{
"epoch": 0.66,
"learning_rate": 0.0009083983478659936,
"loss": 0.4654,
"step": 1500
},
{
"epoch": 0.66,
"eval_loss": Infinity,
"eval_runtime": 777.4905,
"eval_samples_per_second": 18.991,
"eval_steps_per_second": 2.374,
"eval_wer": 0.44915563952806836,
"step": 1500
},
{
"epoch": 0.7,
"eval_loss": Infinity,
"eval_runtime": 773.9985,
"eval_samples_per_second": 19.076,
"eval_steps_per_second": 2.385,
"eval_wer": 0.3878817550561643,
"step": 1600
},
{
"epoch": 0.75,
"eval_loss": Infinity,
"eval_runtime": 773.8841,
"eval_samples_per_second": 19.079,
"eval_steps_per_second": 2.385,
"eval_wer": 0.3835927210541922,
"step": 1700
},
{
"epoch": 0.79,
"eval_loss": Infinity,
"eval_runtime": 773.515,
"eval_samples_per_second": 19.088,
"eval_steps_per_second": 2.387,
"eval_wer": 0.37425614221388626,
"step": 1800
},
{
"epoch": 0.83,
"eval_loss": Infinity,
"eval_runtime": 774.3742,
"eval_samples_per_second": 19.067,
"eval_steps_per_second": 2.384,
"eval_wer": 0.36867074423704155,
"step": 1900
},
{
"epoch": 0.88,
"learning_rate": 0.0008625975217989904,
"loss": 0.4254,
"step": 2000
},
{
"epoch": 0.88,
"eval_loss": Infinity,
"eval_runtime": 774.0591,
"eval_samples_per_second": 19.075,
"eval_steps_per_second": 2.385,
"eval_wer": 0.3792830003930465,
"step": 2000
},
{
"epoch": 0.92,
"eval_loss": Infinity,
"eval_runtime": 768.0215,
"eval_samples_per_second": 19.225,
"eval_steps_per_second": 2.404,
"eval_wer": 0.3766006302535495,
"step": 2100
},
{
"epoch": 0.97,
"eval_loss": Infinity,
"eval_runtime": 772.2372,
"eval_samples_per_second": 19.12,
"eval_steps_per_second": 2.39,
"eval_wer": 0.3705256480095986,
"step": 2200
},
{
"epoch": 1.01,
"eval_loss": Infinity,
"eval_runtime": 767.2028,
"eval_samples_per_second": 19.245,
"eval_steps_per_second": 2.406,
"eval_wer": 0.3271802014880604,
"step": 2300
},
{
"epoch": 1.05,
"eval_loss": Infinity,
"eval_runtime": 768.4281,
"eval_samples_per_second": 19.215,
"eval_steps_per_second": 2.402,
"eval_wer": 0.31850559574130644,
"step": 2400
},
{
"epoch": 1.1,
"learning_rate": 0.000816704910509408,
"loss": 0.3997,
"step": 2500
},
{
"epoch": 1.1,
"eval_loss": Infinity,
"eval_runtime": 767.2666,
"eval_samples_per_second": 19.244,
"eval_steps_per_second": 2.406,
"eval_wer": 0.3244426669241006,
"step": 2500
},
{
"epoch": 1.14,
"eval_loss": Infinity,
"eval_runtime": 767.2447,
"eval_samples_per_second": 19.244,
"eval_steps_per_second": 2.406,
"eval_wer": 0.30816916170761477,
"step": 2600
},
{
"epoch": 1.18,
"eval_loss": Infinity,
"eval_runtime": 771.1785,
"eval_samples_per_second": 19.146,
"eval_steps_per_second": 2.394,
"eval_wer": 0.30403872542597277,
"step": 2700
},
{
"epoch": 1.23,
"eval_loss": Infinity,
"eval_runtime": 761.2544,
"eval_samples_per_second": 19.396,
"eval_steps_per_second": 2.425,
"eval_wer": 0.30282510808779417,
"step": 2800
},
{
"epoch": 1.27,
"eval_loss": Infinity,
"eval_runtime": 770.9042,
"eval_samples_per_second": 19.153,
"eval_steps_per_second": 2.395,
"eval_wer": 0.3112101006061191,
"step": 2900
},
{
"epoch": 1.32,
"learning_rate": 0.0007709040844424048,
"loss": 0.3668,
"step": 3000
},
{
"epoch": 1.32,
"eval_loss": Infinity,
"eval_runtime": 763.6174,
"eval_samples_per_second": 19.336,
"eval_steps_per_second": 2.417,
"eval_wer": 0.31098944290826847,
"step": 3000
},
{
"epoch": 1.36,
"eval_loss": Infinity,
"eval_runtime": 765.7415,
"eval_samples_per_second": 19.282,
"eval_steps_per_second": 2.411,
"eval_wer": 0.3066521400348915,
"step": 3100
},
{
"epoch": 1.4,
"eval_loss": Infinity,
"eval_runtime": 762.1465,
"eval_samples_per_second": 19.373,
"eval_steps_per_second": 2.422,
"eval_wer": 0.29612952606863835,
"step": 3200
},
{
"epoch": 1.45,
"eval_loss": Infinity,
"eval_runtime": 764.1293,
"eval_samples_per_second": 19.323,
"eval_steps_per_second": 2.416,
"eval_wer": 0.3080933106239786,
"step": 3300
},
{
"epoch": 1.49,
"eval_loss": Infinity,
"eval_runtime": 764.6533,
"eval_samples_per_second": 19.309,
"eval_steps_per_second": 2.414,
"eval_wer": 0.2936195447555871,
"step": 3400
},
{
"epoch": 1.54,
"learning_rate": 0.0007250114731528225,
"loss": 0.3645,
"step": 3500
},
{
"epoch": 1.54,
"eval_loss": Infinity,
"eval_runtime": 762.2683,
"eval_samples_per_second": 19.37,
"eval_steps_per_second": 2.422,
"eval_wer": 0.30368015666696546,
"step": 3500
},
{
"epoch": 1.58,
"eval_loss": Infinity,
"eval_runtime": 760.0026,
"eval_samples_per_second": 19.428,
"eval_steps_per_second": 2.429,
"eval_wer": 0.2973914122782218,
"step": 3600
},
{
"epoch": 1.62,
"eval_loss": Infinity,
"eval_runtime": 760.5942,
"eval_samples_per_second": 19.412,
"eval_steps_per_second": 2.427,
"eval_wer": 0.30096330876217925,
"step": 3700
},
{
"epoch": 1.67,
"eval_loss": Infinity,
"eval_runtime": 761.2356,
"eval_samples_per_second": 19.396,
"eval_steps_per_second": 2.425,
"eval_wer": 0.2985498651919377,
"step": 3800
},
{
"epoch": 1.71,
"eval_loss": Infinity,
"eval_runtime": 767.0946,
"eval_samples_per_second": 19.248,
"eval_steps_per_second": 2.406,
"eval_wer": 0.2975775922107833,
"step": 3900
},
{
"epoch": 1.76,
"learning_rate": 0.00067911886186324,
"loss": 0.3624,
"step": 4000
},
{
"epoch": 1.76,
"eval_loss": Infinity,
"eval_runtime": 764.3373,
"eval_samples_per_second": 19.317,
"eval_steps_per_second": 2.415,
"eval_wer": 0.292757600623358,
"step": 4000
},
{
"epoch": 1.8,
"eval_loss": Infinity,
"eval_runtime": 778.1044,
"eval_samples_per_second": 18.976,
"eval_steps_per_second": 2.372,
"eval_wer": 0.2859516897552768,
"step": 4100
},
{
"epoch": 1.84,
"eval_loss": Infinity,
"eval_runtime": 780.7174,
"eval_samples_per_second": 18.912,
"eval_steps_per_second": 2.364,
"eval_wer": 0.29222664303790485,
"step": 4200
},
{
"epoch": 1.89,
"eval_loss": Infinity,
"eval_runtime": 778.463,
"eval_samples_per_second": 18.967,
"eval_steps_per_second": 2.371,
"eval_wer": 0.2865929761896553,
"step": 4300
},
{
"epoch": 1.93,
"eval_loss": Infinity,
"eval_runtime": 777.1309,
"eval_samples_per_second": 18.999,
"eval_steps_per_second": 2.375,
"eval_wer": 0.2775529061308362,
"step": 4400
},
{
"epoch": 1.97,
"learning_rate": 0.0006332262505736577,
"loss": 0.3527,
"step": 4500
},
{
"epoch": 1.97,
"eval_loss": Infinity,
"eval_runtime": 776.0915,
"eval_samples_per_second": 19.025,
"eval_steps_per_second": 2.379,
"eval_wer": 0.27924921218306314,
"step": 4500
},
{
"epoch": 2.02,
"eval_loss": Infinity,
"eval_runtime": 777.8615,
"eval_samples_per_second": 18.982,
"eval_steps_per_second": 2.373,
"eval_wer": 0.2857655098227153,
"step": 4600
},
{
"epoch": 2.06,
"eval_loss": Infinity,
"eval_runtime": 779.7088,
"eval_samples_per_second": 18.937,
"eval_steps_per_second": 2.368,
"eval_wer": 0.27665648423331796,
"step": 4700
},
{
"epoch": 2.11,
"eval_loss": Infinity,
"eval_runtime": 780.5896,
"eval_samples_per_second": 18.915,
"eval_steps_per_second": 2.365,
"eval_wer": 0.28240047993049283,
"step": 4800
},
{
"epoch": 2.15,
"eval_loss": Infinity,
"eval_runtime": 781.7435,
"eval_samples_per_second": 18.887,
"eval_steps_per_second": 2.361,
"eval_wer": 0.27986291640521027,
"step": 4900
},
{
"epoch": 2.19,
"learning_rate": 0.0005873336392840752,
"loss": 0.3162,
"step": 5000
},
{
"epoch": 2.19,
"eval_loss": Infinity,
"eval_runtime": 785.7508,
"eval_samples_per_second": 18.791,
"eval_steps_per_second": 2.349,
"eval_wer": 0.26727853207466507,
"step": 5000
},
{
"epoch": 2.24,
"eval_loss": Infinity,
"eval_runtime": 789.097,
"eval_samples_per_second": 18.711,
"eval_steps_per_second": 2.339,
"eval_wer": 0.2961915860461588,
"step": 5100
},
{
"epoch": 2.28,
"eval_loss": Infinity,
"eval_runtime": 782.4986,
"eval_samples_per_second": 18.869,
"eval_steps_per_second": 2.359,
"eval_wer": 0.2735948586756401,
"step": 5200
},
{
"epoch": 2.33,
"eval_loss": Infinity,
"eval_runtime": 780.5596,
"eval_samples_per_second": 18.916,
"eval_steps_per_second": 2.365,
"eval_wer": 0.2651547017328525,
"step": 5300
},
{
"epoch": 2.37,
"eval_loss": Infinity,
"eval_runtime": 782.8773,
"eval_samples_per_second": 18.86,
"eval_steps_per_second": 2.358,
"eval_wer": 0.2550527165031271,
"step": 5400
},
{
"epoch": 2.41,
"learning_rate": 0.0005414410279944929,
"loss": 0.3063,
"step": 5500
},
{
"epoch": 2.41,
"eval_loss": Infinity,
"eval_runtime": 779.9742,
"eval_samples_per_second": 18.93,
"eval_steps_per_second": 2.367,
"eval_wer": 0.26804393846408453,
"step": 5500
},
{
"epoch": 2.46,
"eval_loss": Infinity,
"eval_runtime": 783.4711,
"eval_samples_per_second": 18.846,
"eval_steps_per_second": 2.356,
"eval_wer": 0.2557767495741996,
"step": 5600
},
{
"epoch": 2.5,
"eval_loss": Infinity,
"eval_runtime": 792.9653,
"eval_samples_per_second": 18.62,
"eval_steps_per_second": 2.328,
"eval_wer": 0.2597830659008006,
"step": 5700
},
{
"epoch": 2.54,
"eval_loss": Infinity,
"eval_runtime": 788.5494,
"eval_samples_per_second": 18.724,
"eval_steps_per_second": 2.341,
"eval_wer": 0.25175664214148297,
"step": 5800
},
{
"epoch": 2.59,
"eval_loss": Infinity,
"eval_runtime": 777.5477,
"eval_samples_per_second": 18.989,
"eval_steps_per_second": 2.374,
"eval_wer": 0.254149399052551,
"step": 5900
},
{
"epoch": 2.63,
"learning_rate": 0.0004955484167049105,
"loss": 0.2913,
"step": 6000
},
{
"epoch": 2.63,
"eval_loss": Infinity,
"eval_runtime": 785.1255,
"eval_samples_per_second": 18.806,
"eval_steps_per_second": 2.351,
"eval_wer": 0.2507361002889237,
"step": 6000
},
{
"epoch": 2.68,
"eval_loss": Infinity,
"eval_runtime": 785.3479,
"eval_samples_per_second": 18.801,
"eval_steps_per_second": 2.351,
"eval_wer": 0.24998448500561987,
"step": 6100
},
{
"epoch": 2.72,
"eval_loss": Infinity,
"eval_runtime": 781.3987,
"eval_samples_per_second": 18.896,
"eval_steps_per_second": 2.362,
"eval_wer": 0.24352335179043036,
"step": 6200
},
{
"epoch": 2.76,
"eval_loss": Infinity,
"eval_runtime": 781.4686,
"eval_samples_per_second": 18.894,
"eval_steps_per_second": 2.362,
"eval_wer": 0.23755180284234698,
"step": 6300
},
{
"epoch": 2.81,
"eval_loss": Infinity,
"eval_runtime": 775.7634,
"eval_samples_per_second": 19.033,
"eval_steps_per_second": 2.38,
"eval_wer": 0.23476599940698245,
"step": 6400
},
{
"epoch": 2.85,
"learning_rate": 0.0004497475906379073,
"loss": 0.2797,
"step": 6500
},
{
"epoch": 2.85,
"eval_loss": Infinity,
"eval_runtime": 772.9219,
"eval_samples_per_second": 19.103,
"eval_steps_per_second": 2.388,
"eval_wer": 0.2512049978968563,
"step": 6500
},
{
"epoch": 2.9,
"eval_loss": Infinity,
"eval_runtime": 771.2336,
"eval_samples_per_second": 19.145,
"eval_steps_per_second": 2.394,
"eval_wer": 0.23818619372366762,
"step": 6600
},
{
"epoch": 2.94,
"eval_loss": Infinity,
"eval_runtime": 777.0185,
"eval_samples_per_second": 19.002,
"eval_steps_per_second": 2.376,
"eval_wer": 0.2523082863861096,
"step": 6700
},
{
"epoch": 2.98,
"eval_loss": Infinity,
"eval_runtime": 773.6017,
"eval_samples_per_second": 19.086,
"eval_steps_per_second": 2.386,
"eval_wer": 0.25221864419635776,
"step": 6800
},
{
"epoch": 3.03,
"eval_loss": Infinity,
"eval_runtime": 780.1394,
"eval_samples_per_second": 18.926,
"eval_steps_per_second": 2.366,
"eval_wer": 0.24091683273456949,
"step": 6900
},
{
"epoch": 3.07,
"learning_rate": 0.0004038549793483249,
"loss": 0.2766,
"step": 7000
},
{
"epoch": 3.07,
"eval_loss": Infinity,
"eval_runtime": 783.1904,
"eval_samples_per_second": 18.852,
"eval_steps_per_second": 2.357,
"eval_wer": 0.24534377779769825,
"step": 7000
},
{
"epoch": 3.12,
"eval_loss": Infinity,
"eval_runtime": 777.1186,
"eval_samples_per_second": 19.0,
"eval_steps_per_second": 2.375,
"eval_wer": 0.2326076912998807,
"step": 7100
},
{
"epoch": 3.16,
"eval_loss": Infinity,
"eval_runtime": 781.1613,
"eval_samples_per_second": 18.901,
"eval_steps_per_second": 2.363,
"eval_wer": 0.22860137497327973,
"step": 7200
},
{
"epoch": 3.2,
"eval_loss": Infinity,
"eval_runtime": 786.2675,
"eval_samples_per_second": 18.779,
"eval_steps_per_second": 2.348,
"eval_wer": 0.23420745960929795,
"step": 7300
},
{
"epoch": 3.25,
"eval_loss": Infinity,
"eval_runtime": 781.7233,
"eval_samples_per_second": 18.888,
"eval_steps_per_second": 2.361,
"eval_wer": 0.23047006985195248,
"step": 7400
},
{
"epoch": 3.29,
"learning_rate": 0.0003579623680587425,
"loss": 0.2468,
"step": 7500
},
{
"epoch": 3.29,
"eval_loss": Infinity,
"eval_runtime": 777.7207,
"eval_samples_per_second": 18.985,
"eval_steps_per_second": 2.374,
"eval_wer": 0.2238089655980858,
"step": 7500
},
{
"epoch": 3.33,
"eval_loss": Infinity,
"eval_runtime": 786.7846,
"eval_samples_per_second": 18.766,
"eval_steps_per_second": 2.346,
"eval_wer": 0.23211121147971672,
"step": 7600
},
{
"epoch": 3.38,
"eval_loss": Infinity,
"eval_runtime": 784.5553,
"eval_samples_per_second": 18.82,
"eval_steps_per_second": 2.353,
"eval_wer": 0.23048386095806814,
"step": 7700
},
{
"epoch": 3.42,
"eval_loss": Infinity,
"eval_runtime": 776.8796,
"eval_samples_per_second": 19.006,
"eval_steps_per_second": 2.376,
"eval_wer": 0.21740989236041677,
"step": 7800
},
{
"epoch": 3.47,
"eval_loss": Infinity,
"eval_runtime": 778.8968,
"eval_samples_per_second": 18.956,
"eval_steps_per_second": 2.37,
"eval_wer": 0.22008536694685596,
"step": 7900
},
{
"epoch": 3.51,
"learning_rate": 0.00031206975676916014,
"loss": 0.2439,
"step": 8000
},
{
"epoch": 3.51,
"eval_loss": Infinity,
"eval_runtime": 785.8625,
"eval_samples_per_second": 18.788,
"eval_steps_per_second": 2.349,
"eval_wer": 0.21332772495017963,
"step": 8000
},
{
"epoch": 3.55,
"eval_loss": Infinity,
"eval_runtime": 778.9388,
"eval_samples_per_second": 18.955,
"eval_steps_per_second": 2.37,
"eval_wer": 0.22168513525627323,
"step": 8100
},
{
"epoch": 3.6,
"eval_loss": Infinity,
"eval_runtime": 779.3965,
"eval_samples_per_second": 18.944,
"eval_steps_per_second": 2.368,
"eval_wer": 0.21885106294950388,
"step": 8200
},
{
"epoch": 3.64,
"eval_loss": Infinity,
"eval_runtime": 786.4104,
"eval_samples_per_second": 18.775,
"eval_steps_per_second": 2.347,
"eval_wer": 0.2105212348556416,
"step": 8300
},
{
"epoch": 3.69,
"eval_loss": Infinity,
"eval_runtime": 784.1132,
"eval_samples_per_second": 18.83,
"eval_steps_per_second": 2.354,
"eval_wer": 0.21176932995910938,
"step": 8400
},
{
"epoch": 3.73,
"learning_rate": 0.0002661771454795778,
"loss": 0.2357,
"step": 8500
},
{
"epoch": 3.73,
"eval_loss": Infinity,
"eval_runtime": 776.0702,
"eval_samples_per_second": 19.025,
"eval_steps_per_second": 2.379,
"eval_wer": 0.20932830417663648,
"step": 8500
},
{
"epoch": 3.77,
"eval_loss": Infinity,
"eval_runtime": 777.6609,
"eval_samples_per_second": 18.986,
"eval_steps_per_second": 2.374,
"eval_wer": 0.21030747271084876,
"step": 8600
},
{
"epoch": 3.82,
"eval_loss": Infinity,
"eval_runtime": 773.9787,
"eval_samples_per_second": 19.077,
"eval_steps_per_second": 2.385,
"eval_wer": 0.20353603960805677,
"step": 8700
},
{
"epoch": 3.86,
"eval_loss": Infinity,
"eval_runtime": 780.5659,
"eval_samples_per_second": 18.916,
"eval_steps_per_second": 2.365,
"eval_wer": 0.2019362712986395,
"step": 8800
},
{
"epoch": 3.91,
"eval_loss": Infinity,
"eval_runtime": 779.996,
"eval_samples_per_second": 18.93,
"eval_steps_per_second": 2.367,
"eval_wer": 0.20323953082656995,
"step": 8900
},
{
"epoch": 3.95,
"learning_rate": 0.0002203763194125746,
"loss": 0.2217,
"step": 9000
},
{
"epoch": 3.95,
"eval_loss": Infinity,
"eval_runtime": 778.6538,
"eval_samples_per_second": 18.962,
"eval_steps_per_second": 2.371,
"eval_wer": 0.20561849663152232,
"step": 9000
},
{
"epoch": 3.99,
"eval_loss": Infinity,
"eval_runtime": 778.3405,
"eval_samples_per_second": 18.97,
"eval_steps_per_second": 2.372,
"eval_wer": 0.20215003344343233,
"step": 9100
},
{
"epoch": 4.04,
"eval_loss": Infinity,
"eval_runtime": 787.2038,
"eval_samples_per_second": 18.756,
"eval_steps_per_second": 2.345,
"eval_wer": 0.19324787444576993,
"step": 9200
},
{
"epoch": 4.08,
"eval_loss": Infinity,
"eval_runtime": 775.7143,
"eval_samples_per_second": 19.034,
"eval_steps_per_second": 2.38,
"eval_wer": 0.19350300990890976,
"step": 9300
},
{
"epoch": 4.12,
"eval_loss": Infinity,
"eval_runtime": 773.9153,
"eval_samples_per_second": 19.078,
"eval_steps_per_second": 2.385,
"eval_wer": 0.1905655043062729,
"step": 9400
},
{
"epoch": 4.17,
"learning_rate": 0.0001744837081229922,
"loss": 0.2025,
"step": 9500
},
{
"epoch": 4.17,
"eval_loss": Infinity,
"eval_runtime": 779.0392,
"eval_samples_per_second": 18.953,
"eval_steps_per_second": 2.37,
"eval_wer": 0.18794519414429633,
"step": 9500
},
{
"epoch": 4.21,
"eval_loss": Infinity,
"eval_runtime": 779.0747,
"eval_samples_per_second": 18.952,
"eval_steps_per_second": 2.369,
"eval_wer": 0.18824859847884098,
"step": 9600
},
{
"epoch": 4.26,
"eval_loss": Infinity,
"eval_runtime": 777.6573,
"eval_samples_per_second": 18.987,
"eval_steps_per_second": 2.374,
"eval_wer": 0.18538004840678246,
"step": 9700
},
{
"epoch": 4.3,
"eval_loss": Infinity,
"eval_runtime": 772.7615,
"eval_samples_per_second": 19.107,
"eval_steps_per_second": 2.389,
"eval_wer": 0.18654539687355626,
"step": 9800
},
{
"epoch": 4.34,
"eval_loss": Infinity,
"eval_runtime": 778.0179,
"eval_samples_per_second": 18.978,
"eval_steps_per_second": 2.373,
"eval_wer": 0.18438708876645452,
"step": 9900
},
{
"epoch": 4.39,
"learning_rate": 0.00012859109683340984,
"loss": 0.1869,
"step": 10000
},
{
"epoch": 4.39,
"eval_loss": Infinity,
"eval_runtime": 778.8028,
"eval_samples_per_second": 18.959,
"eval_steps_per_second": 2.37,
"eval_wer": 0.1821667206818323,
"step": 10000
},
{
"epoch": 4.43,
"eval_loss": Infinity,
"eval_runtime": 777.366,
"eval_samples_per_second": 18.994,
"eval_steps_per_second": 2.375,
"eval_wer": 0.1815461209066273,
"step": 10100
},
{
"epoch": 4.48,
"eval_loss": Infinity,
"eval_runtime": 781.9611,
"eval_samples_per_second": 18.882,
"eval_steps_per_second": 2.361,
"eval_wer": 0.18118755214762,
"step": 10200
},
{
"epoch": 4.52,
"eval_loss": Infinity,
"eval_runtime": 760.9314,
"eval_samples_per_second": 19.404,
"eval_steps_per_second": 2.426,
"eval_wer": 0.17923611063225325,
"step": 10300
},
{
"epoch": 4.56,
"eval_loss": Infinity,
"eval_runtime": 761.9088,
"eval_samples_per_second": 19.379,
"eval_steps_per_second": 2.423,
"eval_wer": 0.17967742602795458,
"step": 10400
},
{
"epoch": 4.61,
"learning_rate": 8.269848554382745e-05,
"loss": 0.1863,
"step": 10500
},
{
"epoch": 4.61,
"eval_loss": Infinity,
"eval_runtime": 760.7934,
"eval_samples_per_second": 19.407,
"eval_steps_per_second": 2.426,
"eval_wer": 0.1773812068596962,
"step": 10500
},
{
"epoch": 4.65,
"eval_loss": Infinity,
"eval_runtime": 755.7192,
"eval_samples_per_second": 19.538,
"eval_steps_per_second": 2.443,
"eval_wer": 0.1767330248722599,
"step": 10600
},
{
"epoch": 4.7,
"eval_loss": Infinity,
"eval_runtime": 756.3189,
"eval_samples_per_second": 19.522,
"eval_steps_per_second": 2.441,
"eval_wer": 0.17650547162135138,
"step": 10700
},
{
"epoch": 4.74,
"eval_loss": Infinity,
"eval_runtime": 761.0501,
"eval_samples_per_second": 19.401,
"eval_steps_per_second": 2.426,
"eval_wer": 0.1752918542831728,
"step": 10800
},
{
"epoch": 4.78,
"eval_loss": Infinity,
"eval_runtime": 756.3701,
"eval_samples_per_second": 19.521,
"eval_steps_per_second": 2.441,
"eval_wer": 0.17308527730466622,
"step": 10900
},
{
"epoch": 4.83,
"learning_rate": 3.6805874254245066e-05,
"loss": 0.178,
"step": 11000
},
{
"epoch": 4.83,
"eval_loss": Infinity,
"eval_runtime": 758.6147,
"eval_samples_per_second": 19.463,
"eval_steps_per_second": 2.433,
"eval_wer": 0.17265775301508057,
"step": 11000
},
{
"epoch": 4.87,
"eval_loss": Infinity,
"eval_runtime": 759.5074,
"eval_samples_per_second": 19.44,
"eval_steps_per_second": 2.431,
"eval_wer": 0.17243709531722992,
"step": 11100
},
{
"epoch": 4.91,
"eval_loss": Infinity,
"eval_runtime": 757.3653,
"eval_samples_per_second": 19.495,
"eval_steps_per_second": 2.437,
"eval_wer": 0.17223022872549493,
"step": 11200
},
{
"epoch": 4.96,
"eval_loss": Infinity,
"eval_runtime": 756.4761,
"eval_samples_per_second": 19.518,
"eval_steps_per_second": 2.44,
"eval_wer": 0.17115452244847298,
"step": 11300
},
{
"epoch": 5.0,
"step": 11395,
"total_flos": 1.0194681891264653e+20,
"train_loss": 0.4200820018974194,
"train_runtime": 124144.1421,
"train_samples_per_second": 5.872,
"train_steps_per_second": 0.092
}
],
"max_steps": 11395,
"num_train_epochs": 5,
"total_flos": 1.0194681891264653e+20,
"trial_name": null,
"trial_params": null
}