|
{ |
|
"best_metric": null, |
|
"best_model_checkpoint": null, |
|
"epoch": 20.8, |
|
"global_step": 5200, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.6, |
|
"learning_rate": 0.0002394, |
|
"loss": 3.4203, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 1.6, |
|
"eval_loss": Infinity, |
|
"eval_runtime": 1205.6526, |
|
"eval_samples_per_second": 3.822, |
|
"eval_steps_per_second": 0.478, |
|
"eval_wer": 0.5028872209091932, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 3.2, |
|
"learning_rate": 0.0002873142857142857, |
|
"loss": 0.4156, |
|
"step": 800 |
|
}, |
|
{ |
|
"epoch": 3.2, |
|
"eval_loss": Infinity, |
|
"eval_runtime": 1205.8762, |
|
"eval_samples_per_second": 3.821, |
|
"eval_steps_per_second": 0.478, |
|
"eval_wer": 0.21501354872780476, |
|
"step": 800 |
|
}, |
|
{ |
|
"epoch": 4.8, |
|
"learning_rate": 0.0002702142857142857, |
|
"loss": 0.248, |
|
"step": 1200 |
|
}, |
|
{ |
|
"epoch": 4.8, |
|
"eval_loss": Infinity, |
|
"eval_runtime": 1206.2112, |
|
"eval_samples_per_second": 3.82, |
|
"eval_steps_per_second": 0.478, |
|
"eval_wer": 0.19620116181423092, |
|
"step": 1200 |
|
}, |
|
{ |
|
"epoch": 6.4, |
|
"learning_rate": 0.00025315714285714284, |
|
"loss": 0.1884, |
|
"step": 1600 |
|
}, |
|
{ |
|
"epoch": 6.4, |
|
"eval_loss": Infinity, |
|
"eval_runtime": 1198.1731, |
|
"eval_samples_per_second": 3.846, |
|
"eval_steps_per_second": 0.481, |
|
"eval_wer": 0.18049675782839433, |
|
"step": 1600 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"learning_rate": 0.00023605714285714283, |
|
"loss": 0.1488, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_loss": Infinity, |
|
"eval_runtime": 1195.3799, |
|
"eval_samples_per_second": 3.855, |
|
"eval_steps_per_second": 0.482, |
|
"eval_wer": 0.18608073829744867, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 9.6, |
|
"learning_rate": 0.00021899999999999998, |
|
"loss": 0.1232, |
|
"step": 2400 |
|
}, |
|
{ |
|
"epoch": 9.6, |
|
"eval_loss": Infinity, |
|
"eval_runtime": 1196.1097, |
|
"eval_samples_per_second": 3.852, |
|
"eval_steps_per_second": 0.482, |
|
"eval_wer": 0.17618540546624073, |
|
"step": 2400 |
|
}, |
|
{ |
|
"epoch": 11.2, |
|
"learning_rate": 0.0002019, |
|
"loss": 0.107, |
|
"step": 2800 |
|
}, |
|
{ |
|
"epoch": 11.2, |
|
"eval_loss": Infinity, |
|
"eval_runtime": 1192.8335, |
|
"eval_samples_per_second": 3.863, |
|
"eval_steps_per_second": 0.483, |
|
"eval_wer": 0.17763118025435248, |
|
"step": 2800 |
|
}, |
|
{ |
|
"epoch": 12.8, |
|
"learning_rate": 0.0001848428571428571, |
|
"loss": 0.2435, |
|
"step": 3200 |
|
}, |
|
{ |
|
"epoch": 12.8, |
|
"eval_loss": Infinity, |
|
"eval_runtime": 1189.2109, |
|
"eval_samples_per_second": 3.875, |
|
"eval_steps_per_second": 0.484, |
|
"eval_wer": 0.5853483278359262, |
|
"step": 3200 |
|
}, |
|
{ |
|
"epoch": 14.4, |
|
"learning_rate": 0.00016774285714285715, |
|
"loss": 0.7331, |
|
"step": 3600 |
|
}, |
|
{ |
|
"epoch": 14.4, |
|
"eval_loss": Infinity, |
|
"eval_runtime": 1196.7777, |
|
"eval_samples_per_second": 3.85, |
|
"eval_steps_per_second": 0.481, |
|
"eval_wer": 0.5020128301690777, |
|
"step": 3600 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"learning_rate": 0.0001506857142857143, |
|
"loss": 0.5402, |
|
"step": 4000 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"eval_loss": Infinity, |
|
"eval_runtime": 1194.9864, |
|
"eval_samples_per_second": 3.856, |
|
"eval_steps_per_second": 0.482, |
|
"eval_wer": 0.29286895393432544, |
|
"step": 4000 |
|
}, |
|
{ |
|
"epoch": 17.6, |
|
"learning_rate": 0.00013358571428571426, |
|
"loss": 1.3361, |
|
"step": 4400 |
|
}, |
|
{ |
|
"epoch": 17.6, |
|
"eval_loss": Infinity, |
|
"eval_runtime": 1207.0654, |
|
"eval_samples_per_second": 3.818, |
|
"eval_steps_per_second": 0.477, |
|
"eval_wer": 0.9734566137703555, |
|
"step": 4400 |
|
}, |
|
{ |
|
"epoch": 19.2, |
|
"learning_rate": 0.0001165285714285714, |
|
"loss": 0.9035, |
|
"step": 4800 |
|
}, |
|
{ |
|
"epoch": 19.2, |
|
"eval_loss": Infinity, |
|
"eval_runtime": 1210.7223, |
|
"eval_samples_per_second": 3.806, |
|
"eval_steps_per_second": 0.476, |
|
"eval_wer": 0.4126085413257841, |
|
"step": 4800 |
|
}, |
|
{ |
|
"epoch": 20.8, |
|
"learning_rate": 9.947142857142856e-05, |
|
"loss": 0.5824, |
|
"step": 5200 |
|
}, |
|
{ |
|
"epoch": 20.8, |
|
"eval_loss": Infinity, |
|
"eval_runtime": 1209.2109, |
|
"eval_samples_per_second": 3.811, |
|
"eval_steps_per_second": 0.476, |
|
"eval_wer": 0.2804110502211949, |
|
"step": 5200 |
|
} |
|
], |
|
"max_steps": 7500, |
|
"num_train_epochs": 30, |
|
"total_flos": 8.725540278590487e+19, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|