|
{ |
|
"best_metric": 30.481593707691317, |
|
"best_model_checkpoint": "./checkpoint-200", |
|
"epoch": 38.012, |
|
"global_step": 500, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.02, |
|
"learning_rate": 2.3000000000000004e-06, |
|
"loss": 1.7169, |
|
"step": 25 |
|
}, |
|
{ |
|
"epoch": 3.02, |
|
"learning_rate": 4.800000000000001e-06, |
|
"loss": 0.8922, |
|
"step": 50 |
|
}, |
|
{ |
|
"epoch": 5.02, |
|
"learning_rate": 7.3e-06, |
|
"loss": 0.4752, |
|
"step": 75 |
|
}, |
|
{ |
|
"epoch": 7.02, |
|
"learning_rate": 9.800000000000001e-06, |
|
"loss": 0.2693, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 7.02, |
|
"eval_loss": 0.6740689277648926, |
|
"eval_runtime": 1376.3341, |
|
"eval_samples_per_second": 0.732, |
|
"eval_steps_per_second": 0.023, |
|
"eval_wer": 35.48449487460512, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 9.02, |
|
"learning_rate": 9.425e-06, |
|
"loss": 0.1224, |
|
"step": 125 |
|
}, |
|
{ |
|
"epoch": 11.01, |
|
"learning_rate": 8.8e-06, |
|
"loss": 0.0482, |
|
"step": 150 |
|
}, |
|
{ |
|
"epoch": 13.01, |
|
"learning_rate": 8.175e-06, |
|
"loss": 0.0171, |
|
"step": 175 |
|
}, |
|
{ |
|
"epoch": 15.01, |
|
"learning_rate": 7.5500000000000006e-06, |
|
"loss": 0.0084, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 15.01, |
|
"eval_loss": 0.7756175398826599, |
|
"eval_runtime": 955.7345, |
|
"eval_samples_per_second": 1.055, |
|
"eval_steps_per_second": 0.033, |
|
"eval_wer": 30.481593707691317, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 17.01, |
|
"learning_rate": 6.925000000000001e-06, |
|
"loss": 0.0052, |
|
"step": 225 |
|
}, |
|
{ |
|
"epoch": 19.01, |
|
"learning_rate": 6.300000000000001e-06, |
|
"loss": 0.0039, |
|
"step": 250 |
|
}, |
|
{ |
|
"epoch": 21.0, |
|
"learning_rate": 5.675000000000001e-06, |
|
"loss": 0.0033, |
|
"step": 275 |
|
}, |
|
{ |
|
"epoch": 23.0, |
|
"learning_rate": 5.050000000000001e-06, |
|
"loss": 0.0029, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 23.0, |
|
"eval_loss": 0.8154371380805969, |
|
"eval_runtime": 1039.7317, |
|
"eval_samples_per_second": 0.969, |
|
"eval_steps_per_second": 0.031, |
|
"eval_wer": 31.4744374959706, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 24.03, |
|
"learning_rate": 4.425e-06, |
|
"loss": 0.0024, |
|
"step": 325 |
|
}, |
|
{ |
|
"epoch": 26.02, |
|
"learning_rate": 3.8000000000000005e-06, |
|
"loss": 0.0023, |
|
"step": 350 |
|
}, |
|
{ |
|
"epoch": 28.02, |
|
"learning_rate": 3.175e-06, |
|
"loss": 0.0021, |
|
"step": 375 |
|
}, |
|
{ |
|
"epoch": 30.02, |
|
"learning_rate": 2.55e-06, |
|
"loss": 0.002, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 30.02, |
|
"eval_loss": 0.8319515585899353, |
|
"eval_runtime": 954.6491, |
|
"eval_samples_per_second": 1.056, |
|
"eval_steps_per_second": 0.034, |
|
"eval_wer": 31.377731932177166, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 32.02, |
|
"learning_rate": 1.925e-06, |
|
"loss": 0.0019, |
|
"step": 425 |
|
}, |
|
{ |
|
"epoch": 34.02, |
|
"learning_rate": 1.3e-06, |
|
"loss": 0.0018, |
|
"step": 450 |
|
}, |
|
{ |
|
"epoch": 36.01, |
|
"learning_rate": 6.750000000000001e-07, |
|
"loss": 0.0018, |
|
"step": 475 |
|
}, |
|
{ |
|
"epoch": 38.01, |
|
"learning_rate": 5.0000000000000004e-08, |
|
"loss": 0.0017, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 38.01, |
|
"eval_loss": 0.8372375965118408, |
|
"eval_runtime": 984.3922, |
|
"eval_samples_per_second": 1.024, |
|
"eval_steps_per_second": 0.033, |
|
"eval_wer": 31.516343240281092, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 38.01, |
|
"step": 500, |
|
"total_flos": 8.59869058793472e+18, |
|
"train_loss": 0.17904520658403636, |
|
"train_runtime": 15686.2181, |
|
"train_samples_per_second": 2.04, |
|
"train_steps_per_second": 0.032 |
|
} |
|
], |
|
"max_steps": 500, |
|
"num_train_epochs": 9223372036854775807, |
|
"total_flos": 8.59869058793472e+18, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|