whisper-large-v2-hi-v2 / trainer_state.json
anuragshas's picture
End of training
88bc0e7
raw
history blame
2.76 kB
{
"best_metric": 12.457650398315174,
"best_model_checkpoint": "./checkpoint-300",
"epoch": 1.1027522935779817,
"global_step": 300,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.09,
"learning_rate": 2.3000000000000004e-06,
"loss": 0.5068,
"step": 25
},
{
"epoch": 0.18,
"learning_rate": 4.800000000000001e-06,
"loss": 0.2745,
"step": 50
},
{
"epoch": 0.28,
"learning_rate": 7.3e-06,
"loss": 0.2341,
"step": 75
},
{
"epoch": 0.37,
"learning_rate": 9.800000000000001e-06,
"loss": 0.2097,
"step": 100
},
{
"epoch": 0.37,
"eval_loss": 0.26155176758766174,
"eval_runtime": 6495.4175,
"eval_samples_per_second": 0.446,
"eval_steps_per_second": 0.056,
"eval_wer": 17.6700851570369,
"step": 100
},
{
"epoch": 0.46,
"learning_rate": 8.85e-06,
"loss": 0.2161,
"step": 125
},
{
"epoch": 0.55,
"learning_rate": 7.600000000000001e-06,
"loss": 0.2043,
"step": 150
},
{
"epoch": 0.64,
"learning_rate": 6.35e-06,
"loss": 0.1803,
"step": 175
},
{
"epoch": 0.73,
"learning_rate": 5.150000000000001e-06,
"loss": 0.1578,
"step": 200
},
{
"epoch": 0.73,
"eval_loss": 0.21081551909446716,
"eval_runtime": 6471.6616,
"eval_samples_per_second": 0.447,
"eval_steps_per_second": 0.056,
"eval_wer": 14.098983609559564,
"step": 200
},
{
"epoch": 0.83,
"learning_rate": 3.900000000000001e-06,
"loss": 0.1696,
"step": 225
},
{
"epoch": 0.92,
"learning_rate": 2.6500000000000005e-06,
"loss": 0.144,
"step": 250
},
{
"epoch": 1.01,
"learning_rate": 1.4000000000000001e-06,
"loss": 0.1274,
"step": 275
},
{
"epoch": 1.1,
"learning_rate": 1.5000000000000002e-07,
"loss": 0.0806,
"step": 300
},
{
"epoch": 1.1,
"eval_loss": 0.18695282936096191,
"eval_runtime": 6462.2032,
"eval_samples_per_second": 0.448,
"eval_steps_per_second": 0.056,
"eval_wer": 12.457650398315174,
"step": 300
},
{
"epoch": 1.1,
"step": 300,
"total_flos": 1.02039599259648e+19,
"train_loss": 0.20877531051635742,
"train_runtime": 20970.8306,
"train_samples_per_second": 0.229,
"train_steps_per_second": 0.014
}
],
"max_steps": 300,
"num_train_epochs": 2,
"total_flos": 1.02039599259648e+19,
"trial_name": null,
"trial_params": null
}