PaulTran's picture
Upload 12 files
187dea8
{
"best_metric": 0.8468692367302207,
"best_model_checkpoint": "PhoBertPunc\\checkpoint-5746",
"epoch": 13.0,
"global_step": 5746,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"learning_rate": 1.9002262443438914e-05,
"loss": 0.3702,
"step": 441
},
{
"epoch": 1.0,
"eval_accuracy": 0.6371049949031601,
"eval_f1": 0.7381062355658198,
"eval_loss": 0.285582959651947,
"eval_roc_auc": 0.8207916729455642,
"eval_runtime": 9.0929,
"eval_samples_per_second": 107.886,
"eval_steps_per_second": 5.499,
"step": 442
},
{
"epoch": 2.0,
"learning_rate": 1.800452488687783e-05,
"loss": 0.2734,
"step": 882
},
{
"epoch": 2.0,
"eval_accuracy": 0.6605504587155964,
"eval_f1": 0.7523277467411547,
"eval_loss": 0.26946958899497986,
"eval_roc_auc": 0.828197000778661,
"eval_runtime": 7.7509,
"eval_samples_per_second": 126.566,
"eval_steps_per_second": 6.451,
"step": 884
},
{
"epoch": 2.99,
"learning_rate": 1.7006787330316743e-05,
"loss": 0.2267,
"step": 1323
},
{
"epoch": 3.0,
"eval_accuracy": 0.6595310907237513,
"eval_f1": 0.7564625850340136,
"eval_loss": 0.27753132581710815,
"eval_roc_auc": 0.8355058707497308,
"eval_runtime": 7.6581,
"eval_samples_per_second": 128.1,
"eval_steps_per_second": 6.529,
"step": 1326
},
{
"epoch": 3.99,
"learning_rate": 1.600904977375566e-05,
"loss": 0.1876,
"step": 1764
},
{
"epoch": 4.0,
"eval_accuracy": 0.6371049949031601,
"eval_f1": 0.763459841129744,
"eval_loss": 0.29114222526550293,
"eval_roc_auc": 0.8451443088928317,
"eval_runtime": 7.891,
"eval_samples_per_second": 124.318,
"eval_steps_per_second": 6.336,
"step": 1768
},
{
"epoch": 4.99,
"learning_rate": 1.5011312217194571e-05,
"loss": 0.1572,
"step": 2205
},
{
"epoch": 5.0,
"eval_accuracy": 0.6371049949031601,
"eval_f1": 0.7529827662395051,
"eval_loss": 0.31292596459388733,
"eval_roc_auc": 0.8381052176821842,
"eval_runtime": 7.5397,
"eval_samples_per_second": 130.111,
"eval_steps_per_second": 6.632,
"step": 2210
},
{
"epoch": 5.99,
"learning_rate": 1.4013574660633484e-05,
"loss": 0.1312,
"step": 2646
},
{
"epoch": 6.0,
"eval_accuracy": 0.6167176350662589,
"eval_f1": 0.7478632478632479,
"eval_loss": 0.3474615812301636,
"eval_roc_auc": 0.8410431585366024,
"eval_runtime": 8.8902,
"eval_samples_per_second": 110.346,
"eval_steps_per_second": 5.624,
"step": 2652
},
{
"epoch": 6.98,
"learning_rate": 1.30158371040724e-05,
"loss": 0.1048,
"step": 3087
},
{
"epoch": 7.0,
"eval_accuracy": 0.6187563710499491,
"eval_f1": 0.7460869565217391,
"eval_loss": 0.3677310347557068,
"eval_roc_auc": 0.8366267414318126,
"eval_runtime": 7.6489,
"eval_samples_per_second": 128.254,
"eval_steps_per_second": 6.537,
"step": 3094
},
{
"epoch": 7.98,
"learning_rate": 1.2018099547511313e-05,
"loss": 0.0844,
"step": 3528
},
{
"epoch": 8.0,
"eval_accuracy": 0.6034658511722731,
"eval_f1": 0.7418244406196213,
"eval_loss": 0.39172324538230896,
"eval_roc_auc": 0.835729578342679,
"eval_runtime": 7.4868,
"eval_samples_per_second": 131.031,
"eval_steps_per_second": 6.678,
"step": 3536
},
{
"epoch": 8.98,
"learning_rate": 1.1020361990950229e-05,
"loss": 0.0698,
"step": 3969
},
{
"epoch": 9.0,
"eval_accuracy": 0.6106014271151886,
"eval_f1": 0.7507481829841812,
"eval_loss": 0.42587536573410034,
"eval_roc_auc": 0.842892186936503,
"eval_runtime": 7.5353,
"eval_samples_per_second": 130.188,
"eval_steps_per_second": 6.635,
"step": 3978
},
{
"epoch": 9.98,
"learning_rate": 1.0022624434389141e-05,
"loss": 0.054,
"step": 4410
},
{
"epoch": 10.0,
"eval_accuracy": 0.5953109072375128,
"eval_f1": 0.7450317124735729,
"eval_loss": 0.4620385468006134,
"eval_roc_auc": 0.8411574616862839,
"eval_runtime": 7.8298,
"eval_samples_per_second": 125.29,
"eval_steps_per_second": 6.386,
"step": 4420
},
{
"epoch": 10.98,
"learning_rate": 9.024886877828056e-06,
"loss": 0.0451,
"step": 4851
},
{
"epoch": 11.0,
"eval_accuracy": 0.6330275229357798,
"eval_f1": 0.7534965034965035,
"eval_loss": 0.45941799879074097,
"eval_roc_auc": 0.8405079165428382,
"eval_runtime": 7.6958,
"eval_samples_per_second": 127.473,
"eval_steps_per_second": 6.497,
"step": 4862
},
{
"epoch": 11.97,
"learning_rate": 8.02714932126697e-06,
"loss": 0.0366,
"step": 5292
},
{
"epoch": 12.0,
"eval_accuracy": 0.5891946992864424,
"eval_f1": 0.7466777408637875,
"eval_loss": 0.5142910480499268,
"eval_roc_auc": 0.8457477828688038,
"eval_runtime": 7.657,
"eval_samples_per_second": 128.118,
"eval_steps_per_second": 6.53,
"step": 5304
},
{
"epoch": 12.97,
"learning_rate": 7.029411764705882e-06,
"loss": 0.0288,
"step": 5733
},
{
"epoch": 13.0,
"eval_accuracy": 0.601427115188583,
"eval_f1": 0.751892346509672,
"eval_loss": 0.5171791315078735,
"eval_roc_auc": 0.8468692367302207,
"eval_runtime": 7.4917,
"eval_samples_per_second": 130.944,
"eval_steps_per_second": 6.674,
"step": 5746
}
],
"max_steps": 8840,
"num_train_epochs": 20,
"total_flos": 1.5096534982943232e+16,
"trial_name": null,
"trial_params": null
}