|
{ |
|
"best_metric": 0.732569302631819, |
|
"best_model_checkpoint": "trained/hebban-reviews/bert-base-dutch-cased/checkpoint-3000", |
|
"epoch": 4.382997370727432, |
|
"global_step": 5001, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.44, |
|
"learning_rate": 4.5000999800039995e-05, |
|
"loss": 0.6824, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 0.44, |
|
"eval_accuracy": 0.7763806706114399, |
|
"eval_f1": 0.7835745137864604, |
|
"eval_loss": 0.602776288986206, |
|
"eval_precision": 0.8014359034966511, |
|
"eval_qwk": 0.6748032105430382, |
|
"eval_recall": 0.7763806706114399, |
|
"eval_runtime": 23.7871, |
|
"eval_samples_per_second": 682.05, |
|
"eval_steps_per_second": 5.339, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 0.88, |
|
"learning_rate": 4.000199960007999e-05, |
|
"loss": 0.5903, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 0.88, |
|
"eval_accuracy": 0.7441444773175543, |
|
"eval_f1": 0.7623993009582866, |
|
"eval_loss": 0.5676863789558411, |
|
"eval_precision": 0.8079269153410689, |
|
"eval_qwk": 0.6673976411458487, |
|
"eval_recall": 0.7441444773175543, |
|
"eval_runtime": 23.3353, |
|
"eval_samples_per_second": 695.257, |
|
"eval_steps_per_second": 5.442, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 1.31, |
|
"learning_rate": 3.50129974005199e-05, |
|
"loss": 0.487, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 1.31, |
|
"eval_accuracy": 0.7938239644970414, |
|
"eval_f1": 0.8033347539691899, |
|
"eval_loss": 0.5801703333854675, |
|
"eval_precision": 0.8206089090362688, |
|
"eval_qwk": 0.7239594229437711, |
|
"eval_recall": 0.7938239644970414, |
|
"eval_runtime": 23.5912, |
|
"eval_samples_per_second": 687.714, |
|
"eval_steps_per_second": 5.383, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 1.75, |
|
"learning_rate": 3.001399720055989e-05, |
|
"loss": 0.4465, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 1.75, |
|
"eval_accuracy": 0.7809418145956607, |
|
"eval_f1": 0.7939963208456309, |
|
"eval_loss": 0.5808519721031189, |
|
"eval_precision": 0.8222816466721266, |
|
"eval_qwk": 0.7118880899721043, |
|
"eval_recall": 0.7809418145956607, |
|
"eval_runtime": 23.7528, |
|
"eval_samples_per_second": 683.034, |
|
"eval_steps_per_second": 5.347, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 2.19, |
|
"learning_rate": 2.501499700059988e-05, |
|
"loss": 0.3808, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 2.19, |
|
"eval_accuracy": 0.8011587771203156, |
|
"eval_f1": 0.8108361051205994, |
|
"eval_loss": 0.7650117874145508, |
|
"eval_precision": 0.8317278803823261, |
|
"eval_qwk": 0.7224991347098964, |
|
"eval_recall": 0.8011587771203156, |
|
"eval_runtime": 23.668, |
|
"eval_samples_per_second": 685.482, |
|
"eval_steps_per_second": 5.366, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 2.63, |
|
"learning_rate": 2.001599680063987e-05, |
|
"loss": 0.2909, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 2.63, |
|
"eval_accuracy": 0.8086168639053254, |
|
"eval_f1": 0.8166494576368075, |
|
"eval_loss": 0.7910537719726562, |
|
"eval_precision": 0.8320947395056137, |
|
"eval_qwk": 0.732569302631819, |
|
"eval_recall": 0.8086168639053254, |
|
"eval_runtime": 23.5554, |
|
"eval_samples_per_second": 688.761, |
|
"eval_steps_per_second": 5.392, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 3.07, |
|
"learning_rate": 1.5026994601079786e-05, |
|
"loss": 0.2746, |
|
"step": 3500 |
|
}, |
|
{ |
|
"epoch": 3.07, |
|
"eval_accuracy": 0.7985083826429981, |
|
"eval_f1": 0.8084609549617363, |
|
"eval_loss": 0.9503954648971558, |
|
"eval_precision": 0.8285545185236465, |
|
"eval_qwk": 0.7236034727222331, |
|
"eval_recall": 0.7985083826429981, |
|
"eval_runtime": 23.5785, |
|
"eval_samples_per_second": 688.084, |
|
"eval_steps_per_second": 5.386, |
|
"step": 3500 |
|
}, |
|
{ |
|
"epoch": 3.51, |
|
"learning_rate": 1.0027994401119777e-05, |
|
"loss": 0.1939, |
|
"step": 4000 |
|
}, |
|
{ |
|
"epoch": 3.51, |
|
"eval_accuracy": 0.7966592702169625, |
|
"eval_f1": 0.8064656300991808, |
|
"eval_loss": 0.9597578048706055, |
|
"eval_precision": 0.8249666716932728, |
|
"eval_qwk": 0.7250412688400546, |
|
"eval_recall": 0.7966592702169625, |
|
"eval_runtime": 23.6525, |
|
"eval_samples_per_second": 685.931, |
|
"eval_steps_per_second": 5.369, |
|
"step": 4000 |
|
}, |
|
{ |
|
"epoch": 3.94, |
|
"learning_rate": 5.028994201159768e-06, |
|
"loss": 0.1824, |
|
"step": 4500 |
|
}, |
|
{ |
|
"epoch": 3.94, |
|
"eval_accuracy": 0.8023298816568047, |
|
"eval_f1": 0.810968480495596, |
|
"eval_loss": 1.060992956161499, |
|
"eval_precision": 0.8277405554545381, |
|
"eval_qwk": 0.7252407399333649, |
|
"eval_recall": 0.8023298816568047, |
|
"eval_runtime": 23.7166, |
|
"eval_samples_per_second": 684.077, |
|
"eval_steps_per_second": 5.355, |
|
"step": 4500 |
|
}, |
|
{ |
|
"epoch": 4.38, |
|
"learning_rate": 2.999400119976005e-08, |
|
"loss": 0.1426, |
|
"step": 5000 |
|
}, |
|
{ |
|
"epoch": 4.38, |
|
"eval_accuracy": 0.8090483234714004, |
|
"eval_f1": 0.8157426407187547, |
|
"eval_loss": 1.1207919120788574, |
|
"eval_precision": 0.8273912560003507, |
|
"eval_qwk": 0.7316045159099166, |
|
"eval_recall": 0.8090483234714004, |
|
"eval_runtime": 23.6323, |
|
"eval_samples_per_second": 686.518, |
|
"eval_steps_per_second": 5.374, |
|
"step": 5000 |
|
}, |
|
{ |
|
"epoch": 4.38, |
|
"step": 5001, |
|
"total_flos": 1.6838837781764506e+17, |
|
"train_loss": 0.3670836862052257, |
|
"train_runtime": 2628.6927, |
|
"train_samples_per_second": 243.516, |
|
"train_steps_per_second": 1.902 |
|
} |
|
], |
|
"max_steps": 5001, |
|
"num_train_epochs": 5, |
|
"total_flos": 1.6838837781764506e+17, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|