{ "best_metric": null, "best_model_checkpoint": null, "epoch": 0.9891196834817013, "global_step": 1000, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.1, "learning_rate": 1e-05, "loss": 1.012, "step": 100 }, { "epoch": 0.1, "eval_acc": 0.9251113585746102, "eval_f1 score": 0.9269220320565063, "eval_loss": 0.1983393132686615, "eval_precision": 0.8821096173733195, "eval_recall": 0.976531196336577, "eval_runtime": 29.7994, "eval_samples_per_second": 120.54, "eval_steps_per_second": 3.792, "step": 100 }, { "epoch": 0.2, "learning_rate": 2e-05, "loss": 0.0588, "step": 200 }, { "epoch": 0.2, "eval_acc": 0.9974944320712695, "eval_f1 score": 0.9974307736226092, "eval_loss": 0.008134149946272373, "eval_precision": 0.994874715261959, "eval_recall": 1.0, "eval_runtime": 29.7706, "eval_samples_per_second": 120.656, "eval_steps_per_second": 3.796, "step": 200 }, { "epoch": 0.3, "learning_rate": 3e-05, "loss": 0.0094, "step": 300 }, { "epoch": 0.3, "eval_acc": 0.9991648106904232, "eval_f1 score": 0.9991421218187019, "eval_loss": 0.0014619326684623957, "eval_precision": 0.9982857142857143, "eval_recall": 1.0, "eval_runtime": 29.7156, "eval_samples_per_second": 120.879, "eval_steps_per_second": 3.803, "step": 300 }, { "epoch": 0.4, "learning_rate": 4e-05, "loss": 0.003, "step": 400 }, { "epoch": 0.4, "eval_acc": 0.9991648106904232, "eval_f1 score": 0.9991411394217007, "eval_loss": 0.0031169140711426735, "eval_precision": 0.9994272623138603, "eval_recall": 0.9988551803091014, "eval_runtime": 29.7394, "eval_samples_per_second": 120.782, "eval_steps_per_second": 3.8, "step": 400 }, { "epoch": 0.49, "learning_rate": 5e-05, "loss": 0.0033, "step": 500 }, { "epoch": 0.49, "eval_acc": 0.998608017817372, "eval_f1 score": 0.9985710202915119, "eval_loss": 0.009261890314519405, "eval_precision": 0.9971461187214612, "eval_recall": 1.0, "eval_runtime": 29.7575, "eval_samples_per_second": 120.709, "eval_steps_per_second": 3.797, "step": 500 }, { "epoch": 0.59, "learning_rate": 4.021526418786693e-05, "loss": 0.0059, "step": 600 }, { "epoch": 0.59, "eval_acc": 0.9997216035634744, "eval_f1 score": 0.9997138769670958, "eval_loss": 0.002947951899841428, "eval_precision": 0.9994279176201373, "eval_recall": 1.0, "eval_runtime": 29.8118, "eval_samples_per_second": 120.489, "eval_steps_per_second": 3.79, "step": 600 }, { "epoch": 0.69, "learning_rate": 3.0430528375733857e-05, "loss": 0.0025, "step": 700 }, { "epoch": 0.69, "eval_acc": 1.0, "eval_f1 score": 1.0, "eval_loss": 0.00011875820928253233, "eval_precision": 1.0, "eval_recall": 1.0, "eval_runtime": 29.727, "eval_samples_per_second": 120.833, "eval_steps_per_second": 3.801, "step": 700 }, { "epoch": 0.79, "learning_rate": 2.064579256360078e-05, "loss": 0.0001, "step": 800 }, { "epoch": 0.79, "eval_acc": 0.9994432071269488, "eval_f1 score": 0.9994272623138604, "eval_loss": 0.0010784701444208622, "eval_precision": 1.0, "eval_recall": 0.9988551803091014, "eval_runtime": 29.689, "eval_samples_per_second": 120.987, "eval_steps_per_second": 3.806, "step": 800 }, { "epoch": 0.89, "learning_rate": 1.086105675146771e-05, "loss": 0.0042, "step": 900 }, { "epoch": 0.89, "eval_acc": 1.0, "eval_f1 score": 1.0, "eval_loss": 0.00021645698870997876, "eval_precision": 1.0, "eval_recall": 1.0, "eval_runtime": 29.7217, "eval_samples_per_second": 120.855, "eval_steps_per_second": 3.802, "step": 900 }, { "epoch": 0.99, "learning_rate": 1.076320939334638e-06, "loss": 0.0037, "step": 1000 }, { "epoch": 0.99, "eval_acc": 1.0, "eval_f1 score": 1.0, "eval_loss": 0.0003033815883100033, "eval_precision": 1.0, "eval_recall": 1.0, "eval_runtime": 29.7302, "eval_samples_per_second": 120.82, "eval_steps_per_second": 3.801, "step": 1000 } ], "max_steps": 1011, "num_train_epochs": 1, "total_flos": 4238956756992000.0, "trial_name": null, "trial_params": null }