| { | |
| "best_metric": 0.5588609576225281, | |
| "best_model_checkpoint": "/content/drive/MyDrive/Colab Notebooks/models/t5-small-codesearchnet-multilang-python-java-javascript-go/checkpoint-3750", | |
| "epoch": 15.0, | |
| "global_step": 5625, | |
| "is_hyper_param_search": false, | |
| "is_local_process_zero": true, | |
| "is_world_process_zero": true, | |
| "log_history": [ | |
| { | |
| "epoch": 1.0, | |
| "eval_avg_length": 16.436, | |
| "eval_bleu": 0.0028, | |
| "eval_loss": 0.7349299192428589, | |
| "eval_rouge1": 0.1562, | |
| "eval_rouge2": 0.0364, | |
| "eval_runtime": 171.828, | |
| "eval_samples_per_second": 29.099, | |
| "eval_steps_per_second": 3.637, | |
| "step": 375 | |
| }, | |
| { | |
| "epoch": 1.33, | |
| "learning_rate": 0.011613096110522747, | |
| "loss": 2.3117, | |
| "step": 500 | |
| }, | |
| { | |
| "epoch": 2.0, | |
| "eval_avg_length": 16.824, | |
| "eval_bleu": 0.0066, | |
| "eval_loss": 0.6613165736198425, | |
| "eval_rouge1": 0.1818, | |
| "eval_rouge2": 0.0531, | |
| "eval_runtime": 169.3563, | |
| "eval_samples_per_second": 29.524, | |
| "eval_steps_per_second": 3.69, | |
| "step": 750 | |
| }, | |
| { | |
| "epoch": 2.67, | |
| "learning_rate": 0.023271184414625168, | |
| "loss": 0.6755, | |
| "step": 1000 | |
| }, | |
| { | |
| "epoch": 3.0, | |
| "eval_avg_length": 16.931, | |
| "eval_bleu": 0.007, | |
| "eval_loss": 0.6232756972312927, | |
| "eval_rouge1": 0.1957, | |
| "eval_rouge2": 0.0594, | |
| "eval_runtime": 169.3476, | |
| "eval_samples_per_second": 29.525, | |
| "eval_steps_per_second": 3.691, | |
| "step": 1125 | |
| }, | |
| { | |
| "epoch": 4.0, | |
| "learning_rate": 0.03499825298786163, | |
| "loss": 0.5998, | |
| "step": 1500 | |
| }, | |
| { | |
| "epoch": 4.0, | |
| "eval_avg_length": 16.7154, | |
| "eval_bleu": 0.0082, | |
| "eval_loss": 0.6022565364837646, | |
| "eval_rouge1": 0.202, | |
| "eval_rouge2": 0.063, | |
| "eval_runtime": 165.1906, | |
| "eval_samples_per_second": 30.268, | |
| "eval_steps_per_second": 3.784, | |
| "step": 1500 | |
| }, | |
| { | |
| "epoch": 5.0, | |
| "eval_avg_length": 16.5468, | |
| "eval_bleu": 0.0096, | |
| "eval_loss": 0.5925326943397522, | |
| "eval_rouge1": 0.2154, | |
| "eval_rouge2": 0.0703, | |
| "eval_runtime": 162.8367, | |
| "eval_samples_per_second": 30.706, | |
| "eval_steps_per_second": 3.838, | |
| "step": 1875 | |
| }, | |
| { | |
| "epoch": 5.33, | |
| "learning_rate": 0.04682626947760582, | |
| "loss": 0.5511, | |
| "step": 2000 | |
| }, | |
| { | |
| "epoch": 6.0, | |
| "eval_avg_length": 15.7216, | |
| "eval_bleu": 0.0091, | |
| "eval_loss": 0.5728126168251038, | |
| "eval_rouge1": 0.2213, | |
| "eval_rouge2": 0.0774, | |
| "eval_runtime": 160.1137, | |
| "eval_samples_per_second": 31.228, | |
| "eval_steps_per_second": 3.903, | |
| "step": 2250 | |
| }, | |
| { | |
| "epoch": 6.67, | |
| "learning_rate": 0.05879075452685356, | |
| "loss": 0.5147, | |
| "step": 2500 | |
| }, | |
| { | |
| "epoch": 7.0, | |
| "eval_avg_length": 16.6658, | |
| "eval_bleu": 0.0111, | |
| "eval_loss": 0.5669918060302734, | |
| "eval_rouge1": 0.2311, | |
| "eval_rouge2": 0.0815, | |
| "eval_runtime": 160.5038, | |
| "eval_samples_per_second": 31.152, | |
| "eval_steps_per_second": 3.894, | |
| "step": 2625 | |
| }, | |
| { | |
| "epoch": 8.0, | |
| "learning_rate": 0.07094069570302963, | |
| "loss": 0.4861, | |
| "step": 3000 | |
| }, | |
| { | |
| "epoch": 8.0, | |
| "eval_avg_length": 17.038, | |
| "eval_bleu": 0.0089, | |
| "eval_loss": 0.5627844929695129, | |
| "eval_rouge1": 0.2217, | |
| "eval_rouge2": 0.077, | |
| "eval_runtime": 160.3931, | |
| "eval_samples_per_second": 31.173, | |
| "eval_steps_per_second": 3.897, | |
| "step": 3000 | |
| }, | |
| { | |
| "epoch": 9.0, | |
| "eval_avg_length": 16.362, | |
| "eval_bleu": 0.0103, | |
| "eval_loss": 0.5597769618034363, | |
| "eval_rouge1": 0.2311, | |
| "eval_rouge2": 0.0825, | |
| "eval_runtime": 159.243, | |
| "eval_samples_per_second": 31.399, | |
| "eval_steps_per_second": 3.925, | |
| "step": 3375 | |
| }, | |
| { | |
| "epoch": 9.33, | |
| "learning_rate": 0.08328617364168167, | |
| "loss": 0.4526, | |
| "step": 3500 | |
| }, | |
| { | |
| "epoch": 10.0, | |
| "eval_avg_length": 15.4298, | |
| "eval_bleu": 0.0083, | |
| "eval_loss": 0.5588609576225281, | |
| "eval_rouge1": 0.232, | |
| "eval_rouge2": 0.086, | |
| "eval_runtime": 160.7722, | |
| "eval_samples_per_second": 31.1, | |
| "eval_steps_per_second": 3.887, | |
| "step": 3750 | |
| }, | |
| { | |
| "epoch": 10.67, | |
| "learning_rate": 0.09589392691850662, | |
| "loss": 0.4329, | |
| "step": 4000 | |
| }, | |
| { | |
| "epoch": 11.0, | |
| "eval_avg_length": 16.5468, | |
| "eval_bleu": 0.0098, | |
| "eval_loss": 0.5649139285087585, | |
| "eval_rouge1": 0.2349, | |
| "eval_rouge2": 0.0839, | |
| "eval_runtime": 168.9129, | |
| "eval_samples_per_second": 29.601, | |
| "eval_steps_per_second": 3.7, | |
| "step": 4125 | |
| }, | |
| { | |
| "epoch": 12.0, | |
| "learning_rate": 0.10882016271352768, | |
| "loss": 0.4102, | |
| "step": 4500 | |
| }, | |
| { | |
| "epoch": 12.0, | |
| "eval_avg_length": 16.4136, | |
| "eval_bleu": 0.0098, | |
| "eval_loss": 0.5633437633514404, | |
| "eval_rouge1": 0.2366, | |
| "eval_rouge2": 0.0867, | |
| "eval_runtime": 166.1994, | |
| "eval_samples_per_second": 30.084, | |
| "eval_steps_per_second": 3.761, | |
| "step": 4500 | |
| }, | |
| { | |
| "epoch": 13.0, | |
| "eval_avg_length": 15.9864, | |
| "eval_bleu": 0.01, | |
| "eval_loss": 0.5841416120529175, | |
| "eval_rouge1": 0.2385, | |
| "eval_rouge2": 0.0869, | |
| "eval_runtime": 162.6882, | |
| "eval_samples_per_second": 30.734, | |
| "eval_steps_per_second": 3.842, | |
| "step": 4875 | |
| }, | |
| { | |
| "epoch": 13.33, | |
| "learning_rate": 0.12202449887990952, | |
| "loss": 0.3841, | |
| "step": 5000 | |
| }, | |
| { | |
| "epoch": 14.0, | |
| "eval_avg_length": 16.842, | |
| "eval_bleu": 0.0128, | |
| "eval_loss": 0.5776922106742859, | |
| "eval_rouge1": 0.2437, | |
| "eval_rouge2": 0.0894, | |
| "eval_runtime": 165.8581, | |
| "eval_samples_per_second": 30.146, | |
| "eval_steps_per_second": 3.768, | |
| "step": 5250 | |
| }, | |
| { | |
| "epoch": 14.67, | |
| "learning_rate": 0.13565437495708466, | |
| "loss": 0.3673, | |
| "step": 5500 | |
| }, | |
| { | |
| "epoch": 15.0, | |
| "eval_avg_length": 16.6192, | |
| "eval_bleu": 0.009, | |
| "eval_loss": 0.5955406427383423, | |
| "eval_rouge1": 0.2321, | |
| "eval_rouge2": 0.0831, | |
| "eval_runtime": 163.3821, | |
| "eval_samples_per_second": 30.603, | |
| "eval_steps_per_second": 3.825, | |
| "step": 5625 | |
| } | |
| ], | |
| "max_steps": 5625, | |
| "num_train_epochs": 15, | |
| "total_flos": 3.04519053312e+16, | |
| "trial_name": null, | |
| "trial_params": null | |
| } | |