{ "best_metric": 0.7449400424957275, "best_model_checkpoint": "/content/drive/MyDrive/Colab Notebooks/models/t5-small-codesearchnet-python/checkpoint-3750", "epoch": 14.0, "global_step": 5250, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "eval_avg_length": 14.1472, "eval_bleu": 0.0004, "eval_loss": 0.966545581817627, "eval_rouge1": 0.1696, "eval_rouge2": 0.0384, "eval_runtime": 148.9068, "eval_samples_per_second": 33.578, "eval_steps_per_second": 4.197, "step": 375 }, { "epoch": 1.33, "learning_rate": 0.011612925678491592, "loss": 2.0677, "step": 500 }, { "epoch": 2.0, "eval_avg_length": 13.38, "eval_bleu": 0.0004, "eval_loss": 0.8739555478096008, "eval_rouge1": 0.1758, "eval_rouge2": 0.0428, "eval_runtime": 148.3073, "eval_samples_per_second": 33.714, "eval_steps_per_second": 4.214, "step": 750 }, { "epoch": 2.67, "learning_rate": 0.02327043004333973, "loss": 0.8314, "step": 1000 }, { "epoch": 3.0, "eval_avg_length": 14.8026, "eval_bleu": 0.001, "eval_loss": 0.8281144499778748, "eval_rouge1": 0.1925, "eval_rouge2": 0.0505, "eval_runtime": 149.134, "eval_samples_per_second": 33.527, "eval_steps_per_second": 4.191, "step": 1125 }, { "epoch": 4.0, "learning_rate": 0.03499961644411087, "loss": 0.7563, "step": 1500 }, { "epoch": 4.0, "eval_avg_length": 14.9606, "eval_bleu": 0.0017, "eval_loss": 0.7996220588684082, "eval_rouge1": 0.2033, "eval_rouge2": 0.0582, "eval_runtime": 150.6141, "eval_samples_per_second": 33.197, "eval_steps_per_second": 4.15, "step": 1500 }, { "epoch": 5.0, "eval_avg_length": 14.9434, "eval_bleu": 0.0022, "eval_loss": 0.7780128121376038, "eval_rouge1": 0.2117, "eval_rouge2": 0.0607, "eval_runtime": 150.0628, "eval_samples_per_second": 33.319, "eval_steps_per_second": 4.165, "step": 1875 }, { "epoch": 5.33, "learning_rate": 0.04683296009898186, "loss": 0.6959, "step": 2000 }, { "epoch": 6.0, "eval_avg_length": 14.6926, "eval_bleu": 0.002, "eval_loss": 0.7587344646453857, "eval_rouge1": 0.2135, "eval_rouge2": 0.0621, "eval_runtime": 149.6348, "eval_samples_per_second": 33.415, "eval_steps_per_second": 4.177, "step": 2250 }, { "epoch": 6.67, "learning_rate": 0.058812398463487625, "loss": 0.6591, "step": 2500 }, { "epoch": 7.0, "eval_avg_length": 15.2818, "eval_bleu": 0.002, "eval_loss": 0.7544705271720886, "eval_rouge1": 0.2073, "eval_rouge2": 0.0605, "eval_runtime": 150.3492, "eval_samples_per_second": 33.256, "eval_steps_per_second": 4.157, "step": 2625 }, { "epoch": 8.0, "learning_rate": 0.07098705321550369, "loss": 0.6205, "step": 3000 }, { "epoch": 8.0, "eval_avg_length": 15.051, "eval_bleu": 0.0024, "eval_loss": 0.7471866011619568, "eval_rouge1": 0.2187, "eval_rouge2": 0.0674, "eval_runtime": 150.0125, "eval_samples_per_second": 33.331, "eval_steps_per_second": 4.166, "step": 3000 }, { "epoch": 9.0, "eval_avg_length": 15.6286, "eval_bleu": 0.0031, "eval_loss": 0.7505583763122559, "eval_rouge1": 0.2266, "eval_rouge2": 0.0696, "eval_runtime": 151.1802, "eval_samples_per_second": 33.073, "eval_steps_per_second": 4.134, "step": 3375 }, { "epoch": 9.33, "learning_rate": 0.08336292207241058, "loss": 0.5822, "step": 3500 }, { "epoch": 10.0, "eval_avg_length": 13.1462, "eval_bleu": 0.001, "eval_loss": 0.7449400424957275, "eval_rouge1": 0.206, "eval_rouge2": 0.063, "eval_runtime": 149.4965, "eval_samples_per_second": 33.446, "eval_steps_per_second": 4.181, "step": 3750 }, { "epoch": 10.67, "learning_rate": 0.09602057933807373, "loss": 0.5553, "step": 4000 }, { "epoch": 11.0, "eval_avg_length": 16.4076, "eval_bleu": 0.0027, "eval_loss": 0.7572856545448303, "eval_rouge1": 0.2148, "eval_rouge2": 0.0647, "eval_runtime": 151.0658, "eval_samples_per_second": 33.098, "eval_steps_per_second": 4.137, "step": 4125 }, { "epoch": 12.0, "learning_rate": 0.10902385413646698, "loss": 0.5295, "step": 4500 }, { "epoch": 12.0, "eval_avg_length": 15.8986, "eval_bleu": 0.0026, "eval_loss": 0.7677233219146729, "eval_rouge1": 0.2185, "eval_rouge2": 0.0658, "eval_runtime": 150.5334, "eval_samples_per_second": 33.215, "eval_steps_per_second": 4.152, "step": 4500 }, { "epoch": 13.0, "eval_avg_length": 12.3528, "eval_bleu": 0.0009, "eval_loss": 0.759487509727478, "eval_rouge1": 0.2052, "eval_rouge2": 0.0618, "eval_runtime": 147.275, "eval_samples_per_second": 33.95, "eval_steps_per_second": 4.244, "step": 4875 }, { "epoch": 13.33, "learning_rate": 0.12233853340148926, "loss": 0.4977, "step": 5000 }, { "epoch": 14.0, "eval_avg_length": 16.6706, "eval_bleu": 0.0035, "eval_loss": 0.7765543460845947, "eval_rouge1": 0.2177, "eval_rouge2": 0.0636, "eval_runtime": 151.0761, "eval_samples_per_second": 33.096, "eval_steps_per_second": 4.137, "step": 5250 } ], "max_steps": 5625, "num_train_epochs": 15, "total_flos": 2.842177830912e+16, "trial_name": null, "trial_params": null }