|
{ |
|
"best_metric": 0.9389400921658986, |
|
"best_model_checkpoint": "vit-base-patch16-224-in21k-finetuned-gecko/checkpoint-105", |
|
"epoch": 4.827586206896552, |
|
"eval_steps": 500, |
|
"global_step": 105, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.46, |
|
"learning_rate": 0.00045238095238095237, |
|
"loss": 4.0904, |
|
"step": 10 |
|
}, |
|
{ |
|
"epoch": 0.92, |
|
"learning_rate": 0.0004047619047619048, |
|
"loss": 3.4758, |
|
"step": 20 |
|
}, |
|
{ |
|
"epoch": 0.97, |
|
"eval_accuracy": 0.565668202764977, |
|
"eval_loss": 3.0532968044281006, |
|
"eval_runtime": 99.5572, |
|
"eval_samples_per_second": 8.719, |
|
"eval_steps_per_second": 0.281, |
|
"step": 21 |
|
}, |
|
{ |
|
"epoch": 1.38, |
|
"learning_rate": 0.00035714285714285714, |
|
"loss": 2.9086, |
|
"step": 30 |
|
}, |
|
{ |
|
"epoch": 1.84, |
|
"learning_rate": 0.00030952380952380956, |
|
"loss": 2.4494, |
|
"step": 40 |
|
}, |
|
{ |
|
"epoch": 1.98, |
|
"eval_accuracy": 0.8191244239631337, |
|
"eval_loss": 2.0081708431243896, |
|
"eval_runtime": 96.1487, |
|
"eval_samples_per_second": 9.028, |
|
"eval_steps_per_second": 0.291, |
|
"step": 43 |
|
}, |
|
{ |
|
"epoch": 2.3, |
|
"learning_rate": 0.0002619047619047619, |
|
"loss": 2.0186, |
|
"step": 50 |
|
}, |
|
{ |
|
"epoch": 2.76, |
|
"learning_rate": 0.00021428571428571427, |
|
"loss": 1.6937, |
|
"step": 60 |
|
}, |
|
{ |
|
"epoch": 2.99, |
|
"eval_accuracy": 0.880184331797235, |
|
"eval_loss": 1.426762342453003, |
|
"eval_runtime": 98.7923, |
|
"eval_samples_per_second": 8.786, |
|
"eval_steps_per_second": 0.283, |
|
"step": 65 |
|
}, |
|
{ |
|
"epoch": 3.22, |
|
"learning_rate": 0.00016666666666666666, |
|
"loss": 1.4682, |
|
"step": 70 |
|
}, |
|
{ |
|
"epoch": 3.68, |
|
"learning_rate": 0.00011904761904761905, |
|
"loss": 1.3144, |
|
"step": 80 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_accuracy": 0.9182027649769585, |
|
"eval_loss": 1.1381995677947998, |
|
"eval_runtime": 104.0783, |
|
"eval_samples_per_second": 8.34, |
|
"eval_steps_per_second": 0.269, |
|
"step": 87 |
|
}, |
|
{ |
|
"epoch": 4.14, |
|
"learning_rate": 7.142857142857142e-05, |
|
"loss": 1.1998, |
|
"step": 90 |
|
}, |
|
{ |
|
"epoch": 4.6, |
|
"learning_rate": 2.380952380952381e-05, |
|
"loss": 1.1068, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 4.83, |
|
"eval_accuracy": 0.9389400921658986, |
|
"eval_loss": 1.0130665302276611, |
|
"eval_runtime": 98.1827, |
|
"eval_samples_per_second": 8.841, |
|
"eval_steps_per_second": 0.285, |
|
"step": 105 |
|
}, |
|
{ |
|
"epoch": 4.83, |
|
"step": 105, |
|
"total_flos": 1.0346740581105009e+18, |
|
"train_loss": 2.118878391810826, |
|
"train_runtime": 1863.9077, |
|
"train_samples_per_second": 7.404, |
|
"train_steps_per_second": 0.056 |
|
} |
|
], |
|
"logging_steps": 10, |
|
"max_steps": 105, |
|
"num_train_epochs": 5, |
|
"save_steps": 500, |
|
"total_flos": 1.0346740581105009e+18, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|