SodaXII's picture
Model save
0498682 verified
{
"best_metric": 0.2626972794532776,
"best_model_checkpoint": "./drive/Shareddrives/CS198-Drones/[v4] Training Output/vit-tiny-patch16-224_rice-leaf-disease-augmented-v4_fft/checkpoint-448",
"epoch": 15.0,
"eval_steps": 64,
"global_step": 1920,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.5,
"grad_norm": 9.17007064819336,
"learning_rate": 7.265625e-06,
"loss": 2.0564,
"step": 64
},
{
"epoch": 0.5,
"eval_accuracy": 0.4899328859060403,
"eval_loss": 1.4541155099868774,
"eval_runtime": 8.722,
"eval_samples_per_second": 34.167,
"eval_steps_per_second": 0.573,
"step": 64
},
{
"epoch": 1.0,
"grad_norm": 13.332218170166016,
"learning_rate": 1.4765625e-05,
"loss": 1.0767,
"step": 128
},
{
"epoch": 1.0,
"eval_accuracy": 0.7651006711409396,
"eval_loss": 0.6909474730491638,
"eval_runtime": 8.6475,
"eval_samples_per_second": 34.461,
"eval_steps_per_second": 0.578,
"step": 128
},
{
"epoch": 1.5,
"grad_norm": 9.764442443847656,
"learning_rate": 2.2265625e-05,
"loss": 0.4917,
"step": 192
},
{
"epoch": 1.5,
"eval_accuracy": 0.8322147651006712,
"eval_loss": 0.4307171106338501,
"eval_runtime": 8.6026,
"eval_samples_per_second": 34.641,
"eval_steps_per_second": 0.581,
"step": 192
},
{
"epoch": 2.0,
"grad_norm": 9.665606498718262,
"learning_rate": 2.9765625e-05,
"loss": 0.285,
"step": 256
},
{
"epoch": 2.0,
"eval_accuracy": 0.9026845637583892,
"eval_loss": 0.2932307720184326,
"eval_runtime": 7.7763,
"eval_samples_per_second": 38.322,
"eval_steps_per_second": 0.643,
"step": 256
},
{
"epoch": 2.5,
"grad_norm": 8.143477439880371,
"learning_rate": 2.9084596206825315e-05,
"loss": 0.0902,
"step": 320
},
{
"epoch": 2.5,
"eval_accuracy": 0.8993288590604027,
"eval_loss": 0.31344401836395264,
"eval_runtime": 7.522,
"eval_samples_per_second": 39.617,
"eval_steps_per_second": 0.665,
"step": 320
},
{
"epoch": 3.0,
"grad_norm": 2.6106486320495605,
"learning_rate": 2.633961484257573e-05,
"loss": 0.0588,
"step": 384
},
{
"epoch": 3.0,
"eval_accuracy": 0.9161073825503355,
"eval_loss": 0.3075862526893616,
"eval_runtime": 8.3334,
"eval_samples_per_second": 35.76,
"eval_steps_per_second": 0.6,
"step": 384
},
{
"epoch": 3.5,
"grad_norm": 1.9543571472167969,
"learning_rate": 2.212085192038453e-05,
"loss": 0.0155,
"step": 448
},
{
"epoch": 3.5,
"eval_accuracy": 0.9395973154362416,
"eval_loss": 0.2626972794532776,
"eval_runtime": 8.3127,
"eval_samples_per_second": 35.849,
"eval_steps_per_second": 0.601,
"step": 448
},
{
"epoch": 4.0,
"grad_norm": 0.38745102286338806,
"learning_rate": 1.6976609572058592e-05,
"loss": 0.0066,
"step": 512
},
{
"epoch": 4.0,
"eval_accuracy": 0.9295302013422819,
"eval_loss": 0.299156129360199,
"eval_runtime": 7.2879,
"eval_samples_per_second": 40.89,
"eval_steps_per_second": 0.686,
"step": 512
},
{
"epoch": 4.5,
"grad_norm": 0.10160534083843231,
"learning_rate": 1.1575472190259976e-05,
"loss": 0.0017,
"step": 576
},
{
"epoch": 4.5,
"eval_accuracy": 0.9228187919463087,
"eval_loss": 0.2935960590839386,
"eval_runtime": 8.4642,
"eval_samples_per_second": 35.207,
"eval_steps_per_second": 0.591,
"step": 576
},
{
"epoch": 5.0,
"grad_norm": 0.13512970507144928,
"learning_rate": 6.619412176671753e-06,
"loss": 0.0009,
"step": 640
},
{
"epoch": 5.0,
"eval_accuracy": 0.9228187919463087,
"eval_loss": 0.29606831073760986,
"eval_runtime": 8.1466,
"eval_samples_per_second": 36.58,
"eval_steps_per_second": 0.614,
"step": 640
},
{
"epoch": 5.5,
"grad_norm": 0.08882313966751099,
"learning_rate": 2.7525563336129812e-06,
"loss": 0.0006,
"step": 704
},
{
"epoch": 5.5,
"eval_accuracy": 0.9228187919463087,
"eval_loss": 0.30046388506889343,
"eval_runtime": 7.478,
"eval_samples_per_second": 39.85,
"eval_steps_per_second": 0.669,
"step": 704
},
{
"epoch": 6.0,
"grad_norm": 0.08427230268716812,
"learning_rate": 4.774703044353035e-07,
"loss": 0.0005,
"step": 768
},
{
"epoch": 6.0,
"eval_accuracy": 0.9228187919463087,
"eval_loss": 0.3003771901130676,
"eval_runtime": 8.3653,
"eval_samples_per_second": 35.623,
"eval_steps_per_second": 0.598,
"step": 768
},
{
"epoch": 6.5,
"grad_norm": 0.03683856502175331,
"learning_rate": 2.9910158634081504e-05,
"loss": 0.0005,
"step": 832
},
{
"epoch": 6.5,
"eval_accuracy": 0.9261744966442953,
"eval_loss": 0.2867479920387268,
"eval_runtime": 7.215,
"eval_samples_per_second": 41.303,
"eval_steps_per_second": 0.693,
"step": 832
},
{
"epoch": 7.0,
"grad_norm": 0.04806307703256607,
"learning_rate": 2.8359951312200077e-05,
"loss": 0.0004,
"step": 896
},
{
"epoch": 7.0,
"eval_accuracy": 0.9295302013422819,
"eval_loss": 0.2976870834827423,
"eval_runtime": 8.3401,
"eval_samples_per_second": 35.731,
"eval_steps_per_second": 0.6,
"step": 896
},
{
"epoch": 7.5,
"grad_norm": 0.033956822007894516,
"learning_rate": 2.5073384322705278e-05,
"loss": 0.0003,
"step": 960
},
{
"epoch": 7.5,
"eval_accuracy": 0.9295302013422819,
"eval_loss": 0.2943709194660187,
"eval_runtime": 7.6673,
"eval_samples_per_second": 38.867,
"eval_steps_per_second": 0.652,
"step": 960
},
{
"epoch": 8.0,
"grad_norm": 0.031262967735528946,
"learning_rate": 2.0477604608884026e-05,
"loss": 0.0002,
"step": 1024
},
{
"epoch": 8.0,
"eval_accuracy": 0.9295302013422819,
"eval_loss": 0.30740392208099365,
"eval_runtime": 8.2818,
"eval_samples_per_second": 35.982,
"eval_steps_per_second": 0.604,
"step": 1024
},
{
"epoch": 8.5,
"grad_norm": 0.01630540005862713,
"learning_rate": 1.516991423792483e-05,
"loss": 0.0002,
"step": 1088
},
{
"epoch": 8.5,
"eval_accuracy": 0.9328859060402684,
"eval_loss": 0.3053071200847626,
"eval_runtime": 8.2512,
"eval_samples_per_second": 36.116,
"eval_steps_per_second": 0.606,
"step": 1088
},
{
"epoch": 9.0,
"grad_norm": 0.016130153089761734,
"learning_rate": 9.840140535762432e-06,
"loss": 0.0002,
"step": 1152
},
{
"epoch": 9.0,
"eval_accuracy": 0.9295302013422819,
"eval_loss": 0.3097546696662903,
"eval_runtime": 8.418,
"eval_samples_per_second": 35.4,
"eval_steps_per_second": 0.594,
"step": 1152
},
{
"epoch": 9.5,
"grad_norm": 0.014978409744799137,
"learning_rate": 5.180980944002794e-06,
"loss": 0.0001,
"step": 1216
},
{
"epoch": 9.5,
"eval_accuracy": 0.9295302013422819,
"eval_loss": 0.310248464345932,
"eval_runtime": 7.2498,
"eval_samples_per_second": 41.105,
"eval_steps_per_second": 0.69,
"step": 1216
},
{
"epoch": 10.0,
"grad_norm": 0.013572459109127522,
"learning_rate": 1.7979748550475833e-06,
"loss": 0.0001,
"step": 1280
},
{
"epoch": 10.0,
"eval_accuracy": 0.9261744966442953,
"eval_loss": 0.3105408847332001,
"eval_runtime": 8.3297,
"eval_samples_per_second": 35.776,
"eval_steps_per_second": 0.6,
"step": 1280
},
{
"epoch": 10.5,
"grad_norm": 0.010590254329144955,
"learning_rate": 1.3080316225364152e-07,
"loss": 0.0001,
"step": 1344
},
{
"epoch": 10.5,
"eval_accuracy": 0.9261744966442953,
"eval_loss": 0.3105214238166809,
"eval_runtime": 7.2656,
"eval_samples_per_second": 41.015,
"eval_steps_per_second": 0.688,
"step": 1344
},
{
"epoch": 11.0,
"grad_norm": 0.011299003846943378,
"learning_rate": 2.9603855973006482e-05,
"loss": 0.0001,
"step": 1408
},
{
"epoch": 11.0,
"eval_accuracy": 0.9261744966442953,
"eval_loss": 0.32019779086112976,
"eval_runtime": 8.1649,
"eval_samples_per_second": 36.498,
"eval_steps_per_second": 0.612,
"step": 1408
},
{
"epoch": 11.5,
"grad_norm": 0.016378453001379967,
"learning_rate": 2.7440488243452587e-05,
"loss": 0.0001,
"step": 1472
},
{
"epoch": 11.5,
"eval_accuracy": 0.9295302013422819,
"eval_loss": 0.3183320462703705,
"eval_runtime": 8.0678,
"eval_samples_per_second": 36.937,
"eval_steps_per_second": 0.62,
"step": 1472
},
{
"epoch": 12.0,
"grad_norm": 0.007818573154509068,
"learning_rate": 2.3660261176123762e-05,
"loss": 0.0001,
"step": 1536
},
{
"epoch": 12.0,
"eval_accuracy": 0.9328859060402684,
"eval_loss": 0.3130977153778076,
"eval_runtime": 8.2508,
"eval_samples_per_second": 36.118,
"eval_steps_per_second": 0.606,
"step": 1536
},
{
"epoch": 12.5,
"grad_norm": 0.00784409698098898,
"learning_rate": 1.875448148769462e-05,
"loss": 0.0001,
"step": 1600
},
{
"epoch": 12.5,
"eval_accuracy": 0.9295302013422819,
"eval_loss": 0.3157329261302948,
"eval_runtime": 7.1968,
"eval_samples_per_second": 41.407,
"eval_steps_per_second": 0.695,
"step": 1600
},
{
"epoch": 13.0,
"grad_norm": 0.006332057528197765,
"learning_rate": 1.3360741171588585e-05,
"loss": 0.0001,
"step": 1664
},
{
"epoch": 13.0,
"eval_accuracy": 0.9228187919463087,
"eval_loss": 0.3237887918949127,
"eval_runtime": 8.2082,
"eval_samples_per_second": 36.305,
"eval_steps_per_second": 0.609,
"step": 1664
},
{
"epoch": 13.5,
"grad_norm": 0.006929404567927122,
"learning_rate": 8.180051251245103e-06,
"loss": 0.0001,
"step": 1728
},
{
"epoch": 13.5,
"eval_accuracy": 0.9228187919463087,
"eval_loss": 0.3219589591026306,
"eval_runtime": 7.2368,
"eval_samples_per_second": 41.179,
"eval_steps_per_second": 0.691,
"step": 1728
},
{
"epoch": 14.0,
"grad_norm": 0.005624026525765657,
"learning_rate": 3.885733119675617e-06,
"loss": 0.0001,
"step": 1792
},
{
"epoch": 14.0,
"eval_accuracy": 0.9228187919463087,
"eval_loss": 0.3266230821609497,
"eval_runtime": 7.1645,
"eval_samples_per_second": 41.594,
"eval_steps_per_second": 0.698,
"step": 1792
},
{
"epoch": 14.5,
"grad_norm": 0.006068665534257889,
"learning_rate": 1.0359086314671929e-06,
"loss": 0.0001,
"step": 1856
},
{
"epoch": 14.5,
"eval_accuracy": 0.9228187919463087,
"eval_loss": 0.32735249400138855,
"eval_runtime": 7.4237,
"eval_samples_per_second": 40.142,
"eval_steps_per_second": 0.674,
"step": 1856
},
{
"epoch": 15.0,
"grad_norm": 0.007146658841520548,
"learning_rate": 9.62392481628771e-10,
"loss": 0.0001,
"step": 1920
},
{
"epoch": 15.0,
"eval_accuracy": 0.9228187919463087,
"eval_loss": 0.32691627740859985,
"eval_runtime": 7.1631,
"eval_samples_per_second": 41.602,
"eval_steps_per_second": 0.698,
"step": 1920
},
{
"epoch": 15.0,
"step": 1920,
"total_flos": 6.132781352484864e+17,
"train_loss": 0.1362585227402936,
"train_runtime": 4195.4959,
"train_samples_per_second": 29.289,
"train_steps_per_second": 0.458
}
],
"logging_steps": 64,
"max_steps": 1920,
"num_input_tokens_seen": 0,
"num_train_epochs": 15,
"save_steps": 64,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": true
},
"attributes": {}
}
},
"total_flos": 6.132781352484864e+17,
"train_batch_size": 64,
"trial_name": null,
"trial_params": null
}