{ "best_metric": 0.9590163934426229, "best_model_checkpoint": "./vit-LungCancerViT/checkpoint-350", "epoch": 20.0, "global_step": 700, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.29, "learning_rate": 2.857142857142857e-05, "loss": 1.3951, "step": 10 }, { "epoch": 0.57, "learning_rate": 5.714285714285714e-05, "loss": 0.9527, "step": 20 }, { "epoch": 0.86, "learning_rate": 8.571428571428571e-05, "loss": 0.7463, "step": 30 }, { "epoch": 1.0, "eval_accuracy": 0.7213114754098361, "eval_loss": 0.7026457190513611, "eval_runtime": 52.9268, "eval_samples_per_second": 2.305, "eval_steps_per_second": 0.302, "step": 35 }, { "epoch": 1.14, "learning_rate": 0.00011428571428571428, "loss": 0.5309, "step": 40 }, { "epoch": 1.43, "learning_rate": 0.00014285714285714287, "loss": 0.4553, "step": 50 }, { "epoch": 1.71, "learning_rate": 0.00017142857142857143, "loss": 0.3735, "step": 60 }, { "epoch": 2.0, "learning_rate": 0.0002, "loss": 0.2276, "step": 70 }, { "epoch": 2.0, "eval_accuracy": 0.8360655737704918, "eval_loss": 0.3694429099559784, "eval_runtime": 1.4376, "eval_samples_per_second": 84.864, "eval_steps_per_second": 11.13, "step": 70 }, { "epoch": 2.29, "learning_rate": 0.00019682539682539682, "loss": 0.321, "step": 80 }, { "epoch": 2.57, "learning_rate": 0.00019365079365079365, "loss": 0.1708, "step": 90 }, { "epoch": 2.86, "learning_rate": 0.00019047619047619048, "loss": 0.3134, "step": 100 }, { "epoch": 3.0, "eval_accuracy": 0.860655737704918, "eval_loss": 0.3415001332759857, "eval_runtime": 1.2015, "eval_samples_per_second": 101.542, "eval_steps_per_second": 13.317, "step": 105 }, { "epoch": 3.14, "learning_rate": 0.00018730158730158731, "loss": 0.1296, "step": 110 }, { "epoch": 3.43, "learning_rate": 0.00018412698412698412, "loss": 0.1161, "step": 120 }, { "epoch": 3.71, "learning_rate": 0.00018095238095238095, "loss": 0.0696, "step": 130 }, { "epoch": 4.0, "learning_rate": 0.00017777777777777779, "loss": 0.1487, "step": 140 }, { "epoch": 4.0, "eval_accuracy": 0.860655737704918, "eval_loss": 0.4990597069263458, "eval_runtime": 1.1086, "eval_samples_per_second": 110.045, "eval_steps_per_second": 14.432, "step": 140 }, { "epoch": 4.29, "learning_rate": 0.00017460317460317462, "loss": 0.0783, "step": 150 }, { "epoch": 4.57, "learning_rate": 0.00017142857142857143, "loss": 0.1082, "step": 160 }, { "epoch": 4.86, "learning_rate": 0.00016825396825396826, "loss": 0.0301, "step": 170 }, { "epoch": 5.0, "eval_accuracy": 0.8934426229508197, "eval_loss": 0.2610397934913635, "eval_runtime": 1.1421, "eval_samples_per_second": 106.821, "eval_steps_per_second": 14.009, "step": 175 }, { "epoch": 5.14, "learning_rate": 0.0001650793650793651, "loss": 0.0994, "step": 180 }, { "epoch": 5.43, "learning_rate": 0.00016190476190476192, "loss": 0.1404, "step": 190 }, { "epoch": 5.71, "learning_rate": 0.00015873015873015873, "loss": 0.0216, "step": 200 }, { "epoch": 6.0, "learning_rate": 0.00015555555555555556, "loss": 0.0567, "step": 210 }, { "epoch": 6.0, "eval_accuracy": 0.9098360655737705, "eval_loss": 0.2997801601886749, "eval_runtime": 1.3611, "eval_samples_per_second": 89.633, "eval_steps_per_second": 11.755, "step": 210 }, { "epoch": 6.29, "learning_rate": 0.00015238095238095237, "loss": 0.0529, "step": 220 }, { "epoch": 6.57, "learning_rate": 0.00014920634920634923, "loss": 0.0305, "step": 230 }, { "epoch": 6.86, "learning_rate": 0.00014603174603174603, "loss": 0.0084, "step": 240 }, { "epoch": 7.0, "eval_accuracy": 0.9016393442622951, "eval_loss": 0.4632587730884552, "eval_runtime": 1.1837, "eval_samples_per_second": 103.068, "eval_steps_per_second": 13.517, "step": 245 }, { "epoch": 7.14, "learning_rate": 0.00014285714285714287, "loss": 0.0174, "step": 250 }, { "epoch": 7.43, "learning_rate": 0.00013968253968253967, "loss": 0.0027, "step": 260 }, { "epoch": 7.71, "learning_rate": 0.0001365079365079365, "loss": 0.0245, "step": 270 }, { "epoch": 8.0, "learning_rate": 0.00013333333333333334, "loss": 0.0071, "step": 280 }, { "epoch": 8.0, "eval_accuracy": 0.9508196721311475, "eval_loss": 0.21911580860614777, "eval_runtime": 1.1253, "eval_samples_per_second": 108.412, "eval_steps_per_second": 14.218, "step": 280 }, { "epoch": 8.29, "learning_rate": 0.00013015873015873017, "loss": 0.0169, "step": 290 }, { "epoch": 8.57, "learning_rate": 0.00012698412698412698, "loss": 0.014, "step": 300 }, { "epoch": 8.86, "learning_rate": 0.0001238095238095238, "loss": 0.0231, "step": 310 }, { "epoch": 9.0, "eval_accuracy": 0.9344262295081968, "eval_loss": 0.3097061216831207, "eval_runtime": 1.1316, "eval_samples_per_second": 107.81, "eval_steps_per_second": 14.139, "step": 315 }, { "epoch": 9.14, "learning_rate": 0.00012063492063492063, "loss": 0.0003, "step": 320 }, { "epoch": 9.43, "learning_rate": 0.00011746031746031746, "loss": 0.0195, "step": 330 }, { "epoch": 9.71, "learning_rate": 0.00011428571428571428, "loss": 0.0062, "step": 340 }, { "epoch": 10.0, "learning_rate": 0.00011111111111111112, "loss": 0.0003, "step": 350 }, { "epoch": 10.0, "eval_accuracy": 0.9590163934426229, "eval_loss": 0.2627410292625427, "eval_runtime": 1.345, "eval_samples_per_second": 90.707, "eval_steps_per_second": 11.896, "step": 350 }, { "epoch": 10.29, "learning_rate": 0.00010793650793650794, "loss": 0.0004, "step": 360 }, { "epoch": 10.57, "learning_rate": 0.00010476190476190477, "loss": 0.003, "step": 370 }, { "epoch": 10.86, "learning_rate": 0.00010158730158730159, "loss": 0.0002, "step": 380 }, { "epoch": 11.0, "eval_accuracy": 0.9508196721311475, "eval_loss": 0.284305602312088, "eval_runtime": 1.3379, "eval_samples_per_second": 91.19, "eval_steps_per_second": 11.959, "step": 385 }, { "epoch": 11.14, "learning_rate": 9.841269841269841e-05, "loss": 0.0051, "step": 390 }, { "epoch": 11.43, "learning_rate": 9.523809523809524e-05, "loss": 0.0001, "step": 400 }, { "epoch": 11.71, "learning_rate": 9.206349206349206e-05, "loss": 0.0016, "step": 410 }, { "epoch": 12.0, "learning_rate": 8.888888888888889e-05, "loss": 0.005, "step": 420 }, { "epoch": 12.0, "eval_accuracy": 0.9508196721311475, "eval_loss": 0.28199827671051025, "eval_runtime": 1.1031, "eval_samples_per_second": 110.597, "eval_steps_per_second": 14.505, "step": 420 }, { "epoch": 12.29, "learning_rate": 8.571428571428571e-05, "loss": 0.0001, "step": 430 }, { "epoch": 12.57, "learning_rate": 8.253968253968255e-05, "loss": 0.0001, "step": 440 }, { "epoch": 12.86, "learning_rate": 7.936507936507937e-05, "loss": 0.0054, "step": 450 }, { "epoch": 13.0, "eval_accuracy": 0.9508196721311475, "eval_loss": 0.2708677649497986, "eval_runtime": 1.117, "eval_samples_per_second": 109.217, "eval_steps_per_second": 14.324, "step": 455 }, { "epoch": 13.14, "learning_rate": 7.619047619047618e-05, "loss": 0.0001, "step": 460 }, { "epoch": 13.43, "learning_rate": 7.301587301587302e-05, "loss": 0.0001, "step": 470 }, { "epoch": 13.71, "learning_rate": 6.984126984126984e-05, "loss": 0.0027, "step": 480 }, { "epoch": 14.0, "learning_rate": 6.666666666666667e-05, "loss": 0.0026, "step": 490 }, { "epoch": 14.0, "eval_accuracy": 0.9508196721311475, "eval_loss": 0.2664688229560852, "eval_runtime": 1.2394, "eval_samples_per_second": 98.438, "eval_steps_per_second": 12.91, "step": 490 }, { "epoch": 14.29, "learning_rate": 6.349206349206349e-05, "loss": 0.0023, "step": 500 }, { "epoch": 14.57, "learning_rate": 6.0317460317460316e-05, "loss": 0.0038, "step": 510 }, { "epoch": 14.86, "learning_rate": 5.714285714285714e-05, "loss": 0.0001, "step": 520 }, { "epoch": 15.0, "eval_accuracy": 0.9590163934426229, "eval_loss": 0.2634933888912201, "eval_runtime": 1.3242, "eval_samples_per_second": 92.133, "eval_steps_per_second": 12.083, "step": 525 }, { "epoch": 15.14, "learning_rate": 5.396825396825397e-05, "loss": 0.0023, "step": 530 }, { "epoch": 15.43, "learning_rate": 5.0793650793650794e-05, "loss": 0.0028, "step": 540 }, { "epoch": 15.71, "learning_rate": 4.761904761904762e-05, "loss": 0.0001, "step": 550 }, { "epoch": 16.0, "learning_rate": 4.4444444444444447e-05, "loss": 0.0001, "step": 560 }, { "epoch": 16.0, "eval_accuracy": 0.9590163934426229, "eval_loss": 0.26172590255737305, "eval_runtime": 1.134, "eval_samples_per_second": 107.579, "eval_steps_per_second": 14.109, "step": 560 }, { "epoch": 16.29, "learning_rate": 4.126984126984127e-05, "loss": 0.0025, "step": 570 }, { "epoch": 16.57, "learning_rate": 3.809523809523809e-05, "loss": 0.0026, "step": 580 }, { "epoch": 16.86, "learning_rate": 3.492063492063492e-05, "loss": 0.0001, "step": 590 }, { "epoch": 17.0, "eval_accuracy": 0.9590163934426229, "eval_loss": 0.26094985008239746, "eval_runtime": 1.1056, "eval_samples_per_second": 110.343, "eval_steps_per_second": 14.471, "step": 595 }, { "epoch": 17.14, "learning_rate": 3.1746031746031745e-05, "loss": 0.0001, "step": 600 }, { "epoch": 17.43, "learning_rate": 2.857142857142857e-05, "loss": 0.0025, "step": 610 }, { "epoch": 17.71, "learning_rate": 2.5396825396825397e-05, "loss": 0.0001, "step": 620 }, { "epoch": 18.0, "learning_rate": 2.2222222222222223e-05, "loss": 0.0026, "step": 630 }, { "epoch": 18.0, "eval_accuracy": 0.9590163934426229, "eval_loss": 0.2608335614204407, "eval_runtime": 1.0804, "eval_samples_per_second": 112.918, "eval_steps_per_second": 14.809, "step": 630 }, { "epoch": 18.29, "learning_rate": 1.9047619047619046e-05, "loss": 0.0023, "step": 640 }, { "epoch": 18.57, "learning_rate": 1.5873015873015872e-05, "loss": 0.0001, "step": 650 }, { "epoch": 18.86, "learning_rate": 1.2698412698412699e-05, "loss": 0.0028, "step": 660 }, { "epoch": 19.0, "eval_accuracy": 0.9590163934426229, "eval_loss": 0.2601701617240906, "eval_runtime": 1.2677, "eval_samples_per_second": 96.24, "eval_steps_per_second": 12.622, "step": 665 }, { "epoch": 19.14, "learning_rate": 9.523809523809523e-06, "loss": 0.0001, "step": 670 }, { "epoch": 19.43, "learning_rate": 6.349206349206349e-06, "loss": 0.0026, "step": 680 }, { "epoch": 19.71, "learning_rate": 3.1746031746031746e-06, "loss": 0.0001, "step": 690 }, { "epoch": 20.0, "learning_rate": 0.0, "loss": 0.0022, "step": 700 }, { "epoch": 20.0, "eval_accuracy": 0.9590163934426229, "eval_loss": 0.2600506544113159, "eval_runtime": 1.1031, "eval_samples_per_second": 110.597, "eval_steps_per_second": 14.504, "step": 700 } ], "max_steps": 700, "num_train_epochs": 20, "total_flos": 1.6924553905235558e+18, "trial_name": null, "trial_params": null }