|
{ |
|
"best_metric": 0.50872844, |
|
"best_model_checkpoint": "/content/output/qwen2-vl-7b-instruct/v2-20240909-100714/checkpoint-45", |
|
"epoch": 0.993103448275862, |
|
"eval_steps": 50, |
|
"global_step": 45, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"acc": 0.61398816, |
|
"epoch": 0.022068965517241378, |
|
"grad_norm": 7.717197895050049, |
|
"learning_rate": 3.3333333333333335e-05, |
|
"loss": 2.87438893, |
|
"memory(GiB)": 20.29, |
|
"step": 1, |
|
"train_speed(iter/s)": 0.066629 |
|
}, |
|
{ |
|
"acc": 0.62096363, |
|
"epoch": 0.1103448275862069, |
|
"grad_norm": 8.616560935974121, |
|
"learning_rate": 9.944154131125642e-05, |
|
"loss": 2.60930538, |
|
"memory(GiB)": 22.58, |
|
"step": 5, |
|
"train_speed(iter/s)": 0.075138 |
|
}, |
|
{ |
|
"acc": 0.80472717, |
|
"epoch": 0.2206896551724138, |
|
"grad_norm": 3.399202346801758, |
|
"learning_rate": 9.330127018922194e-05, |
|
"loss": 0.68508205, |
|
"memory(GiB)": 23.35, |
|
"step": 10, |
|
"train_speed(iter/s)": 0.076348 |
|
}, |
|
{ |
|
"acc": 0.81436024, |
|
"epoch": 0.3310344827586207, |
|
"grad_norm": 5.226686477661133, |
|
"learning_rate": 8.117449009293668e-05, |
|
"loss": 0.69332366, |
|
"memory(GiB)": 24.12, |
|
"step": 15, |
|
"train_speed(iter/s)": 0.076737 |
|
}, |
|
{ |
|
"acc": 0.86372032, |
|
"epoch": 0.4413793103448276, |
|
"grad_norm": 3.478239059448242, |
|
"learning_rate": 6.473775872054521e-05, |
|
"loss": 0.57136168, |
|
"memory(GiB)": 24.12, |
|
"step": 20, |
|
"train_speed(iter/s)": 0.076946 |
|
}, |
|
{ |
|
"acc": 0.85740089, |
|
"epoch": 0.5517241379310345, |
|
"grad_norm": 2.1063661575317383, |
|
"learning_rate": 4.626349532067879e-05, |
|
"loss": 0.51958747, |
|
"memory(GiB)": 24.91, |
|
"step": 25, |
|
"train_speed(iter/s)": 0.077061 |
|
}, |
|
{ |
|
"acc": 0.85881948, |
|
"epoch": 0.6620689655172414, |
|
"grad_norm": 2.6917998790740967, |
|
"learning_rate": 2.8305813044122097e-05, |
|
"loss": 0.51737795, |
|
"memory(GiB)": 24.91, |
|
"step": 30, |
|
"train_speed(iter/s)": 0.077142 |
|
}, |
|
{ |
|
"acc": 0.84086313, |
|
"epoch": 0.7724137931034483, |
|
"grad_norm": 7.916348934173584, |
|
"learning_rate": 1.3347406408508695e-05, |
|
"loss": 0.72901492, |
|
"memory(GiB)": 24.91, |
|
"step": 35, |
|
"train_speed(iter/s)": 0.077198 |
|
}, |
|
{ |
|
"acc": 0.86680059, |
|
"epoch": 0.8827586206896552, |
|
"grad_norm": 2.948944568634033, |
|
"learning_rate": 3.4563125677897932e-06, |
|
"loss": 0.43249173, |
|
"memory(GiB)": 24.91, |
|
"step": 40, |
|
"train_speed(iter/s)": 0.077243 |
|
}, |
|
{ |
|
"acc": 0.91657734, |
|
"epoch": 0.993103448275862, |
|
"grad_norm": 2.6367099285125732, |
|
"learning_rate": 0.0, |
|
"loss": 0.34231672, |
|
"memory(GiB)": 24.91, |
|
"step": 45, |
|
"train_speed(iter/s)": 0.077273 |
|
}, |
|
{ |
|
"epoch": 0.993103448275862, |
|
"eval_acc": 0.8181818181818182, |
|
"eval_loss": 0.5087284445762634, |
|
"eval_runtime": 3.4104, |
|
"eval_samples_per_second": 2.053, |
|
"eval_steps_per_second": 2.053, |
|
"step": 45 |
|
} |
|
], |
|
"logging_steps": 5, |
|
"max_steps": 45, |
|
"num_input_tokens_seen": 0, |
|
"num_train_epochs": 1, |
|
"save_steps": 50, |
|
"stateful_callbacks": { |
|
"TrainerControl": { |
|
"args": { |
|
"should_epoch_stop": false, |
|
"should_evaluate": false, |
|
"should_log": false, |
|
"should_save": true, |
|
"should_training_stop": true |
|
}, |
|
"attributes": {} |
|
} |
|
}, |
|
"total_flos": 4.488065503664026e+16, |
|
"train_batch_size": 1, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|