|
{ |
|
"best_metric": 0.5903876477694423, |
|
"best_model_checkpoint": "case-analysis-legal-bert-base-uncased/checkpoint-896", |
|
"epoch": 4.0, |
|
"eval_steps": 500, |
|
"global_step": 896, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"eval_accuracy": 0.6570155902004454, |
|
"eval_f1_macro": 0.4081263564022185, |
|
"eval_f1_micro": 0.6570155902004454, |
|
"eval_f1_weighted": 0.6166399839312825, |
|
"eval_loss": 1.0114229917526245, |
|
"eval_macro_fpr": 0.19475132363363487, |
|
"eval_macro_sensitivity": 0.40746667217255456, |
|
"eval_macro_specificity": 0.8324392236563901, |
|
"eval_precision": 0.6178816225558943, |
|
"eval_precision_macro": 0.4664000256488353, |
|
"eval_recall": 0.6570155902004454, |
|
"eval_recall_macro": 0.40746667217255456, |
|
"eval_runtime": 7.3199, |
|
"eval_samples_per_second": 61.34, |
|
"eval_steps_per_second": 7.787, |
|
"eval_weighted_fpr": 0.1482194417709336, |
|
"eval_weighted_sensitivity": 0.6570155902004454, |
|
"eval_weighted_specificity": 0.6727413044251147, |
|
"step": 224 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_accuracy": 0.7750556792873051, |
|
"eval_f1_macro": 0.5658663855845003, |
|
"eval_f1_micro": 0.775055679287305, |
|
"eval_f1_weighted": 0.7564492543508543, |
|
"eval_loss": 0.764952540397644, |
|
"eval_macro_fpr": 0.10943701020063132, |
|
"eval_macro_sensitivity": 0.5805958747135218, |
|
"eval_macro_specificity": 0.9039084791647444, |
|
"eval_precision": 0.7425093237919278, |
|
"eval_precision_macro": 0.5566158325717437, |
|
"eval_recall": 0.7750556792873051, |
|
"eval_recall_macro": 0.5805958747135218, |
|
"eval_runtime": 30.7218, |
|
"eval_samples_per_second": 14.615, |
|
"eval_steps_per_second": 1.855, |
|
"eval_weighted_fpr": 0.08820960698689956, |
|
"eval_weighted_sensitivity": 0.7750556792873051, |
|
"eval_weighted_specificity": 0.8405782373716723, |
|
"step": 448 |
|
}, |
|
{ |
|
"epoch": 2.232142857142857, |
|
"grad_norm": 9.53757095336914, |
|
"learning_rate": 4.631696428571429e-05, |
|
"loss": 0.7677, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_accuracy": 0.7817371937639198, |
|
"eval_f1_macro": 0.5707248076329534, |
|
"eval_f1_micro": 0.7817371937639198, |
|
"eval_f1_weighted": 0.7678448816993292, |
|
"eval_loss": 0.7341566681861877, |
|
"eval_macro_fpr": 0.10409605667370833, |
|
"eval_macro_sensitivity": 0.5967117805353099, |
|
"eval_macro_specificity": 0.9083046086144851, |
|
"eval_precision": 0.7694906286035585, |
|
"eval_precision_macro": 0.5673619923602318, |
|
"eval_recall": 0.7817371937639198, |
|
"eval_recall_macro": 0.5967117805353099, |
|
"eval_runtime": 32.9882, |
|
"eval_samples_per_second": 13.611, |
|
"eval_steps_per_second": 1.728, |
|
"eval_weighted_fpr": 0.08514335360556038, |
|
"eval_weighted_sensitivity": 0.7817371937639198, |
|
"eval_weighted_specificity": 0.8514812406940205, |
|
"step": 672 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_accuracy": 0.8173719376391982, |
|
"eval_f1_macro": 0.5903876477694423, |
|
"eval_f1_micro": 0.8173719376391981, |
|
"eval_f1_weighted": 0.7920921547144288, |
|
"eval_loss": 0.7967568635940552, |
|
"eval_macro_fpr": 0.09654289346260755, |
|
"eval_macro_sensitivity": 0.5892796922208687, |
|
"eval_macro_specificity": 0.9135512326349768, |
|
"eval_precision": 0.776630887817645, |
|
"eval_precision_macro": 0.6035747039094435, |
|
"eval_recall": 0.8173719376391982, |
|
"eval_recall_macro": 0.5892796922208687, |
|
"eval_runtime": 31.5737, |
|
"eval_samples_per_second": 14.221, |
|
"eval_steps_per_second": 1.805, |
|
"eval_weighted_fpr": 0.06931530008453085, |
|
"eval_weighted_sensitivity": 0.8173719376391982, |
|
"eval_weighted_specificity": 0.836832992900709, |
|
"step": 896 |
|
} |
|
], |
|
"logging_steps": 500, |
|
"max_steps": 6720, |
|
"num_input_tokens_seen": 0, |
|
"num_train_epochs": 30, |
|
"save_steps": 500, |
|
"total_flos": 1886013911728128.0, |
|
"train_batch_size": 8, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|