|
{ |
|
"best_metric": 0.4942768580570481, |
|
"best_model_checkpoint": "legal-bert-lora/checkpoint-1446", |
|
"epoch": 8.995334370139968, |
|
"eval_steps": 500, |
|
"global_step": 1446, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"eval_accuracy": 0.6297443841982959, |
|
"eval_f1_macro": 0.274206359888179, |
|
"eval_f1_micro": 0.6297443841982959, |
|
"eval_f1_weighted": 0.5693924444438366, |
|
"eval_loss": 1.3252344131469727, |
|
"eval_macro_fpr": 0.04170202326759921, |
|
"eval_macro_sensitivity": 0.31095312319919677, |
|
"eval_macro_specificity": 0.9716859606487191, |
|
"eval_precision": 0.5643117258906628, |
|
"eval_precision_macro": 0.2864620870649182, |
|
"eval_recall": 0.6297443841982959, |
|
"eval_recall_macro": 0.31095312319919677, |
|
"eval_runtime": 29.2455, |
|
"eval_samples_per_second": 44.143, |
|
"eval_steps_per_second": 5.539, |
|
"eval_weighted_fpr": 0.0403035413153457, |
|
"eval_weighted_sensitivity": 0.6297443841982959, |
|
"eval_weighted_specificity": 0.945545025532491, |
|
"step": 160 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_accuracy": 0.7312161115414407, |
|
"eval_f1_macro": 0.39668888106795264, |
|
"eval_f1_micro": 0.7312161115414407, |
|
"eval_f1_weighted": 0.6996238601563893, |
|
"eval_loss": 0.8870222568511963, |
|
"eval_macro_fpr": 0.025654492164758257, |
|
"eval_macro_sensitivity": 0.4525442260434048, |
|
"eval_macro_specificity": 0.9800113592544849, |
|
"eval_precision": 0.687310022738013, |
|
"eval_precision_macro": 0.37417463878901125, |
|
"eval_recall": 0.7312161115414407, |
|
"eval_recall_macro": 0.4525442260434048, |
|
"eval_runtime": 31.4769, |
|
"eval_samples_per_second": 41.014, |
|
"eval_steps_per_second": 5.147, |
|
"eval_weighted_fpr": 0.025584310255843103, |
|
"eval_weighted_sensitivity": 0.7312161115414407, |
|
"eval_weighted_specificity": 0.9689542772758329, |
|
"step": 321 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_accuracy": 0.7482571649883811, |
|
"eval_f1_macro": 0.4262450946907797, |
|
"eval_f1_micro": 0.7482571649883811, |
|
"eval_f1_weighted": 0.7282078768513273, |
|
"eval_loss": 0.7794041037559509, |
|
"eval_macro_fpr": 0.023941075707085962, |
|
"eval_macro_sensitivity": 0.46803400264857875, |
|
"eval_macro_specificity": 0.9812882861560729, |
|
"eval_precision": 0.716881212213352, |
|
"eval_precision_macro": 0.40594566191566384, |
|
"eval_recall": 0.7482571649883811, |
|
"eval_recall_macro": 0.46803400264857875, |
|
"eval_runtime": 31.9176, |
|
"eval_samples_per_second": 40.448, |
|
"eval_steps_per_second": 5.076, |
|
"eval_weighted_fpr": 0.02346739836811322, |
|
"eval_weighted_sensitivity": 0.7482571649883811, |
|
"eval_weighted_specificity": 0.9710671273527125, |
|
"step": 482 |
|
}, |
|
{ |
|
"epoch": 3.11, |
|
"learning_rate": 3.4375e-05, |
|
"loss": 1.2835, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_accuracy": 0.7443841982958946, |
|
"eval_f1_macro": 0.4099967964216515, |
|
"eval_f1_micro": 0.7443841982958946, |
|
"eval_f1_weighted": 0.7145941103131069, |
|
"eval_loss": 0.7480739951133728, |
|
"eval_macro_fpr": 0.024347730036769315, |
|
"eval_macro_sensitivity": 0.45879715060247334, |
|
"eval_macro_specificity": 0.9809610383366641, |
|
"eval_precision": 0.7084810945380595, |
|
"eval_precision_macro": 0.39966194371515146, |
|
"eval_recall": 0.7443841982958946, |
|
"eval_recall_macro": 0.45879715060247334, |
|
"eval_runtime": 31.4007, |
|
"eval_samples_per_second": 41.114, |
|
"eval_steps_per_second": 5.159, |
|
"eval_weighted_fpr": 0.023940800928612886, |
|
"eval_weighted_sensitivity": 0.7443841982958946, |
|
"eval_weighted_specificity": 0.9700313767540658, |
|
"step": 643 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_accuracy": 0.7629744384198296, |
|
"eval_f1_macro": 0.43501781058601113, |
|
"eval_f1_micro": 0.7629744384198296, |
|
"eval_f1_weighted": 0.7371758021368604, |
|
"eval_loss": 0.7360239624977112, |
|
"eval_macro_fpr": 0.022582062196490615, |
|
"eval_macro_sensitivity": 0.4763281068994499, |
|
"eval_macro_specificity": 0.9822126782492226, |
|
"eval_precision": 0.7245041319757508, |
|
"eval_precision_macro": 0.4175606064626592, |
|
"eval_recall": 0.7629744384198296, |
|
"eval_recall_macro": 0.4763281068994499, |
|
"eval_runtime": 31.4819, |
|
"eval_samples_per_second": 41.008, |
|
"eval_steps_per_second": 5.146, |
|
"eval_weighted_fpr": 0.021708286038592508, |
|
"eval_weighted_sensitivity": 0.7629744384198296, |
|
"eval_weighted_specificity": 0.9702157353185087, |
|
"step": 803 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_accuracy": 0.7738187451587917, |
|
"eval_f1_macro": 0.45136434049983454, |
|
"eval_f1_micro": 0.7738187451587917, |
|
"eval_f1_weighted": 0.7549277434298373, |
|
"eval_loss": 0.7146413922309875, |
|
"eval_macro_fpr": 0.020909390992017808, |
|
"eval_macro_sensitivity": 0.49065578942391963, |
|
"eval_macro_specificity": 0.9831195609570588, |
|
"eval_precision": 0.7789833226684362, |
|
"eval_precision_macro": 0.5020078701673053, |
|
"eval_recall": 0.7738187451587917, |
|
"eval_recall_macro": 0.49065578942391963, |
|
"eval_runtime": 31.935, |
|
"eval_samples_per_second": 40.426, |
|
"eval_steps_per_second": 5.073, |
|
"eval_weighted_fpr": 0.020451043563524302, |
|
"eval_weighted_sensitivity": 0.7738187451587917, |
|
"eval_weighted_specificity": 0.9729746691970887, |
|
"step": 964 |
|
}, |
|
{ |
|
"epoch": 6.22, |
|
"learning_rate": 1.8750000000000002e-05, |
|
"loss": 0.6494, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_accuracy": 0.7606506584043378, |
|
"eval_f1_macro": 0.4555893583613109, |
|
"eval_f1_micro": 0.7606506584043377, |
|
"eval_f1_weighted": 0.739017992628783, |
|
"eval_loss": 0.7362409234046936, |
|
"eval_macro_fpr": 0.022493653031422953, |
|
"eval_macro_sensitivity": 0.4889578896745981, |
|
"eval_macro_specificity": 0.9822020479931979, |
|
"eval_precision": 0.7519338544853175, |
|
"eval_precision_macro": 0.5232191620367644, |
|
"eval_recall": 0.7606506584043378, |
|
"eval_recall_macro": 0.4889578896745981, |
|
"eval_runtime": 31.5363, |
|
"eval_samples_per_second": 40.937, |
|
"eval_steps_per_second": 5.137, |
|
"eval_weighted_fpr": 0.021981930710677954, |
|
"eval_weighted_sensitivity": 0.7606506584043378, |
|
"eval_weighted_specificity": 0.9723800614936304, |
|
"step": 1125 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_accuracy": 0.78001549186677, |
|
"eval_f1_macro": 0.492346438039213, |
|
"eval_f1_micro": 0.78001549186677, |
|
"eval_f1_weighted": 0.7616714702598053, |
|
"eval_loss": 0.7271353006362915, |
|
"eval_macro_fpr": 0.020514731186999667, |
|
"eval_macro_sensitivity": 0.517079968248798, |
|
"eval_macro_specificity": 0.9835380831075756, |
|
"eval_precision": 0.7639081358018293, |
|
"eval_precision_macro": 0.5348049874207874, |
|
"eval_recall": 0.78001549186677, |
|
"eval_recall_macro": 0.517079968248798, |
|
"eval_runtime": 31.6682, |
|
"eval_samples_per_second": 40.766, |
|
"eval_steps_per_second": 5.116, |
|
"eval_weighted_fpr": 0.0197469058545404, |
|
"eval_weighted_sensitivity": 0.78001549186677, |
|
"eval_weighted_specificity": 0.9730557547468652, |
|
"step": 1286 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_accuracy": 0.7846630518977536, |
|
"eval_f1_macro": 0.4942768580570481, |
|
"eval_f1_micro": 0.7846630518977536, |
|
"eval_f1_weighted": 0.7665188470695673, |
|
"eval_loss": 0.7067885398864746, |
|
"eval_macro_fpr": 0.019851450460712513, |
|
"eval_macro_sensitivity": 0.5204636688208197, |
|
"eval_macro_specificity": 0.9839403746401699, |
|
"eval_precision": 0.7739358194210298, |
|
"eval_precision_macro": 0.5494759535541606, |
|
"eval_recall": 0.7846630518977536, |
|
"eval_recall_macro": 0.5204636688208197, |
|
"eval_runtime": 32.9208, |
|
"eval_samples_per_second": 39.215, |
|
"eval_steps_per_second": 4.921, |
|
"eval_weighted_fpr": 0.01922544951590595, |
|
"eval_weighted_sensitivity": 0.7846630518977536, |
|
"eval_weighted_specificity": 0.974442567704795, |
|
"step": 1446 |
|
} |
|
], |
|
"logging_steps": 500, |
|
"max_steps": 1600, |
|
"num_train_epochs": 10, |
|
"save_steps": 500, |
|
"total_flos": 1.2550375956271104e+16, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|