{ "best_metric": 0.4942768580570481, "best_model_checkpoint": "legal-bert-lora/checkpoint-1446", "epoch": 8.995334370139968, "eval_steps": 500, "global_step": 1446, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "eval_accuracy": 0.6297443841982959, "eval_f1_macro": 0.274206359888179, "eval_f1_micro": 0.6297443841982959, "eval_f1_weighted": 0.5693924444438366, "eval_loss": 1.3252344131469727, "eval_macro_fpr": 0.04170202326759921, "eval_macro_sensitivity": 0.31095312319919677, "eval_macro_specificity": 0.9716859606487191, "eval_precision": 0.5643117258906628, "eval_precision_macro": 0.2864620870649182, "eval_recall": 0.6297443841982959, "eval_recall_macro": 0.31095312319919677, "eval_runtime": 29.2455, "eval_samples_per_second": 44.143, "eval_steps_per_second": 5.539, "eval_weighted_fpr": 0.0403035413153457, "eval_weighted_sensitivity": 0.6297443841982959, "eval_weighted_specificity": 0.945545025532491, "step": 160 }, { "epoch": 2.0, "eval_accuracy": 0.7312161115414407, "eval_f1_macro": 0.39668888106795264, "eval_f1_micro": 0.7312161115414407, "eval_f1_weighted": 0.6996238601563893, "eval_loss": 0.8870222568511963, "eval_macro_fpr": 0.025654492164758257, "eval_macro_sensitivity": 0.4525442260434048, "eval_macro_specificity": 0.9800113592544849, "eval_precision": 0.687310022738013, "eval_precision_macro": 0.37417463878901125, "eval_recall": 0.7312161115414407, "eval_recall_macro": 0.4525442260434048, "eval_runtime": 31.4769, "eval_samples_per_second": 41.014, "eval_steps_per_second": 5.147, "eval_weighted_fpr": 0.025584310255843103, "eval_weighted_sensitivity": 0.7312161115414407, "eval_weighted_specificity": 0.9689542772758329, "step": 321 }, { "epoch": 3.0, "eval_accuracy": 0.7482571649883811, "eval_f1_macro": 0.4262450946907797, "eval_f1_micro": 0.7482571649883811, "eval_f1_weighted": 0.7282078768513273, "eval_loss": 0.7794041037559509, "eval_macro_fpr": 0.023941075707085962, "eval_macro_sensitivity": 0.46803400264857875, "eval_macro_specificity": 0.9812882861560729, "eval_precision": 0.716881212213352, "eval_precision_macro": 0.40594566191566384, "eval_recall": 0.7482571649883811, "eval_recall_macro": 0.46803400264857875, "eval_runtime": 31.9176, "eval_samples_per_second": 40.448, "eval_steps_per_second": 5.076, "eval_weighted_fpr": 0.02346739836811322, "eval_weighted_sensitivity": 0.7482571649883811, "eval_weighted_specificity": 0.9710671273527125, "step": 482 }, { "epoch": 3.11, "learning_rate": 3.4375e-05, "loss": 1.2835, "step": 500 }, { "epoch": 4.0, "eval_accuracy": 0.7443841982958946, "eval_f1_macro": 0.4099967964216515, "eval_f1_micro": 0.7443841982958946, "eval_f1_weighted": 0.7145941103131069, "eval_loss": 0.7480739951133728, "eval_macro_fpr": 0.024347730036769315, "eval_macro_sensitivity": 0.45879715060247334, "eval_macro_specificity": 0.9809610383366641, "eval_precision": 0.7084810945380595, "eval_precision_macro": 0.39966194371515146, "eval_recall": 0.7443841982958946, "eval_recall_macro": 0.45879715060247334, "eval_runtime": 31.4007, "eval_samples_per_second": 41.114, "eval_steps_per_second": 5.159, "eval_weighted_fpr": 0.023940800928612886, "eval_weighted_sensitivity": 0.7443841982958946, "eval_weighted_specificity": 0.9700313767540658, "step": 643 }, { "epoch": 5.0, "eval_accuracy": 0.7629744384198296, "eval_f1_macro": 0.43501781058601113, "eval_f1_micro": 0.7629744384198296, "eval_f1_weighted": 0.7371758021368604, "eval_loss": 0.7360239624977112, "eval_macro_fpr": 0.022582062196490615, "eval_macro_sensitivity": 0.4763281068994499, "eval_macro_specificity": 0.9822126782492226, "eval_precision": 0.7245041319757508, "eval_precision_macro": 0.4175606064626592, "eval_recall": 0.7629744384198296, "eval_recall_macro": 0.4763281068994499, "eval_runtime": 31.4819, "eval_samples_per_second": 41.008, "eval_steps_per_second": 5.146, "eval_weighted_fpr": 0.021708286038592508, "eval_weighted_sensitivity": 0.7629744384198296, "eval_weighted_specificity": 0.9702157353185087, "step": 803 }, { "epoch": 6.0, "eval_accuracy": 0.7738187451587917, "eval_f1_macro": 0.45136434049983454, "eval_f1_micro": 0.7738187451587917, "eval_f1_weighted": 0.7549277434298373, "eval_loss": 0.7146413922309875, "eval_macro_fpr": 0.020909390992017808, "eval_macro_sensitivity": 0.49065578942391963, "eval_macro_specificity": 0.9831195609570588, "eval_precision": 0.7789833226684362, "eval_precision_macro": 0.5020078701673053, "eval_recall": 0.7738187451587917, "eval_recall_macro": 0.49065578942391963, "eval_runtime": 31.935, "eval_samples_per_second": 40.426, "eval_steps_per_second": 5.073, "eval_weighted_fpr": 0.020451043563524302, "eval_weighted_sensitivity": 0.7738187451587917, "eval_weighted_specificity": 0.9729746691970887, "step": 964 }, { "epoch": 6.22, "learning_rate": 1.8750000000000002e-05, "loss": 0.6494, "step": 1000 }, { "epoch": 7.0, "eval_accuracy": 0.7606506584043378, "eval_f1_macro": 0.4555893583613109, "eval_f1_micro": 0.7606506584043377, "eval_f1_weighted": 0.739017992628783, "eval_loss": 0.7362409234046936, "eval_macro_fpr": 0.022493653031422953, "eval_macro_sensitivity": 0.4889578896745981, "eval_macro_specificity": 0.9822020479931979, "eval_precision": 0.7519338544853175, "eval_precision_macro": 0.5232191620367644, "eval_recall": 0.7606506584043378, "eval_recall_macro": 0.4889578896745981, "eval_runtime": 31.5363, "eval_samples_per_second": 40.937, "eval_steps_per_second": 5.137, "eval_weighted_fpr": 0.021981930710677954, "eval_weighted_sensitivity": 0.7606506584043378, "eval_weighted_specificity": 0.9723800614936304, "step": 1125 }, { "epoch": 8.0, "eval_accuracy": 0.78001549186677, "eval_f1_macro": 0.492346438039213, "eval_f1_micro": 0.78001549186677, "eval_f1_weighted": 0.7616714702598053, "eval_loss": 0.7271353006362915, "eval_macro_fpr": 0.020514731186999667, "eval_macro_sensitivity": 0.517079968248798, "eval_macro_specificity": 0.9835380831075756, "eval_precision": 0.7639081358018293, "eval_precision_macro": 0.5348049874207874, "eval_recall": 0.78001549186677, "eval_recall_macro": 0.517079968248798, "eval_runtime": 31.6682, "eval_samples_per_second": 40.766, "eval_steps_per_second": 5.116, "eval_weighted_fpr": 0.0197469058545404, "eval_weighted_sensitivity": 0.78001549186677, "eval_weighted_specificity": 0.9730557547468652, "step": 1286 }, { "epoch": 9.0, "eval_accuracy": 0.7846630518977536, "eval_f1_macro": 0.4942768580570481, "eval_f1_micro": 0.7846630518977536, "eval_f1_weighted": 0.7665188470695673, "eval_loss": 0.7067885398864746, "eval_macro_fpr": 0.019851450460712513, "eval_macro_sensitivity": 0.5204636688208197, "eval_macro_specificity": 0.9839403746401699, "eval_precision": 0.7739358194210298, "eval_precision_macro": 0.5494759535541606, "eval_recall": 0.7846630518977536, "eval_recall_macro": 0.5204636688208197, "eval_runtime": 32.9208, "eval_samples_per_second": 39.215, "eval_steps_per_second": 4.921, "eval_weighted_fpr": 0.01922544951590595, "eval_weighted_sensitivity": 0.7846630518977536, "eval_weighted_specificity": 0.974442567704795, "step": 1446 } ], "logging_steps": 500, "max_steps": 1600, "num_train_epochs": 10, "save_steps": 500, "total_flos": 1.2550375956271104e+16, "trial_name": null, "trial_params": null }