{ "best_metric": 0.45136434049983454, "best_model_checkpoint": "legal-bert-lora/checkpoint-964", "epoch": 5.996889580093312, "eval_steps": 500, "global_step": 964, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "eval_accuracy": 0.6297443841982959, "eval_f1_macro": 0.274206359888179, "eval_f1_micro": 0.6297443841982959, "eval_f1_weighted": 0.5693924444438366, "eval_loss": 1.3252344131469727, "eval_macro_fpr": 0.04170202326759921, "eval_macro_sensitivity": 0.31095312319919677, "eval_macro_specificity": 0.9716859606487191, "eval_precision": 0.5643117258906628, "eval_precision_macro": 0.2864620870649182, "eval_recall": 0.6297443841982959, "eval_recall_macro": 0.31095312319919677, "eval_runtime": 29.2455, "eval_samples_per_second": 44.143, "eval_steps_per_second": 5.539, "eval_weighted_fpr": 0.0403035413153457, "eval_weighted_sensitivity": 0.6297443841982959, "eval_weighted_specificity": 0.945545025532491, "step": 160 }, { "epoch": 2.0, "eval_accuracy": 0.7312161115414407, "eval_f1_macro": 0.39668888106795264, "eval_f1_micro": 0.7312161115414407, "eval_f1_weighted": 0.6996238601563893, "eval_loss": 0.8870222568511963, "eval_macro_fpr": 0.025654492164758257, "eval_macro_sensitivity": 0.4525442260434048, "eval_macro_specificity": 0.9800113592544849, "eval_precision": 0.687310022738013, "eval_precision_macro": 0.37417463878901125, "eval_recall": 0.7312161115414407, "eval_recall_macro": 0.4525442260434048, "eval_runtime": 31.4769, "eval_samples_per_second": 41.014, "eval_steps_per_second": 5.147, "eval_weighted_fpr": 0.025584310255843103, "eval_weighted_sensitivity": 0.7312161115414407, "eval_weighted_specificity": 0.9689542772758329, "step": 321 }, { "epoch": 3.0, "eval_accuracy": 0.7482571649883811, "eval_f1_macro": 0.4262450946907797, "eval_f1_micro": 0.7482571649883811, "eval_f1_weighted": 0.7282078768513273, "eval_loss": 0.7794041037559509, "eval_macro_fpr": 0.023941075707085962, "eval_macro_sensitivity": 0.46803400264857875, "eval_macro_specificity": 0.9812882861560729, "eval_precision": 0.716881212213352, "eval_precision_macro": 0.40594566191566384, "eval_recall": 0.7482571649883811, "eval_recall_macro": 0.46803400264857875, "eval_runtime": 31.9176, "eval_samples_per_second": 40.448, "eval_steps_per_second": 5.076, "eval_weighted_fpr": 0.02346739836811322, "eval_weighted_sensitivity": 0.7482571649883811, "eval_weighted_specificity": 0.9710671273527125, "step": 482 }, { "epoch": 3.11, "learning_rate": 3.4375e-05, "loss": 1.2835, "step": 500 }, { "epoch": 4.0, "eval_accuracy": 0.7443841982958946, "eval_f1_macro": 0.4099967964216515, "eval_f1_micro": 0.7443841982958946, "eval_f1_weighted": 0.7145941103131069, "eval_loss": 0.7480739951133728, "eval_macro_fpr": 0.024347730036769315, "eval_macro_sensitivity": 0.45879715060247334, "eval_macro_specificity": 0.9809610383366641, "eval_precision": 0.7084810945380595, "eval_precision_macro": 0.39966194371515146, "eval_recall": 0.7443841982958946, "eval_recall_macro": 0.45879715060247334, "eval_runtime": 31.4007, "eval_samples_per_second": 41.114, "eval_steps_per_second": 5.159, "eval_weighted_fpr": 0.023940800928612886, "eval_weighted_sensitivity": 0.7443841982958946, "eval_weighted_specificity": 0.9700313767540658, "step": 643 }, { "epoch": 5.0, "eval_accuracy": 0.7629744384198296, "eval_f1_macro": 0.43501781058601113, "eval_f1_micro": 0.7629744384198296, "eval_f1_weighted": 0.7371758021368604, "eval_loss": 0.7360239624977112, "eval_macro_fpr": 0.022582062196490615, "eval_macro_sensitivity": 0.4763281068994499, "eval_macro_specificity": 0.9822126782492226, "eval_precision": 0.7245041319757508, "eval_precision_macro": 0.4175606064626592, "eval_recall": 0.7629744384198296, "eval_recall_macro": 0.4763281068994499, "eval_runtime": 31.4819, "eval_samples_per_second": 41.008, "eval_steps_per_second": 5.146, "eval_weighted_fpr": 0.021708286038592508, "eval_weighted_sensitivity": 0.7629744384198296, "eval_weighted_specificity": 0.9702157353185087, "step": 803 }, { "epoch": 6.0, "eval_accuracy": 0.7738187451587917, "eval_f1_macro": 0.45136434049983454, "eval_f1_micro": 0.7738187451587917, "eval_f1_weighted": 0.7549277434298373, "eval_loss": 0.7146413922309875, "eval_macro_fpr": 0.020909390992017808, "eval_macro_sensitivity": 0.49065578942391963, "eval_macro_specificity": 0.9831195609570588, "eval_precision": 0.7789833226684362, "eval_precision_macro": 0.5020078701673053, "eval_recall": 0.7738187451587917, "eval_recall_macro": 0.49065578942391963, "eval_runtime": 31.935, "eval_samples_per_second": 40.426, "eval_steps_per_second": 5.073, "eval_weighted_fpr": 0.020451043563524302, "eval_weighted_sensitivity": 0.7738187451587917, "eval_weighted_specificity": 0.9729746691970887, "step": 964 } ], "logging_steps": 500, "max_steps": 1600, "num_train_epochs": 10, "save_steps": 500, "total_flos": 8366917304180736.0, "trial_name": null, "trial_params": null }