xshubhamx's picture
Upload folder using huggingface_hub
ac73358 verified
raw
history blame
8.49 kB
{
"best_metric": 0.4942768580570481,
"best_model_checkpoint": "legal-bert-lora/checkpoint-1446",
"epoch": 8.995334370139968,
"eval_steps": 500,
"global_step": 1446,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"eval_accuracy": 0.6297443841982959,
"eval_f1_macro": 0.274206359888179,
"eval_f1_micro": 0.6297443841982959,
"eval_f1_weighted": 0.5693924444438366,
"eval_loss": 1.3252344131469727,
"eval_macro_fpr": 0.04170202326759921,
"eval_macro_sensitivity": 0.31095312319919677,
"eval_macro_specificity": 0.9716859606487191,
"eval_precision": 0.5643117258906628,
"eval_precision_macro": 0.2864620870649182,
"eval_recall": 0.6297443841982959,
"eval_recall_macro": 0.31095312319919677,
"eval_runtime": 29.2455,
"eval_samples_per_second": 44.143,
"eval_steps_per_second": 5.539,
"eval_weighted_fpr": 0.0403035413153457,
"eval_weighted_sensitivity": 0.6297443841982959,
"eval_weighted_specificity": 0.945545025532491,
"step": 160
},
{
"epoch": 2.0,
"eval_accuracy": 0.7312161115414407,
"eval_f1_macro": 0.39668888106795264,
"eval_f1_micro": 0.7312161115414407,
"eval_f1_weighted": 0.6996238601563893,
"eval_loss": 0.8870222568511963,
"eval_macro_fpr": 0.025654492164758257,
"eval_macro_sensitivity": 0.4525442260434048,
"eval_macro_specificity": 0.9800113592544849,
"eval_precision": 0.687310022738013,
"eval_precision_macro": 0.37417463878901125,
"eval_recall": 0.7312161115414407,
"eval_recall_macro": 0.4525442260434048,
"eval_runtime": 31.4769,
"eval_samples_per_second": 41.014,
"eval_steps_per_second": 5.147,
"eval_weighted_fpr": 0.025584310255843103,
"eval_weighted_sensitivity": 0.7312161115414407,
"eval_weighted_specificity": 0.9689542772758329,
"step": 321
},
{
"epoch": 3.0,
"eval_accuracy": 0.7482571649883811,
"eval_f1_macro": 0.4262450946907797,
"eval_f1_micro": 0.7482571649883811,
"eval_f1_weighted": 0.7282078768513273,
"eval_loss": 0.7794041037559509,
"eval_macro_fpr": 0.023941075707085962,
"eval_macro_sensitivity": 0.46803400264857875,
"eval_macro_specificity": 0.9812882861560729,
"eval_precision": 0.716881212213352,
"eval_precision_macro": 0.40594566191566384,
"eval_recall": 0.7482571649883811,
"eval_recall_macro": 0.46803400264857875,
"eval_runtime": 31.9176,
"eval_samples_per_second": 40.448,
"eval_steps_per_second": 5.076,
"eval_weighted_fpr": 0.02346739836811322,
"eval_weighted_sensitivity": 0.7482571649883811,
"eval_weighted_specificity": 0.9710671273527125,
"step": 482
},
{
"epoch": 3.11,
"learning_rate": 3.4375e-05,
"loss": 1.2835,
"step": 500
},
{
"epoch": 4.0,
"eval_accuracy": 0.7443841982958946,
"eval_f1_macro": 0.4099967964216515,
"eval_f1_micro": 0.7443841982958946,
"eval_f1_weighted": 0.7145941103131069,
"eval_loss": 0.7480739951133728,
"eval_macro_fpr": 0.024347730036769315,
"eval_macro_sensitivity": 0.45879715060247334,
"eval_macro_specificity": 0.9809610383366641,
"eval_precision": 0.7084810945380595,
"eval_precision_macro": 0.39966194371515146,
"eval_recall": 0.7443841982958946,
"eval_recall_macro": 0.45879715060247334,
"eval_runtime": 31.4007,
"eval_samples_per_second": 41.114,
"eval_steps_per_second": 5.159,
"eval_weighted_fpr": 0.023940800928612886,
"eval_weighted_sensitivity": 0.7443841982958946,
"eval_weighted_specificity": 0.9700313767540658,
"step": 643
},
{
"epoch": 5.0,
"eval_accuracy": 0.7629744384198296,
"eval_f1_macro": 0.43501781058601113,
"eval_f1_micro": 0.7629744384198296,
"eval_f1_weighted": 0.7371758021368604,
"eval_loss": 0.7360239624977112,
"eval_macro_fpr": 0.022582062196490615,
"eval_macro_sensitivity": 0.4763281068994499,
"eval_macro_specificity": 0.9822126782492226,
"eval_precision": 0.7245041319757508,
"eval_precision_macro": 0.4175606064626592,
"eval_recall": 0.7629744384198296,
"eval_recall_macro": 0.4763281068994499,
"eval_runtime": 31.4819,
"eval_samples_per_second": 41.008,
"eval_steps_per_second": 5.146,
"eval_weighted_fpr": 0.021708286038592508,
"eval_weighted_sensitivity": 0.7629744384198296,
"eval_weighted_specificity": 0.9702157353185087,
"step": 803
},
{
"epoch": 6.0,
"eval_accuracy": 0.7738187451587917,
"eval_f1_macro": 0.45136434049983454,
"eval_f1_micro": 0.7738187451587917,
"eval_f1_weighted": 0.7549277434298373,
"eval_loss": 0.7146413922309875,
"eval_macro_fpr": 0.020909390992017808,
"eval_macro_sensitivity": 0.49065578942391963,
"eval_macro_specificity": 0.9831195609570588,
"eval_precision": 0.7789833226684362,
"eval_precision_macro": 0.5020078701673053,
"eval_recall": 0.7738187451587917,
"eval_recall_macro": 0.49065578942391963,
"eval_runtime": 31.935,
"eval_samples_per_second": 40.426,
"eval_steps_per_second": 5.073,
"eval_weighted_fpr": 0.020451043563524302,
"eval_weighted_sensitivity": 0.7738187451587917,
"eval_weighted_specificity": 0.9729746691970887,
"step": 964
},
{
"epoch": 6.22,
"learning_rate": 1.8750000000000002e-05,
"loss": 0.6494,
"step": 1000
},
{
"epoch": 7.0,
"eval_accuracy": 0.7606506584043378,
"eval_f1_macro": 0.4555893583613109,
"eval_f1_micro": 0.7606506584043377,
"eval_f1_weighted": 0.739017992628783,
"eval_loss": 0.7362409234046936,
"eval_macro_fpr": 0.022493653031422953,
"eval_macro_sensitivity": 0.4889578896745981,
"eval_macro_specificity": 0.9822020479931979,
"eval_precision": 0.7519338544853175,
"eval_precision_macro": 0.5232191620367644,
"eval_recall": 0.7606506584043378,
"eval_recall_macro": 0.4889578896745981,
"eval_runtime": 31.5363,
"eval_samples_per_second": 40.937,
"eval_steps_per_second": 5.137,
"eval_weighted_fpr": 0.021981930710677954,
"eval_weighted_sensitivity": 0.7606506584043378,
"eval_weighted_specificity": 0.9723800614936304,
"step": 1125
},
{
"epoch": 8.0,
"eval_accuracy": 0.78001549186677,
"eval_f1_macro": 0.492346438039213,
"eval_f1_micro": 0.78001549186677,
"eval_f1_weighted": 0.7616714702598053,
"eval_loss": 0.7271353006362915,
"eval_macro_fpr": 0.020514731186999667,
"eval_macro_sensitivity": 0.517079968248798,
"eval_macro_specificity": 0.9835380831075756,
"eval_precision": 0.7639081358018293,
"eval_precision_macro": 0.5348049874207874,
"eval_recall": 0.78001549186677,
"eval_recall_macro": 0.517079968248798,
"eval_runtime": 31.6682,
"eval_samples_per_second": 40.766,
"eval_steps_per_second": 5.116,
"eval_weighted_fpr": 0.0197469058545404,
"eval_weighted_sensitivity": 0.78001549186677,
"eval_weighted_specificity": 0.9730557547468652,
"step": 1286
},
{
"epoch": 9.0,
"eval_accuracy": 0.7846630518977536,
"eval_f1_macro": 0.4942768580570481,
"eval_f1_micro": 0.7846630518977536,
"eval_f1_weighted": 0.7665188470695673,
"eval_loss": 0.7067885398864746,
"eval_macro_fpr": 0.019851450460712513,
"eval_macro_sensitivity": 0.5204636688208197,
"eval_macro_specificity": 0.9839403746401699,
"eval_precision": 0.7739358194210298,
"eval_precision_macro": 0.5494759535541606,
"eval_recall": 0.7846630518977536,
"eval_recall_macro": 0.5204636688208197,
"eval_runtime": 32.9208,
"eval_samples_per_second": 39.215,
"eval_steps_per_second": 4.921,
"eval_weighted_fpr": 0.01922544951590595,
"eval_weighted_sensitivity": 0.7846630518977536,
"eval_weighted_specificity": 0.974442567704795,
"step": 1446
}
],
"logging_steps": 500,
"max_steps": 1600,
"num_train_epochs": 10,
"save_steps": 500,
"total_flos": 1.2550375956271104e+16,
"trial_name": null,
"trial_params": null
}