File size: 4,032 Bytes
d23325f |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 |
{
"best_metric": 0.4262450946907797,
"best_model_checkpoint": "legal-bert-lora/checkpoint-482",
"epoch": 4.0,
"eval_steps": 500,
"global_step": 643,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"eval_accuracy": 0.6297443841982959,
"eval_f1_macro": 0.274206359888179,
"eval_f1_micro": 0.6297443841982959,
"eval_f1_weighted": 0.5693924444438366,
"eval_loss": 1.3252344131469727,
"eval_macro_fpr": 0.04170202326759921,
"eval_macro_sensitivity": 0.31095312319919677,
"eval_macro_specificity": 0.9716859606487191,
"eval_precision": 0.5643117258906628,
"eval_precision_macro": 0.2864620870649182,
"eval_recall": 0.6297443841982959,
"eval_recall_macro": 0.31095312319919677,
"eval_runtime": 29.2455,
"eval_samples_per_second": 44.143,
"eval_steps_per_second": 5.539,
"eval_weighted_fpr": 0.0403035413153457,
"eval_weighted_sensitivity": 0.6297443841982959,
"eval_weighted_specificity": 0.945545025532491,
"step": 160
},
{
"epoch": 2.0,
"eval_accuracy": 0.7312161115414407,
"eval_f1_macro": 0.39668888106795264,
"eval_f1_micro": 0.7312161115414407,
"eval_f1_weighted": 0.6996238601563893,
"eval_loss": 0.8870222568511963,
"eval_macro_fpr": 0.025654492164758257,
"eval_macro_sensitivity": 0.4525442260434048,
"eval_macro_specificity": 0.9800113592544849,
"eval_precision": 0.687310022738013,
"eval_precision_macro": 0.37417463878901125,
"eval_recall": 0.7312161115414407,
"eval_recall_macro": 0.4525442260434048,
"eval_runtime": 31.4769,
"eval_samples_per_second": 41.014,
"eval_steps_per_second": 5.147,
"eval_weighted_fpr": 0.025584310255843103,
"eval_weighted_sensitivity": 0.7312161115414407,
"eval_weighted_specificity": 0.9689542772758329,
"step": 321
},
{
"epoch": 3.0,
"eval_accuracy": 0.7482571649883811,
"eval_f1_macro": 0.4262450946907797,
"eval_f1_micro": 0.7482571649883811,
"eval_f1_weighted": 0.7282078768513273,
"eval_loss": 0.7794041037559509,
"eval_macro_fpr": 0.023941075707085962,
"eval_macro_sensitivity": 0.46803400264857875,
"eval_macro_specificity": 0.9812882861560729,
"eval_precision": 0.716881212213352,
"eval_precision_macro": 0.40594566191566384,
"eval_recall": 0.7482571649883811,
"eval_recall_macro": 0.46803400264857875,
"eval_runtime": 31.9176,
"eval_samples_per_second": 40.448,
"eval_steps_per_second": 5.076,
"eval_weighted_fpr": 0.02346739836811322,
"eval_weighted_sensitivity": 0.7482571649883811,
"eval_weighted_specificity": 0.9710671273527125,
"step": 482
},
{
"epoch": 3.11,
"learning_rate": 3.4375e-05,
"loss": 1.2835,
"step": 500
},
{
"epoch": 4.0,
"eval_accuracy": 0.7443841982958946,
"eval_f1_macro": 0.4099967964216515,
"eval_f1_micro": 0.7443841982958946,
"eval_f1_weighted": 0.7145941103131069,
"eval_loss": 0.7480739951133728,
"eval_macro_fpr": 0.024347730036769315,
"eval_macro_sensitivity": 0.45879715060247334,
"eval_macro_specificity": 0.9809610383366641,
"eval_precision": 0.7084810945380595,
"eval_precision_macro": 0.39966194371515146,
"eval_recall": 0.7443841982958946,
"eval_recall_macro": 0.45879715060247334,
"eval_runtime": 31.4007,
"eval_samples_per_second": 41.114,
"eval_steps_per_second": 5.159,
"eval_weighted_fpr": 0.023940800928612886,
"eval_weighted_sensitivity": 0.7443841982958946,
"eval_weighted_specificity": 0.9700313767540658,
"step": 643
}
],
"logging_steps": 500,
"max_steps": 1600,
"num_train_epochs": 10,
"save_steps": 500,
"total_flos": 5577944869453824.0,
"trial_name": null,
"trial_params": null
}
|