|
{ |
|
"best_metric": null, |
|
"best_model_checkpoint": null, |
|
"epoch": 18.06451612903226, |
|
"global_step": 140, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.9, |
|
"eval_accuracy": 0.7432239657631954, |
|
"eval_f1": 0.0, |
|
"eval_loss": 1.1863211393356323, |
|
"eval_precision": 0.0, |
|
"eval_recall": 0.0, |
|
"eval_runtime": 0.0695, |
|
"eval_samples_per_second": 115.178, |
|
"eval_steps_per_second": 14.397, |
|
"step": 7 |
|
}, |
|
{ |
|
"epoch": 1.94, |
|
"eval_accuracy": 0.7931526390870185, |
|
"eval_f1": 0.25925925925925924, |
|
"eval_loss": 0.7849462628364563, |
|
"eval_precision": 0.34146341463414637, |
|
"eval_recall": 0.208955223880597, |
|
"eval_runtime": 0.113, |
|
"eval_samples_per_second": 70.799, |
|
"eval_steps_per_second": 8.85, |
|
"step": 15 |
|
}, |
|
{ |
|
"epoch": 2.97, |
|
"eval_accuracy": 0.8487874465049928, |
|
"eval_f1": 0.484375, |
|
"eval_loss": 0.5964732766151428, |
|
"eval_precision": 0.5081967213114754, |
|
"eval_recall": 0.4626865671641791, |
|
"eval_runtime": 0.0576, |
|
"eval_samples_per_second": 139.001, |
|
"eval_steps_per_second": 17.375, |
|
"step": 23 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_accuracy": 0.8944365192582026, |
|
"eval_f1": 0.6277372262773724, |
|
"eval_loss": 0.5038930773735046, |
|
"eval_precision": 0.6142857142857143, |
|
"eval_recall": 0.6417910447761194, |
|
"eval_runtime": 0.0605, |
|
"eval_samples_per_second": 132.311, |
|
"eval_steps_per_second": 16.539, |
|
"step": 31 |
|
}, |
|
{ |
|
"epoch": 4.9, |
|
"eval_accuracy": 0.891583452211127, |
|
"eval_f1": 0.6293706293706294, |
|
"eval_loss": 0.45688581466674805, |
|
"eval_precision": 0.5921052631578947, |
|
"eval_recall": 0.6716417910447762, |
|
"eval_runtime": 0.0797, |
|
"eval_samples_per_second": 100.319, |
|
"eval_steps_per_second": 12.54, |
|
"step": 38 |
|
}, |
|
{ |
|
"epoch": 5.94, |
|
"eval_accuracy": 0.8887303851640513, |
|
"eval_f1": 0.5899280575539567, |
|
"eval_loss": 0.43453264236450195, |
|
"eval_precision": 0.5694444444444444, |
|
"eval_recall": 0.6119402985074627, |
|
"eval_runtime": 0.0617, |
|
"eval_samples_per_second": 129.645, |
|
"eval_steps_per_second": 16.206, |
|
"step": 46 |
|
}, |
|
{ |
|
"epoch": 6.97, |
|
"eval_accuracy": 0.9072753209700428, |
|
"eval_f1": 0.6225165562913907, |
|
"eval_loss": 0.3776801824569702, |
|
"eval_precision": 0.5595238095238095, |
|
"eval_recall": 0.7014925373134329, |
|
"eval_runtime": 0.0586, |
|
"eval_samples_per_second": 136.463, |
|
"eval_steps_per_second": 17.058, |
|
"step": 54 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_accuracy": 0.9115549215406562, |
|
"eval_f1": 0.6533333333333333, |
|
"eval_loss": 0.379366397857666, |
|
"eval_precision": 0.5903614457831325, |
|
"eval_recall": 0.7313432835820896, |
|
"eval_runtime": 0.0869, |
|
"eval_samples_per_second": 92.01, |
|
"eval_steps_per_second": 11.501, |
|
"step": 62 |
|
}, |
|
{ |
|
"epoch": 8.9, |
|
"eval_accuracy": 0.920114122681883, |
|
"eval_f1": 0.7200000000000001, |
|
"eval_loss": 0.3528553247451782, |
|
"eval_precision": 0.6506024096385542, |
|
"eval_recall": 0.8059701492537313, |
|
"eval_runtime": 0.0586, |
|
"eval_samples_per_second": 136.489, |
|
"eval_steps_per_second": 17.061, |
|
"step": 69 |
|
}, |
|
{ |
|
"epoch": 9.94, |
|
"eval_accuracy": 0.920114122681883, |
|
"eval_f1": 0.7172413793103448, |
|
"eval_loss": 0.38467955589294434, |
|
"eval_precision": 0.6666666666666666, |
|
"eval_recall": 0.7761194029850746, |
|
"eval_runtime": 0.0815, |
|
"eval_samples_per_second": 98.125, |
|
"eval_steps_per_second": 12.266, |
|
"step": 77 |
|
}, |
|
{ |
|
"epoch": 10.97, |
|
"eval_accuracy": 0.920114122681883, |
|
"eval_f1": 0.7346938775510204, |
|
"eval_loss": 0.3774794638156891, |
|
"eval_precision": 0.675, |
|
"eval_recall": 0.8059701492537313, |
|
"eval_runtime": 0.0582, |
|
"eval_samples_per_second": 137.398, |
|
"eval_steps_per_second": 17.175, |
|
"step": 85 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"eval_accuracy": 0.920114122681883, |
|
"eval_f1": 0.7464788732394366, |
|
"eval_loss": 0.3588719367980957, |
|
"eval_precision": 0.7066666666666667, |
|
"eval_recall": 0.7910447761194029, |
|
"eval_runtime": 0.0607, |
|
"eval_samples_per_second": 131.854, |
|
"eval_steps_per_second": 16.482, |
|
"step": 93 |
|
}, |
|
{ |
|
"epoch": 12.9, |
|
"eval_accuracy": 0.9243937232524965, |
|
"eval_f1": 0.7692307692307693, |
|
"eval_loss": 0.358673632144928, |
|
"eval_precision": 0.7236842105263158, |
|
"eval_recall": 0.8208955223880597, |
|
"eval_runtime": 0.0777, |
|
"eval_samples_per_second": 102.924, |
|
"eval_steps_per_second": 12.866, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 13.94, |
|
"eval_accuracy": 0.9144079885877318, |
|
"eval_f1": 0.6973684210526316, |
|
"eval_loss": 0.3642039895057678, |
|
"eval_precision": 0.6235294117647059, |
|
"eval_recall": 0.7910447761194029, |
|
"eval_runtime": 0.0603, |
|
"eval_samples_per_second": 132.64, |
|
"eval_steps_per_second": 16.58, |
|
"step": 108 |
|
}, |
|
{ |
|
"epoch": 14.97, |
|
"eval_accuracy": 0.9144079885877318, |
|
"eval_f1": 0.7066666666666667, |
|
"eval_loss": 0.3640976548194885, |
|
"eval_precision": 0.6385542168674698, |
|
"eval_recall": 0.7910447761194029, |
|
"eval_runtime": 0.1061, |
|
"eval_samples_per_second": 75.406, |
|
"eval_steps_per_second": 9.426, |
|
"step": 116 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"eval_accuracy": 0.9172610556348074, |
|
"eval_f1": 0.7534246575342466, |
|
"eval_loss": 0.3683820962905884, |
|
"eval_precision": 0.6962025316455697, |
|
"eval_recall": 0.8208955223880597, |
|
"eval_runtime": 0.0609, |
|
"eval_samples_per_second": 131.457, |
|
"eval_steps_per_second": 16.432, |
|
"step": 124 |
|
}, |
|
{ |
|
"epoch": 16.9, |
|
"eval_accuracy": 0.9172610556348074, |
|
"eval_f1": 0.7534246575342466, |
|
"eval_loss": 0.3730718493461609, |
|
"eval_precision": 0.6962025316455697, |
|
"eval_recall": 0.8208955223880597, |
|
"eval_runtime": 0.0806, |
|
"eval_samples_per_second": 99.214, |
|
"eval_steps_per_second": 12.402, |
|
"step": 131 |
|
}, |
|
{ |
|
"epoch": 17.94, |
|
"eval_accuracy": 0.9172610556348074, |
|
"eval_f1": 0.738255033557047, |
|
"eval_loss": 0.3693277835845947, |
|
"eval_precision": 0.6707317073170732, |
|
"eval_recall": 0.8208955223880597, |
|
"eval_runtime": 0.0628, |
|
"eval_samples_per_second": 127.442, |
|
"eval_steps_per_second": 15.93, |
|
"step": 139 |
|
}, |
|
{ |
|
"epoch": 18.06, |
|
"eval_accuracy": 0.9172610556348074, |
|
"eval_f1": 0.7333333333333333, |
|
"eval_loss": 0.36928027868270874, |
|
"eval_precision": 0.6626506024096386, |
|
"eval_recall": 0.8208955223880597, |
|
"eval_runtime": 0.0817, |
|
"eval_samples_per_second": 97.898, |
|
"eval_steps_per_second": 12.237, |
|
"step": 140 |
|
}, |
|
{ |
|
"epoch": 18.06, |
|
"step": 140, |
|
"total_flos": 142823207204352.0, |
|
"train_loss": 0.284281131199428, |
|
"train_runtime": 653.9512, |
|
"train_samples_per_second": 3.701, |
|
"train_steps_per_second": 0.214 |
|
} |
|
], |
|
"max_steps": 140, |
|
"num_train_epochs": 20, |
|
"total_flos": 142823207204352.0, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|