{ "best_metric": null, "best_model_checkpoint": null, "epoch": 18.06451612903226, "global_step": 140, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.9, "eval_accuracy": 0.7432239657631954, "eval_f1": 0.0, "eval_loss": 1.1863211393356323, "eval_precision": 0.0, "eval_recall": 0.0, "eval_runtime": 0.0695, "eval_samples_per_second": 115.178, "eval_steps_per_second": 14.397, "step": 7 }, { "epoch": 1.94, "eval_accuracy": 0.7931526390870185, "eval_f1": 0.25925925925925924, "eval_loss": 0.7849462628364563, "eval_precision": 0.34146341463414637, "eval_recall": 0.208955223880597, "eval_runtime": 0.113, "eval_samples_per_second": 70.799, "eval_steps_per_second": 8.85, "step": 15 }, { "epoch": 2.97, "eval_accuracy": 0.8487874465049928, "eval_f1": 0.484375, "eval_loss": 0.5964732766151428, "eval_precision": 0.5081967213114754, "eval_recall": 0.4626865671641791, "eval_runtime": 0.0576, "eval_samples_per_second": 139.001, "eval_steps_per_second": 17.375, "step": 23 }, { "epoch": 4.0, "eval_accuracy": 0.8944365192582026, "eval_f1": 0.6277372262773724, "eval_loss": 0.5038930773735046, "eval_precision": 0.6142857142857143, "eval_recall": 0.6417910447761194, "eval_runtime": 0.0605, "eval_samples_per_second": 132.311, "eval_steps_per_second": 16.539, "step": 31 }, { "epoch": 4.9, "eval_accuracy": 0.891583452211127, "eval_f1": 0.6293706293706294, "eval_loss": 0.45688581466674805, "eval_precision": 0.5921052631578947, "eval_recall": 0.6716417910447762, "eval_runtime": 0.0797, "eval_samples_per_second": 100.319, "eval_steps_per_second": 12.54, "step": 38 }, { "epoch": 5.94, "eval_accuracy": 0.8887303851640513, "eval_f1": 0.5899280575539567, "eval_loss": 0.43453264236450195, "eval_precision": 0.5694444444444444, "eval_recall": 0.6119402985074627, "eval_runtime": 0.0617, "eval_samples_per_second": 129.645, "eval_steps_per_second": 16.206, "step": 46 }, { "epoch": 6.97, "eval_accuracy": 0.9072753209700428, "eval_f1": 0.6225165562913907, "eval_loss": 0.3776801824569702, "eval_precision": 0.5595238095238095, "eval_recall": 0.7014925373134329, "eval_runtime": 0.0586, "eval_samples_per_second": 136.463, "eval_steps_per_second": 17.058, "step": 54 }, { "epoch": 8.0, "eval_accuracy": 0.9115549215406562, "eval_f1": 0.6533333333333333, "eval_loss": 0.379366397857666, "eval_precision": 0.5903614457831325, "eval_recall": 0.7313432835820896, "eval_runtime": 0.0869, "eval_samples_per_second": 92.01, "eval_steps_per_second": 11.501, "step": 62 }, { "epoch": 8.9, "eval_accuracy": 0.920114122681883, "eval_f1": 0.7200000000000001, "eval_loss": 0.3528553247451782, "eval_precision": 0.6506024096385542, "eval_recall": 0.8059701492537313, "eval_runtime": 0.0586, "eval_samples_per_second": 136.489, "eval_steps_per_second": 17.061, "step": 69 }, { "epoch": 9.94, "eval_accuracy": 0.920114122681883, "eval_f1": 0.7172413793103448, "eval_loss": 0.38467955589294434, "eval_precision": 0.6666666666666666, "eval_recall": 0.7761194029850746, "eval_runtime": 0.0815, "eval_samples_per_second": 98.125, "eval_steps_per_second": 12.266, "step": 77 }, { "epoch": 10.97, "eval_accuracy": 0.920114122681883, "eval_f1": 0.7346938775510204, "eval_loss": 0.3774794638156891, "eval_precision": 0.675, "eval_recall": 0.8059701492537313, "eval_runtime": 0.0582, "eval_samples_per_second": 137.398, "eval_steps_per_second": 17.175, "step": 85 }, { "epoch": 12.0, "eval_accuracy": 0.920114122681883, "eval_f1": 0.7464788732394366, "eval_loss": 0.3588719367980957, "eval_precision": 0.7066666666666667, "eval_recall": 0.7910447761194029, "eval_runtime": 0.0607, "eval_samples_per_second": 131.854, "eval_steps_per_second": 16.482, "step": 93 }, { "epoch": 12.9, "eval_accuracy": 0.9243937232524965, "eval_f1": 0.7692307692307693, "eval_loss": 0.358673632144928, "eval_precision": 0.7236842105263158, "eval_recall": 0.8208955223880597, "eval_runtime": 0.0777, "eval_samples_per_second": 102.924, "eval_steps_per_second": 12.866, "step": 100 }, { "epoch": 13.94, "eval_accuracy": 0.9144079885877318, "eval_f1": 0.6973684210526316, "eval_loss": 0.3642039895057678, "eval_precision": 0.6235294117647059, "eval_recall": 0.7910447761194029, "eval_runtime": 0.0603, "eval_samples_per_second": 132.64, "eval_steps_per_second": 16.58, "step": 108 }, { "epoch": 14.97, "eval_accuracy": 0.9144079885877318, "eval_f1": 0.7066666666666667, "eval_loss": 0.3640976548194885, "eval_precision": 0.6385542168674698, "eval_recall": 0.7910447761194029, "eval_runtime": 0.1061, "eval_samples_per_second": 75.406, "eval_steps_per_second": 9.426, "step": 116 }, { "epoch": 16.0, "eval_accuracy": 0.9172610556348074, "eval_f1": 0.7534246575342466, "eval_loss": 0.3683820962905884, "eval_precision": 0.6962025316455697, "eval_recall": 0.8208955223880597, "eval_runtime": 0.0609, "eval_samples_per_second": 131.457, "eval_steps_per_second": 16.432, "step": 124 }, { "epoch": 16.9, "eval_accuracy": 0.9172610556348074, "eval_f1": 0.7534246575342466, "eval_loss": 0.3730718493461609, "eval_precision": 0.6962025316455697, "eval_recall": 0.8208955223880597, "eval_runtime": 0.0806, "eval_samples_per_second": 99.214, "eval_steps_per_second": 12.402, "step": 131 }, { "epoch": 17.94, "eval_accuracy": 0.9172610556348074, "eval_f1": 0.738255033557047, "eval_loss": 0.3693277835845947, "eval_precision": 0.6707317073170732, "eval_recall": 0.8208955223880597, "eval_runtime": 0.0628, "eval_samples_per_second": 127.442, "eval_steps_per_second": 15.93, "step": 139 }, { "epoch": 18.06, "eval_accuracy": 0.9172610556348074, "eval_f1": 0.7333333333333333, "eval_loss": 0.36928027868270874, "eval_precision": 0.6626506024096386, "eval_recall": 0.8208955223880597, "eval_runtime": 0.0817, "eval_samples_per_second": 97.898, "eval_steps_per_second": 12.237, "step": 140 }, { "epoch": 18.06, "step": 140, "total_flos": 142823207204352.0, "train_loss": 0.284281131199428, "train_runtime": 653.9512, "train_samples_per_second": 3.701, "train_steps_per_second": 0.214 } ], "max_steps": 140, "num_train_epochs": 20, "total_flos": 142823207204352.0, "trial_name": null, "trial_params": null }