{"current_steps": 1, "total_steps": 560, "loss": 0.7247, "learning_rate": 1.7857142857142857e-06, "epoch": 0.017777777777777778, "percentage": 0.18, "elapsed_time": "0:00:29", "remaining_time": "4:39:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2, "total_steps": 560, "loss": 0.6432, "learning_rate": 3.5714285714285714e-06, "epoch": 0.035555555555555556, "percentage": 0.36, "elapsed_time": "0:01:03", "remaining_time": "4:56:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3, "total_steps": 560, "loss": 0.6158, "learning_rate": 5.357142857142857e-06, "epoch": 0.05333333333333334, "percentage": 0.54, "elapsed_time": "0:01:48", "remaining_time": "5:36:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4, "total_steps": 560, "loss": 0.6322, "learning_rate": 7.142857142857143e-06, "epoch": 0.07111111111111111, "percentage": 0.71, "elapsed_time": "0:02:24", "remaining_time": "5:33:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5, "total_steps": 560, "loss": 0.5955, "learning_rate": 8.92857142857143e-06, "epoch": 0.08888888888888889, "percentage": 0.89, "elapsed_time": "0:03:09", "remaining_time": "5:50:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6, "total_steps": 560, "loss": 0.6794, "learning_rate": 1.0714285714285714e-05, "epoch": 0.10666666666666667, "percentage": 1.07, "elapsed_time": "0:03:44", "remaining_time": "5:45:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7, "total_steps": 560, "loss": 0.5716, "learning_rate": 1.25e-05, "epoch": 0.12444444444444444, "percentage": 1.25, "elapsed_time": "0:04:31", "remaining_time": "5:56:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8, "total_steps": 560, "loss": 0.6785, "learning_rate": 1.4285714285714285e-05, "epoch": 0.14222222222222222, "percentage": 1.43, "elapsed_time": "0:05:07", "remaining_time": "5:53:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9, "total_steps": 560, "loss": 0.5768, "learning_rate": 1.6071428571428572e-05, "epoch": 0.16, "percentage": 1.61, "elapsed_time": "0:05:54", "remaining_time": "6:01:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10, "total_steps": 560, "loss": 0.653, "learning_rate": 1.785714285714286e-05, "epoch": 0.17777777777777778, "percentage": 1.79, "elapsed_time": "0:06:22", "remaining_time": "5:50:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11, "total_steps": 560, "loss": 0.608, "learning_rate": 1.9642857142857145e-05, "epoch": 0.19555555555555557, "percentage": 1.96, "elapsed_time": "0:06:55", "remaining_time": "5:45:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12, "total_steps": 560, "loss": 0.6273, "learning_rate": 2.1428571428571428e-05, "epoch": 0.21333333333333335, "percentage": 2.14, "elapsed_time": "0:07:31", "remaining_time": "5:43:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13, "total_steps": 560, "loss": 0.5894, "learning_rate": 2.3214285714285715e-05, "epoch": 0.2311111111111111, "percentage": 2.32, "elapsed_time": "0:08:03", "remaining_time": "5:39:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14, "total_steps": 560, "loss": 0.6952, "learning_rate": 2.5e-05, "epoch": 0.24888888888888888, "percentage": 2.5, "elapsed_time": "0:08:26", "remaining_time": "5:29:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15, "total_steps": 560, "loss": 0.695, "learning_rate": 2.6785714285714288e-05, "epoch": 0.26666666666666666, "percentage": 2.68, "elapsed_time": "0:08:50", "remaining_time": "5:20:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16, "total_steps": 560, "loss": 0.5933, "learning_rate": 2.857142857142857e-05, "epoch": 0.28444444444444444, "percentage": 2.86, "elapsed_time": "0:09:20", "remaining_time": "5:17:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17, "total_steps": 560, "loss": 0.5422, "learning_rate": 3.0357142857142857e-05, "epoch": 0.3022222222222222, "percentage": 3.04, "elapsed_time": "0:09:51", "remaining_time": "5:15:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18, "total_steps": 560, "loss": 0.5283, "learning_rate": 3.2142857142857144e-05, "epoch": 0.32, "percentage": 3.21, "elapsed_time": "0:10:19", "remaining_time": "5:10:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19, "total_steps": 560, "loss": 0.5295, "learning_rate": 3.392857142857143e-05, "epoch": 0.3377777777777778, "percentage": 3.39, "elapsed_time": "0:10:51", "remaining_time": "5:08:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20, "total_steps": 560, "loss": 0.4891, "learning_rate": 3.571428571428572e-05, "epoch": 0.35555555555555557, "percentage": 3.57, "elapsed_time": "0:11:27", "remaining_time": "5:09:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21, "total_steps": 560, "loss": 0.5169, "learning_rate": 3.7500000000000003e-05, "epoch": 0.37333333333333335, "percentage": 3.75, "elapsed_time": "0:12:05", "remaining_time": "5:10:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22, "total_steps": 560, "loss": 0.5211, "learning_rate": 3.928571428571429e-05, "epoch": 0.39111111111111113, "percentage": 3.93, "elapsed_time": "0:12:37", "remaining_time": "5:08:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23, "total_steps": 560, "loss": 0.4661, "learning_rate": 4.107142857142857e-05, "epoch": 0.4088888888888889, "percentage": 4.11, "elapsed_time": "0:13:19", "remaining_time": "5:11:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24, "total_steps": 560, "loss": 0.4794, "learning_rate": 4.2857142857142856e-05, "epoch": 0.4266666666666667, "percentage": 4.29, "elapsed_time": "0:13:58", "remaining_time": "5:12:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 25, "total_steps": 560, "loss": 0.4965, "learning_rate": 4.464285714285715e-05, "epoch": 0.4444444444444444, "percentage": 4.46, "elapsed_time": "0:14:32", "remaining_time": "5:11:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 26, "total_steps": 560, "loss": 0.8358, "learning_rate": 4.642857142857143e-05, "epoch": 0.4622222222222222, "percentage": 4.64, "elapsed_time": "0:14:58", "remaining_time": "5:07:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 27, "total_steps": 560, "loss": 0.4957, "learning_rate": 4.8214285714285716e-05, "epoch": 0.48, "percentage": 4.82, "elapsed_time": "0:15:18", "remaining_time": "5:02:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 28, "total_steps": 560, "loss": 0.5393, "learning_rate": 5e-05, "epoch": 0.49777777777777776, "percentage": 5.0, "elapsed_time": "0:15:46", "remaining_time": "4:59:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 29, "total_steps": 560, "loss": 0.5784, "learning_rate": 5.1785714285714296e-05, "epoch": 0.5155555555555555, "percentage": 5.18, "elapsed_time": "0:16:02", "remaining_time": "4:53:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 30, "total_steps": 560, "loss": 0.4446, "learning_rate": 5.3571428571428575e-05, "epoch": 0.5333333333333333, "percentage": 5.36, "elapsed_time": "0:16:29", "remaining_time": "4:51:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 31, "total_steps": 560, "loss": 0.3995, "learning_rate": 5.535714285714286e-05, "epoch": 0.5511111111111111, "percentage": 5.54, "elapsed_time": "0:16:55", "remaining_time": "4:48:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 32, "total_steps": 560, "loss": 0.3399, "learning_rate": 5.714285714285714e-05, "epoch": 0.5688888888888889, "percentage": 5.71, "elapsed_time": "0:17:37", "remaining_time": "4:50:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 33, "total_steps": 560, "loss": 0.3983, "learning_rate": 5.8928571428571435e-05, "epoch": 0.5866666666666667, "percentage": 5.89, "elapsed_time": "0:18:07", "remaining_time": "4:49:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 34, "total_steps": 560, "loss": 0.3831, "learning_rate": 6.0714285714285715e-05, "epoch": 0.6044444444444445, "percentage": 6.07, "elapsed_time": "0:18:32", "remaining_time": "4:46:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 35, "total_steps": 560, "loss": 0.3359, "learning_rate": 6.25e-05, "epoch": 0.6222222222222222, "percentage": 6.25, "elapsed_time": "0:19:06", "remaining_time": "4:46:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 36, "total_steps": 560, "loss": 0.3597, "learning_rate": 6.428571428571429e-05, "epoch": 0.64, "percentage": 6.43, "elapsed_time": "0:19:27", "remaining_time": "4:43:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 37, "total_steps": 560, "loss": 0.4061, "learning_rate": 6.607142857142857e-05, "epoch": 0.6577777777777778, "percentage": 6.61, "elapsed_time": "0:19:58", "remaining_time": "4:42:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 38, "total_steps": 560, "loss": 0.3533, "learning_rate": 6.785714285714286e-05, "epoch": 0.6755555555555556, "percentage": 6.79, "elapsed_time": "0:20:38", "remaining_time": "4:43:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 39, "total_steps": 560, "loss": 0.3598, "learning_rate": 6.964285714285715e-05, "epoch": 0.6933333333333334, "percentage": 6.96, "elapsed_time": "0:21:09", "remaining_time": "4:42:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 40, "total_steps": 560, "loss": 0.3796, "learning_rate": 7.142857142857143e-05, "epoch": 0.7111111111111111, "percentage": 7.14, "elapsed_time": "0:21:34", "remaining_time": "4:40:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 41, "total_steps": 560, "loss": 0.4386, "learning_rate": 7.321428571428571e-05, "epoch": 0.7288888888888889, "percentage": 7.32, "elapsed_time": "0:22:04", "remaining_time": "4:39:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 42, "total_steps": 560, "loss": 0.3265, "learning_rate": 7.500000000000001e-05, "epoch": 0.7466666666666667, "percentage": 7.5, "elapsed_time": "0:22:38", "remaining_time": "4:39:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 43, "total_steps": 560, "loss": 0.3344, "learning_rate": 7.67857142857143e-05, "epoch": 0.7644444444444445, "percentage": 7.68, "elapsed_time": "0:23:09", "remaining_time": "4:38:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 44, "total_steps": 560, "loss": 0.3514, "learning_rate": 7.857142857142858e-05, "epoch": 0.7822222222222223, "percentage": 7.86, "elapsed_time": "0:23:31", "remaining_time": "4:35:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 45, "total_steps": 560, "loss": 0.3258, "learning_rate": 8.035714285714287e-05, "epoch": 0.8, "percentage": 8.04, "elapsed_time": "0:23:58", "remaining_time": "4:34:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 46, "total_steps": 560, "loss": 0.3228, "learning_rate": 8.214285714285714e-05, "epoch": 0.8177777777777778, "percentage": 8.21, "elapsed_time": "0:24:35", "remaining_time": "4:34:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 47, "total_steps": 560, "loss": 0.3752, "learning_rate": 8.392857142857144e-05, "epoch": 0.8355555555555556, "percentage": 8.39, "elapsed_time": "0:25:08", "remaining_time": "4:34:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 48, "total_steps": 560, "loss": 0.3656, "learning_rate": 8.571428571428571e-05, "epoch": 0.8533333333333334, "percentage": 8.57, "elapsed_time": "0:25:36", "remaining_time": "4:33:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 49, "total_steps": 560, "loss": 0.3254, "learning_rate": 8.75e-05, "epoch": 0.8711111111111111, "percentage": 8.75, "elapsed_time": "0:26:15", "remaining_time": "4:33:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 50, "total_steps": 560, "loss": 0.2911, "learning_rate": 8.92857142857143e-05, "epoch": 0.8888888888888888, "percentage": 8.93, "elapsed_time": "0:26:54", "remaining_time": "4:34:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 51, "total_steps": 560, "loss": 0.3641, "learning_rate": 9.107142857142857e-05, "epoch": 0.9066666666666666, "percentage": 9.11, "elapsed_time": "0:27:32", "remaining_time": "4:34:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 52, "total_steps": 560, "loss": 0.3164, "learning_rate": 9.285714285714286e-05, "epoch": 0.9244444444444444, "percentage": 9.29, "elapsed_time": "0:27:54", "remaining_time": "4:32:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 53, "total_steps": 560, "loss": 0.3216, "learning_rate": 9.464285714285715e-05, "epoch": 0.9422222222222222, "percentage": 9.46, "elapsed_time": "0:28:25", "remaining_time": "4:31:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 54, "total_steps": 560, "loss": 0.4645, "learning_rate": 9.642857142857143e-05, "epoch": 0.96, "percentage": 9.64, "elapsed_time": "0:28:45", "remaining_time": "4:29:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 55, "total_steps": 560, "loss": 0.341, "learning_rate": 9.821428571428572e-05, "epoch": 0.9777777777777777, "percentage": 9.82, "elapsed_time": "0:29:08", "remaining_time": "4:27:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 56, "total_steps": 560, "loss": 0.3029, "learning_rate": 0.0001, "epoch": 0.9955555555555555, "percentage": 10.0, "elapsed_time": "0:29:50", "remaining_time": "4:28:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 57, "total_steps": 560, "loss": 0.3005, "learning_rate": 9.999902864657691e-05, "epoch": 1.0133333333333334, "percentage": 10.18, "elapsed_time": "0:30:31", "remaining_time": "4:29:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 58, "total_steps": 560, "loss": 0.3182, "learning_rate": 9.999611462404875e-05, "epoch": 1.031111111111111, "percentage": 10.36, "elapsed_time": "0:30:57", "remaining_time": "4:28:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 59, "total_steps": 560, "loss": 0.4438, "learning_rate": 9.999125804563732e-05, "epoch": 1.048888888888889, "percentage": 10.54, "elapsed_time": "0:31:24", "remaining_time": "4:26:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 60, "total_steps": 560, "loss": 0.3115, "learning_rate": 9.998445910004082e-05, "epoch": 1.0666666666666667, "percentage": 10.71, "elapsed_time": "0:32:00", "remaining_time": "4:26:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 61, "total_steps": 560, "loss": 0.4094, "learning_rate": 9.997571805142639e-05, "epoch": 1.0844444444444445, "percentage": 10.89, "elapsed_time": "0:32:22", "remaining_time": "4:24:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 62, "total_steps": 560, "loss": 0.3135, "learning_rate": 9.996503523941994e-05, "epoch": 1.1022222222222222, "percentage": 11.07, "elapsed_time": "0:32:51", "remaining_time": "4:23:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 63, "total_steps": 560, "loss": 0.2901, "learning_rate": 9.99524110790929e-05, "epoch": 1.12, "percentage": 11.25, "elapsed_time": "0:33:24", "remaining_time": "4:23:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 64, "total_steps": 560, "loss": 0.3178, "learning_rate": 9.993784606094612e-05, "epoch": 1.1377777777777778, "percentage": 11.43, "elapsed_time": "0:33:49", "remaining_time": "4:22:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 65, "total_steps": 560, "loss": 0.3534, "learning_rate": 9.992134075089084e-05, "epoch": 1.1555555555555554, "percentage": 11.61, "elapsed_time": "0:34:08", "remaining_time": "4:20:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 66, "total_steps": 560, "loss": 0.3155, "learning_rate": 9.99028957902266e-05, "epoch": 1.1733333333333333, "percentage": 11.79, "elapsed_time": "0:34:36", "remaining_time": "4:18:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 67, "total_steps": 560, "loss": 0.3555, "learning_rate": 9.988251189561645e-05, "epoch": 1.1911111111111112, "percentage": 11.96, "elapsed_time": "0:35:12", "remaining_time": "4:19:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 68, "total_steps": 560, "loss": 0.33, "learning_rate": 9.986018985905901e-05, "epoch": 1.208888888888889, "percentage": 12.14, "elapsed_time": "0:35:46", "remaining_time": "4:18:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 69, "total_steps": 560, "loss": 0.3499, "learning_rate": 9.983593054785776e-05, "epoch": 1.2266666666666666, "percentage": 12.32, "elapsed_time": "0:36:13", "remaining_time": "4:17:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 70, "total_steps": 560, "loss": 0.353, "learning_rate": 9.980973490458728e-05, "epoch": 1.2444444444444445, "percentage": 12.5, "elapsed_time": "0:36:36", "remaining_time": "4:16:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 71, "total_steps": 560, "loss": 0.2993, "learning_rate": 9.978160394705668e-05, "epoch": 1.2622222222222224, "percentage": 12.68, "elapsed_time": "0:37:00", "remaining_time": "4:14:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 72, "total_steps": 560, "loss": 0.3122, "learning_rate": 9.975153876827008e-05, "epoch": 1.28, "percentage": 12.86, "elapsed_time": "0:37:27", "remaining_time": "4:13:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 73, "total_steps": 560, "loss": 0.3258, "learning_rate": 9.971954053638399e-05, "epoch": 1.2977777777777777, "percentage": 13.04, "elapsed_time": "0:37:54", "remaining_time": "4:12:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 74, "total_steps": 560, "loss": 0.3835, "learning_rate": 9.968561049466214e-05, "epoch": 1.3155555555555556, "percentage": 13.21, "elapsed_time": "0:38:16", "remaining_time": "4:11:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 75, "total_steps": 560, "loss": 0.2817, "learning_rate": 9.964974996142698e-05, "epoch": 1.3333333333333333, "percentage": 13.39, "elapsed_time": "0:39:04", "remaining_time": "4:12:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 76, "total_steps": 560, "loss": 0.2828, "learning_rate": 9.961196033000861e-05, "epoch": 1.3511111111111112, "percentage": 13.57, "elapsed_time": "0:39:41", "remaining_time": "4:12:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 77, "total_steps": 560, "loss": 0.3253, "learning_rate": 9.957224306869053e-05, "epoch": 1.3688888888888888, "percentage": 13.75, "elapsed_time": "0:40:04", "remaining_time": "4:11:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 78, "total_steps": 560, "loss": 0.3215, "learning_rate": 9.953059972065265e-05, "epoch": 1.3866666666666667, "percentage": 13.93, "elapsed_time": "0:40:32", "remaining_time": "4:10:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 79, "total_steps": 560, "loss": 0.323, "learning_rate": 9.948703190391131e-05, "epoch": 1.4044444444444444, "percentage": 14.11, "elapsed_time": "0:41:09", "remaining_time": "4:10:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 80, "total_steps": 560, "loss": 0.2962, "learning_rate": 9.944154131125642e-05, "epoch": 1.4222222222222223, "percentage": 14.29, "elapsed_time": "0:41:45", "remaining_time": "4:10:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 81, "total_steps": 560, "loss": 0.314, "learning_rate": 9.939412971018574e-05, "epoch": 1.44, "percentage": 14.46, "elapsed_time": "0:42:29", "remaining_time": "4:11:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 82, "total_steps": 560, "loss": 0.2828, "learning_rate": 9.934479894283606e-05, "epoch": 1.4577777777777778, "percentage": 14.64, "elapsed_time": "0:43:00", "remaining_time": "4:10:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 83, "total_steps": 560, "loss": 0.3124, "learning_rate": 9.92935509259118e-05, "epoch": 1.4755555555555555, "percentage": 14.82, "elapsed_time": "0:43:27", "remaining_time": "4:09:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 84, "total_steps": 560, "loss": 0.2861, "learning_rate": 9.924038765061042e-05, "epoch": 1.4933333333333334, "percentage": 15.0, "elapsed_time": "0:44:04", "remaining_time": "4:09:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 85, "total_steps": 560, "loss": 0.286, "learning_rate": 9.918531118254507e-05, "epoch": 1.511111111111111, "percentage": 15.18, "elapsed_time": "0:44:32", "remaining_time": "4:08:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 86, "total_steps": 560, "loss": 0.307, "learning_rate": 9.912832366166442e-05, "epoch": 1.528888888888889, "percentage": 15.36, "elapsed_time": "0:45:08", "remaining_time": "4:08:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 87, "total_steps": 560, "loss": 0.3053, "learning_rate": 9.906942730216939e-05, "epoch": 1.5466666666666666, "percentage": 15.54, "elapsed_time": "0:45:34", "remaining_time": "4:07:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 88, "total_steps": 560, "loss": 0.3108, "learning_rate": 9.900862439242719e-05, "epoch": 1.5644444444444443, "percentage": 15.71, "elapsed_time": "0:45:57", "remaining_time": "4:06:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 89, "total_steps": 560, "loss": 0.3178, "learning_rate": 9.894591729488242e-05, "epoch": 1.5822222222222222, "percentage": 15.89, "elapsed_time": "0:46:39", "remaining_time": "4:06:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 90, "total_steps": 560, "loss": 0.303, "learning_rate": 9.888130844596524e-05, "epoch": 1.6, "percentage": 16.07, "elapsed_time": "0:47:08", "remaining_time": "4:06:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 91, "total_steps": 560, "loss": 0.3503, "learning_rate": 9.881480035599667e-05, "epoch": 1.6177777777777778, "percentage": 16.25, "elapsed_time": "0:47:39", "remaining_time": "4:05:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 92, "total_steps": 560, "loss": 0.2876, "learning_rate": 9.874639560909117e-05, "epoch": 1.6355555555555554, "percentage": 16.43, "elapsed_time": "0:48:17", "remaining_time": "4:05:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 93, "total_steps": 560, "loss": 0.2937, "learning_rate": 9.867609686305617e-05, "epoch": 1.6533333333333333, "percentage": 16.61, "elapsed_time": "0:48:42", "remaining_time": "4:04:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 94, "total_steps": 560, "loss": 0.3155, "learning_rate": 9.860390684928873e-05, "epoch": 1.6711111111111112, "percentage": 16.79, "elapsed_time": "0:49:14", "remaining_time": "4:04:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 95, "total_steps": 560, "loss": 0.276, "learning_rate": 9.852982837266955e-05, "epoch": 1.6888888888888889, "percentage": 16.96, "elapsed_time": "0:49:50", "remaining_time": "4:03:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 96, "total_steps": 560, "loss": 0.2831, "learning_rate": 9.84538643114539e-05, "epoch": 1.7066666666666666, "percentage": 17.14, "elapsed_time": "0:50:17", "remaining_time": "4:03:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 97, "total_steps": 560, "loss": 0.2964, "learning_rate": 9.837601761715983e-05, "epoch": 1.7244444444444444, "percentage": 17.32, "elapsed_time": "0:50:51", "remaining_time": "4:02:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 98, "total_steps": 560, "loss": 0.2814, "learning_rate": 9.829629131445342e-05, "epoch": 1.7422222222222223, "percentage": 17.5, "elapsed_time": "0:51:21", "remaining_time": "4:02:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 99, "total_steps": 560, "loss": 0.2806, "learning_rate": 9.82146885010314e-05, "epoch": 1.76, "percentage": 17.68, "elapsed_time": "0:52:06", "remaining_time": "4:02:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 100, "total_steps": 560, "loss": 0.3065, "learning_rate": 9.81312123475006e-05, "epoch": 1.7777777777777777, "percentage": 17.86, "elapsed_time": "0:52:29", "remaining_time": "4:01:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 101, "total_steps": 560, "loss": 0.311, "learning_rate": 9.804586609725499e-05, "epoch": 1.7955555555555556, "percentage": 18.04, "elapsed_time": "0:53:05", "remaining_time": "4:01:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 102, "total_steps": 560, "loss": 0.3003, "learning_rate": 9.79586530663494e-05, "epoch": 1.8133333333333335, "percentage": 18.21, "elapsed_time": "0:53:34", "remaining_time": "4:00:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 103, "total_steps": 560, "loss": 0.2727, "learning_rate": 9.78695766433709e-05, "epoch": 1.8311111111111111, "percentage": 18.39, "elapsed_time": "0:54:05", "remaining_time": "3:59:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 104, "total_steps": 560, "loss": 0.2834, "learning_rate": 9.777864028930705e-05, "epoch": 1.8488888888888888, "percentage": 18.57, "elapsed_time": "0:54:29", "remaining_time": "3:58:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 105, "total_steps": 560, "loss": 0.2806, "learning_rate": 9.768584753741134e-05, "epoch": 1.8666666666666667, "percentage": 18.75, "elapsed_time": "0:55:11", "remaining_time": "3:59:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 106, "total_steps": 560, "loss": 0.2951, "learning_rate": 9.759120199306613e-05, "epoch": 1.8844444444444446, "percentage": 18.93, "elapsed_time": "0:55:40", "remaining_time": "3:58:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 107, "total_steps": 560, "loss": 0.2975, "learning_rate": 9.74947073336423e-05, "epoch": 1.9022222222222223, "percentage": 19.11, "elapsed_time": "0:56:15", "remaining_time": "3:58:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 108, "total_steps": 560, "loss": 0.2677, "learning_rate": 9.73963673083566e-05, "epoch": 1.92, "percentage": 19.29, "elapsed_time": "0:56:51", "remaining_time": "3:57:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 109, "total_steps": 560, "loss": 0.3219, "learning_rate": 9.72961857381258e-05, "epoch": 1.9377777777777778, "percentage": 19.46, "elapsed_time": "0:57:25", "remaining_time": "3:57:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 110, "total_steps": 560, "loss": 0.2631, "learning_rate": 9.719416651541839e-05, "epoch": 1.9555555555555557, "percentage": 19.64, "elapsed_time": "0:57:51", "remaining_time": "3:56:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 111, "total_steps": 560, "loss": 0.2788, "learning_rate": 9.709031360410318e-05, "epoch": 1.9733333333333334, "percentage": 19.82, "elapsed_time": "0:58:17", "remaining_time": "3:55:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 112, "total_steps": 560, "loss": 0.2723, "learning_rate": 9.698463103929542e-05, "epoch": 1.991111111111111, "percentage": 20.0, "elapsed_time": "0:58:56", "remaining_time": "3:55:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 113, "total_steps": 560, "loss": 0.3279, "learning_rate": 9.687712292719997e-05, "epoch": 2.008888888888889, "percentage": 20.18, "elapsed_time": "0:59:30", "remaining_time": "3:55:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 114, "total_steps": 560, "loss": 0.2708, "learning_rate": 9.67677934449517e-05, "epoch": 2.026666666666667, "percentage": 20.36, "elapsed_time": "0:59:56", "remaining_time": "3:54:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 115, "total_steps": 560, "loss": 0.2801, "learning_rate": 9.665664684045333e-05, "epoch": 2.0444444444444443, "percentage": 20.54, "elapsed_time": "1:00:25", "remaining_time": "3:53:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 116, "total_steps": 560, "loss": 0.218, "learning_rate": 9.654368743221022e-05, "epoch": 2.062222222222222, "percentage": 20.71, "elapsed_time": "1:00:59", "remaining_time": "3:53:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 117, "total_steps": 560, "loss": 0.2865, "learning_rate": 9.642891960916268e-05, "epoch": 2.08, "percentage": 20.89, "elapsed_time": "1:01:30", "remaining_time": "3:52:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 118, "total_steps": 560, "loss": 0.2866, "learning_rate": 9.631234783051544e-05, "epoch": 2.097777777777778, "percentage": 21.07, "elapsed_time": "1:02:03", "remaining_time": "3:52:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 119, "total_steps": 560, "loss": 0.2776, "learning_rate": 9.619397662556435e-05, "epoch": 2.1155555555555554, "percentage": 21.25, "elapsed_time": "1:02:38", "remaining_time": "3:52:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 120, "total_steps": 560, "loss": 0.2655, "learning_rate": 9.607381059352038e-05, "epoch": 2.1333333333333333, "percentage": 21.43, "elapsed_time": "1:03:14", "remaining_time": "3:51:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 121, "total_steps": 560, "loss": 0.3282, "learning_rate": 9.595185440333103e-05, "epoch": 2.151111111111111, "percentage": 21.61, "elapsed_time": "1:03:42", "remaining_time": "3:51:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 122, "total_steps": 560, "loss": 0.3087, "learning_rate": 9.582811279349882e-05, "epoch": 2.168888888888889, "percentage": 21.79, "elapsed_time": "1:03:59", "remaining_time": "3:49:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 123, "total_steps": 560, "loss": 0.2924, "learning_rate": 9.570259057189717e-05, "epoch": 2.1866666666666665, "percentage": 21.96, "elapsed_time": "1:04:30", "remaining_time": "3:49:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 124, "total_steps": 560, "loss": 0.2613, "learning_rate": 9.557529261558367e-05, "epoch": 2.2044444444444444, "percentage": 22.14, "elapsed_time": "1:05:08", "remaining_time": "3:49:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 125, "total_steps": 560, "loss": 0.2574, "learning_rate": 9.544622387061055e-05, "epoch": 2.2222222222222223, "percentage": 22.32, "elapsed_time": "1:05:49", "remaining_time": "3:49:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 126, "total_steps": 560, "loss": 0.2883, "learning_rate": 9.53153893518325e-05, "epoch": 2.24, "percentage": 22.5, "elapsed_time": "1:06:25", "remaining_time": "3:48:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 127, "total_steps": 560, "loss": 0.3131, "learning_rate": 9.518279414271183e-05, "epoch": 2.2577777777777777, "percentage": 22.68, "elapsed_time": "1:06:45", "remaining_time": "3:47:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 128, "total_steps": 560, "loss": 0.3184, "learning_rate": 9.504844339512095e-05, "epoch": 2.2755555555555556, "percentage": 22.86, "elapsed_time": "1:07:25", "remaining_time": "3:47:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 129, "total_steps": 560, "loss": 0.2794, "learning_rate": 9.491234232914221e-05, "epoch": 2.2933333333333334, "percentage": 23.04, "elapsed_time": "1:07:58", "remaining_time": "3:47:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 130, "total_steps": 560, "loss": 0.2884, "learning_rate": 9.477449623286505e-05, "epoch": 2.311111111111111, "percentage": 23.21, "elapsed_time": "1:08:36", "remaining_time": "3:46:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 131, "total_steps": 560, "loss": 0.2655, "learning_rate": 9.463491046218058e-05, "epoch": 2.328888888888889, "percentage": 23.39, "elapsed_time": "1:09:11", "remaining_time": "3:46:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 132, "total_steps": 560, "loss": 0.2611, "learning_rate": 9.449359044057345e-05, "epoch": 2.3466666666666667, "percentage": 23.57, "elapsed_time": "1:09:40", "remaining_time": "3:45:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 133, "total_steps": 560, "loss": 0.2589, "learning_rate": 9.435054165891109e-05, "epoch": 2.3644444444444446, "percentage": 23.75, "elapsed_time": "1:10:11", "remaining_time": "3:45:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 134, "total_steps": 560, "loss": 0.3022, "learning_rate": 9.420576967523049e-05, "epoch": 2.3822222222222225, "percentage": 23.93, "elapsed_time": "1:10:44", "remaining_time": "3:44:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 135, "total_steps": 560, "loss": 0.2498, "learning_rate": 9.405928011452211e-05, "epoch": 2.4, "percentage": 24.11, "elapsed_time": "1:11:25", "remaining_time": "3:44:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 136, "total_steps": 560, "loss": 0.2636, "learning_rate": 9.391107866851143e-05, "epoch": 2.417777777777778, "percentage": 24.29, "elapsed_time": "1:12:01", "remaining_time": "3:44:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 137, "total_steps": 560, "loss": 0.25, "learning_rate": 9.376117109543769e-05, "epoch": 2.4355555555555557, "percentage": 24.46, "elapsed_time": "1:12:34", "remaining_time": "3:44:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 138, "total_steps": 560, "loss": 0.2435, "learning_rate": 9.360956321983028e-05, "epoch": 2.453333333333333, "percentage": 24.64, "elapsed_time": "1:13:05", "remaining_time": "3:43:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 139, "total_steps": 560, "loss": 0.2427, "learning_rate": 9.345626093228233e-05, "epoch": 2.471111111111111, "percentage": 24.82, "elapsed_time": "1:13:28", "remaining_time": "3:42:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 140, "total_steps": 560, "loss": 0.2897, "learning_rate": 9.330127018922194e-05, "epoch": 2.488888888888889, "percentage": 25.0, "elapsed_time": "1:14:01", "remaining_time": "3:42:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 141, "total_steps": 560, "loss": 0.2833, "learning_rate": 9.314459701268065e-05, "epoch": 2.506666666666667, "percentage": 25.18, "elapsed_time": "1:14:33", "remaining_time": "3:41:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 142, "total_steps": 560, "loss": 0.2698, "learning_rate": 9.298624749005951e-05, "epoch": 2.5244444444444447, "percentage": 25.36, "elapsed_time": "1:15:09", "remaining_time": "3:41:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 143, "total_steps": 560, "loss": 0.2372, "learning_rate": 9.282622777389258e-05, "epoch": 2.542222222222222, "percentage": 25.54, "elapsed_time": "1:15:41", "remaining_time": "3:40:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 144, "total_steps": 560, "loss": 0.2756, "learning_rate": 9.266454408160779e-05, "epoch": 2.56, "percentage": 25.71, "elapsed_time": "1:16:12", "remaining_time": "3:40:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 145, "total_steps": 560, "loss": 0.2661, "learning_rate": 9.250120269528546e-05, "epoch": 2.5777777777777775, "percentage": 25.89, "elapsed_time": "1:16:55", "remaining_time": "3:40:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 146, "total_steps": 560, "loss": 0.2945, "learning_rate": 9.233620996141421e-05, "epoch": 2.5955555555555554, "percentage": 26.07, "elapsed_time": "1:17:16", "remaining_time": "3:39:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 147, "total_steps": 560, "loss": 0.2391, "learning_rate": 9.21695722906443e-05, "epoch": 2.6133333333333333, "percentage": 26.25, "elapsed_time": "1:17:47", "remaining_time": "3:38:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 148, "total_steps": 560, "loss": 0.2664, "learning_rate": 9.200129615753859e-05, "epoch": 2.631111111111111, "percentage": 26.43, "elapsed_time": "1:18:17", "remaining_time": "3:37:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 149, "total_steps": 560, "loss": 0.2371, "learning_rate": 9.183138810032099e-05, "epoch": 2.648888888888889, "percentage": 26.61, "elapsed_time": "1:18:46", "remaining_time": "3:37:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 150, "total_steps": 560, "loss": 0.2883, "learning_rate": 9.165985472062246e-05, "epoch": 2.6666666666666665, "percentage": 26.79, "elapsed_time": "1:19:18", "remaining_time": "3:36:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 151, "total_steps": 560, "loss": 0.2572, "learning_rate": 9.148670268322438e-05, "epoch": 2.6844444444444444, "percentage": 26.96, "elapsed_time": "1:19:49", "remaining_time": "3:36:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 152, "total_steps": 560, "loss": 0.2423, "learning_rate": 9.131193871579975e-05, "epoch": 2.7022222222222223, "percentage": 27.14, "elapsed_time": "1:20:21", "remaining_time": "3:35:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 153, "total_steps": 560, "loss": 0.2453, "learning_rate": 9.113556960865167e-05, "epoch": 2.7199999999999998, "percentage": 27.32, "elapsed_time": "1:20:49", "remaining_time": "3:35:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 154, "total_steps": 560, "loss": 0.2297, "learning_rate": 9.09576022144496e-05, "epoch": 2.7377777777777776, "percentage": 27.5, "elapsed_time": "1:21:20", "remaining_time": "3:34:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 155, "total_steps": 560, "loss": 0.2865, "learning_rate": 9.077804344796302e-05, "epoch": 2.7555555555555555, "percentage": 27.68, "elapsed_time": "1:21:45", "remaining_time": "3:33:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 156, "total_steps": 560, "loss": 0.2567, "learning_rate": 9.059690028579284e-05, "epoch": 2.7733333333333334, "percentage": 27.86, "elapsed_time": "1:22:15", "remaining_time": "3:33:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 157, "total_steps": 560, "loss": 0.2537, "learning_rate": 9.041417976610027e-05, "epoch": 2.7911111111111113, "percentage": 28.04, "elapsed_time": "1:22:54", "remaining_time": "3:32:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 158, "total_steps": 560, "loss": 0.2212, "learning_rate": 9.022988898833342e-05, "epoch": 2.8088888888888888, "percentage": 28.21, "elapsed_time": "1:23:29", "remaining_time": "3:32:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 159, "total_steps": 560, "loss": 0.2514, "learning_rate": 9.004403511295141e-05, "epoch": 2.8266666666666667, "percentage": 28.39, "elapsed_time": "1:23:50", "remaining_time": "3:31:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 160, "total_steps": 560, "loss": 0.2857, "learning_rate": 8.985662536114613e-05, "epoch": 2.8444444444444446, "percentage": 28.57, "elapsed_time": "1:24:20", "remaining_time": "3:30:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 161, "total_steps": 560, "loss": 0.2507, "learning_rate": 8.966766701456177e-05, "epoch": 2.862222222222222, "percentage": 28.75, "elapsed_time": "1:24:46", "remaining_time": "3:30:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 162, "total_steps": 560, "loss": 0.2875, "learning_rate": 8.947716741501177e-05, "epoch": 2.88, "percentage": 28.93, "elapsed_time": "1:25:16", "remaining_time": "3:29:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 163, "total_steps": 560, "loss": 0.2601, "learning_rate": 8.928513396419368e-05, "epoch": 2.897777777777778, "percentage": 29.11, "elapsed_time": "1:25:38", "remaining_time": "3:28:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 164, "total_steps": 560, "loss": 0.2624, "learning_rate": 8.90915741234015e-05, "epoch": 2.9155555555555557, "percentage": 29.29, "elapsed_time": "1:26:03", "remaining_time": "3:27:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 165, "total_steps": 560, "loss": 0.2578, "learning_rate": 8.889649541323574e-05, "epoch": 2.9333333333333336, "percentage": 29.46, "elapsed_time": "1:26:42", "remaining_time": "3:27:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 166, "total_steps": 560, "loss": 0.2354, "learning_rate": 8.869990541331138e-05, "epoch": 2.951111111111111, "percentage": 29.64, "elapsed_time": "1:27:19", "remaining_time": "3:27:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 167, "total_steps": 560, "loss": 0.3058, "learning_rate": 8.850181176196315e-05, "epoch": 2.968888888888889, "percentage": 29.82, "elapsed_time": "1:27:53", "remaining_time": "3:26:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 168, "total_steps": 560, "loss": 0.2424, "learning_rate": 8.83022221559489e-05, "epoch": 2.986666666666667, "percentage": 30.0, "elapsed_time": "1:28:41", "remaining_time": "3:26:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 169, "total_steps": 560, "loss": 0.2527, "learning_rate": 8.810114435015054e-05, "epoch": 3.0044444444444443, "percentage": 30.18, "elapsed_time": "1:29:32", "remaining_time": "3:27:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 170, "total_steps": 560, "loss": 0.2644, "learning_rate": 8.789858615727265e-05, "epoch": 3.022222222222222, "percentage": 30.36, "elapsed_time": "1:30:07", "remaining_time": "3:26:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 171, "total_steps": 560, "loss": 0.2419, "learning_rate": 8.7694555447539e-05, "epoch": 3.04, "percentage": 30.54, "elapsed_time": "1:30:43", "remaining_time": "3:26:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 172, "total_steps": 560, "loss": 0.2201, "learning_rate": 8.748906014838672e-05, "epoch": 3.057777777777778, "percentage": 30.71, "elapsed_time": "1:31:17", "remaining_time": "3:25:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 173, "total_steps": 560, "loss": 0.2479, "learning_rate": 8.728210824415827e-05, "epoch": 3.0755555555555554, "percentage": 30.89, "elapsed_time": "1:31:41", "remaining_time": "3:25:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 174, "total_steps": 560, "loss": 0.2311, "learning_rate": 8.707370777579133e-05, "epoch": 3.0933333333333333, "percentage": 31.07, "elapsed_time": "1:32:18", "remaining_time": "3:24:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 175, "total_steps": 560, "loss": 0.2239, "learning_rate": 8.68638668405062e-05, "epoch": 3.111111111111111, "percentage": 31.25, "elapsed_time": "1:32:48", "remaining_time": "3:24:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 176, "total_steps": 560, "loss": 0.2798, "learning_rate": 8.665259359149132e-05, "epoch": 3.128888888888889, "percentage": 31.43, "elapsed_time": "1:33:21", "remaining_time": "3:23:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 177, "total_steps": 560, "loss": 0.2376, "learning_rate": 8.643989623758643e-05, "epoch": 3.1466666666666665, "percentage": 31.61, "elapsed_time": "1:33:43", "remaining_time": "3:22:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 178, "total_steps": 560, "loss": 0.2672, "learning_rate": 8.622578304296364e-05, "epoch": 3.1644444444444444, "percentage": 31.79, "elapsed_time": "1:34:17", "remaining_time": "3:22:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 179, "total_steps": 560, "loss": 0.2463, "learning_rate": 8.601026232680634e-05, "epoch": 3.1822222222222223, "percentage": 31.96, "elapsed_time": "1:34:36", "remaining_time": "3:21:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 180, "total_steps": 560, "loss": 0.2367, "learning_rate": 8.579334246298593e-05, "epoch": 3.2, "percentage": 32.14, "elapsed_time": "1:35:14", "remaining_time": "3:21:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 181, "total_steps": 560, "loss": 0.2362, "learning_rate": 8.557503187973651e-05, "epoch": 3.2177777777777776, "percentage": 32.32, "elapsed_time": "1:35:55", "remaining_time": "3:20:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 182, "total_steps": 560, "loss": 0.2331, "learning_rate": 8.535533905932738e-05, "epoch": 3.2355555555555555, "percentage": 32.5, "elapsed_time": "1:36:16", "remaining_time": "3:19:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 183, "total_steps": 560, "loss": 0.2775, "learning_rate": 8.513427253773346e-05, "epoch": 3.2533333333333334, "percentage": 32.68, "elapsed_time": "1:36:38", "remaining_time": "3:19:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 184, "total_steps": 560, "loss": 0.2239, "learning_rate": 8.491184090430364e-05, "epoch": 3.2711111111111113, "percentage": 32.86, "elapsed_time": "1:37:08", "remaining_time": "3:18:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 185, "total_steps": 560, "loss": 0.2395, "learning_rate": 8.468805280142709e-05, "epoch": 3.2888888888888888, "percentage": 33.04, "elapsed_time": "1:37:50", "remaining_time": "3:18:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 186, "total_steps": 560, "loss": 0.2222, "learning_rate": 8.446291692419736e-05, "epoch": 3.3066666666666666, "percentage": 33.21, "elapsed_time": "1:38:29", "remaining_time": "3:18:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 187, "total_steps": 560, "loss": 0.2151, "learning_rate": 8.423644202007467e-05, "epoch": 3.3244444444444445, "percentage": 33.39, "elapsed_time": "1:39:10", "remaining_time": "3:17:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 188, "total_steps": 560, "loss": 0.2501, "learning_rate": 8.400863688854597e-05, "epoch": 3.3422222222222224, "percentage": 33.57, "elapsed_time": "1:39:42", "remaining_time": "3:17:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 189, "total_steps": 560, "loss": 0.2801, "learning_rate": 8.377951038078302e-05, "epoch": 3.36, "percentage": 33.75, "elapsed_time": "1:40:12", "remaining_time": "3:16:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 190, "total_steps": 560, "loss": 0.2216, "learning_rate": 8.354907139929851e-05, "epoch": 3.3777777777777778, "percentage": 33.93, "elapsed_time": "1:40:48", "remaining_time": "3:16:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 191, "total_steps": 560, "loss": 0.228, "learning_rate": 8.33173288976002e-05, "epoch": 3.3955555555555557, "percentage": 34.11, "elapsed_time": "1:41:13", "remaining_time": "3:15:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 192, "total_steps": 560, "loss": 0.2521, "learning_rate": 8.308429187984297e-05, "epoch": 3.413333333333333, "percentage": 34.29, "elapsed_time": "1:41:38", "remaining_time": "3:14:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 193, "total_steps": 560, "loss": 0.2397, "learning_rate": 8.284996940047903e-05, "epoch": 3.431111111111111, "percentage": 34.46, "elapsed_time": "1:42:07", "remaining_time": "3:14:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 194, "total_steps": 560, "loss": 0.2204, "learning_rate": 8.261437056390606e-05, "epoch": 3.448888888888889, "percentage": 34.64, "elapsed_time": "1:42:49", "remaining_time": "3:13:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 195, "total_steps": 560, "loss": 0.2291, "learning_rate": 8.237750452411353e-05, "epoch": 3.466666666666667, "percentage": 34.82, "elapsed_time": "1:43:29", "remaining_time": "3:13:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 196, "total_steps": 560, "loss": 0.2218, "learning_rate": 8.213938048432697e-05, "epoch": 3.4844444444444447, "percentage": 35.0, "elapsed_time": "1:44:00", "remaining_time": "3:13:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 197, "total_steps": 560, "loss": 0.249, "learning_rate": 8.190000769665044e-05, "epoch": 3.502222222222222, "percentage": 35.18, "elapsed_time": "1:44:22", "remaining_time": "3:12:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 198, "total_steps": 560, "loss": 0.2749, "learning_rate": 8.1659395461707e-05, "epoch": 3.52, "percentage": 35.36, "elapsed_time": "1:44:48", "remaining_time": "3:11:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 199, "total_steps": 560, "loss": 0.2134, "learning_rate": 8.141755312827736e-05, "epoch": 3.537777777777778, "percentage": 35.54, "elapsed_time": "1:45:23", "remaining_time": "3:11:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 200, "total_steps": 560, "loss": 0.2216, "learning_rate": 8.117449009293668e-05, "epoch": 3.5555555555555554, "percentage": 35.71, "elapsed_time": "1:46:05", "remaining_time": "3:10:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 201, "total_steps": 560, "loss": 0.2369, "learning_rate": 8.093021579968941e-05, "epoch": 3.5733333333333333, "percentage": 35.89, "elapsed_time": "1:46:37", "remaining_time": "3:10:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 202, "total_steps": 560, "loss": 0.2433, "learning_rate": 8.068473973960238e-05, "epoch": 3.591111111111111, "percentage": 36.07, "elapsed_time": "1:47:12", "remaining_time": "3:09:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 203, "total_steps": 560, "loss": 0.2405, "learning_rate": 8.043807145043604e-05, "epoch": 3.608888888888889, "percentage": 36.25, "elapsed_time": "1:47:44", "remaining_time": "3:09:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 204, "total_steps": 560, "loss": 0.2345, "learning_rate": 8.019022051627388e-05, "epoch": 3.626666666666667, "percentage": 36.43, "elapsed_time": "1:48:25", "remaining_time": "3:09:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 205, "total_steps": 560, "loss": 0.2574, "learning_rate": 7.994119656715002e-05, "epoch": 3.6444444444444444, "percentage": 36.61, "elapsed_time": "1:48:54", "remaining_time": "3:08:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 206, "total_steps": 560, "loss": 0.2445, "learning_rate": 7.969100927867507e-05, "epoch": 3.6622222222222223, "percentage": 36.79, "elapsed_time": "1:49:30", "remaining_time": "3:08:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 207, "total_steps": 560, "loss": 0.2099, "learning_rate": 7.943966837166023e-05, "epoch": 3.68, "percentage": 36.96, "elapsed_time": "1:50:04", "remaining_time": "3:07:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 208, "total_steps": 560, "loss": 0.2051, "learning_rate": 7.91871836117395e-05, "epoch": 3.6977777777777776, "percentage": 37.14, "elapsed_time": "1:50:39", "remaining_time": "3:07:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 209, "total_steps": 560, "loss": 0.2132, "learning_rate": 7.89335648089903e-05, "epoch": 3.7155555555555555, "percentage": 37.32, "elapsed_time": "1:51:20", "remaining_time": "3:06:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 210, "total_steps": 560, "loss": 0.2284, "learning_rate": 7.86788218175523e-05, "epoch": 3.7333333333333334, "percentage": 37.5, "elapsed_time": "1:51:59", "remaining_time": "3:06:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 211, "total_steps": 560, "loss": 0.3221, "learning_rate": 7.842296453524463e-05, "epoch": 3.7511111111111113, "percentage": 37.68, "elapsed_time": "1:52:17", "remaining_time": "3:05:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 212, "total_steps": 560, "loss": 0.2558, "learning_rate": 7.81660029031811e-05, "epoch": 3.7688888888888887, "percentage": 37.86, "elapsed_time": "1:52:51", "remaining_time": "3:05:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 213, "total_steps": 560, "loss": 0.228, "learning_rate": 7.79079469053842e-05, "epoch": 3.7866666666666666, "percentage": 38.04, "elapsed_time": "1:53:20", "remaining_time": "3:04:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 214, "total_steps": 560, "loss": 0.2025, "learning_rate": 7.764880656839696e-05, "epoch": 3.8044444444444445, "percentage": 38.21, "elapsed_time": "1:53:49", "remaining_time": "3:04:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 215, "total_steps": 560, "loss": 0.2142, "learning_rate": 7.738859196089358e-05, "epoch": 3.822222222222222, "percentage": 38.39, "elapsed_time": "1:54:27", "remaining_time": "3:03:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 216, "total_steps": 560, "loss": 0.2614, "learning_rate": 7.712731319328798e-05, "epoch": 3.84, "percentage": 38.57, "elapsed_time": "1:54:53", "remaining_time": "3:02:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 217, "total_steps": 560, "loss": 0.24, "learning_rate": 7.68649804173412e-05, "epoch": 3.8577777777777778, "percentage": 38.75, "elapsed_time": "1:55:28", "remaining_time": "3:02:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 218, "total_steps": 560, "loss": 0.2054, "learning_rate": 7.660160382576683e-05, "epoch": 3.8755555555555556, "percentage": 38.93, "elapsed_time": "1:55:44", "remaining_time": "3:01:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 219, "total_steps": 560, "loss": 0.2464, "learning_rate": 7.633719365183504e-05, "epoch": 3.8933333333333335, "percentage": 39.11, "elapsed_time": "1:56:12", "remaining_time": "3:00:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 220, "total_steps": 560, "loss": 0.2583, "learning_rate": 7.60717601689749e-05, "epoch": 3.911111111111111, "percentage": 39.29, "elapsed_time": "1:56:50", "remaining_time": "3:00:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 221, "total_steps": 560, "loss": 0.2387, "learning_rate": 7.580531369037533e-05, "epoch": 3.928888888888889, "percentage": 39.46, "elapsed_time": "1:57:14", "remaining_time": "2:59:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 222, "total_steps": 560, "loss": 0.2333, "learning_rate": 7.553786456858429e-05, "epoch": 3.9466666666666668, "percentage": 39.64, "elapsed_time": "1:57:46", "remaining_time": "2:59:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 223, "total_steps": 560, "loss": 0.2353, "learning_rate": 7.526942319510655e-05, "epoch": 3.964444444444444, "percentage": 39.82, "elapsed_time": "1:58:19", "remaining_time": "2:58:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 224, "total_steps": 560, "loss": 0.2411, "learning_rate": 7.500000000000001e-05, "epoch": 3.982222222222222, "percentage": 40.0, "elapsed_time": "1:58:55", "remaining_time": "2:58:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 225, "total_steps": 560, "loss": 0.2472, "learning_rate": 7.472960545147038e-05, "epoch": 4.0, "percentage": 40.18, "elapsed_time": "1:59:24", "remaining_time": "2:57:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 226, "total_steps": 560, "loss": 0.217, "learning_rate": 7.445825005546448e-05, "epoch": 4.017777777777778, "percentage": 40.36, "elapsed_time": "2:00:13", "remaining_time": "2:57:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 227, "total_steps": 560, "loss": 0.2026, "learning_rate": 7.4185944355262e-05, "epoch": 4.035555555555556, "percentage": 40.54, "elapsed_time": "2:00:40", "remaining_time": "2:57:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 228, "total_steps": 560, "loss": 0.2364, "learning_rate": 7.391269893106592e-05, "epoch": 4.053333333333334, "percentage": 40.71, "elapsed_time": "2:01:13", "remaining_time": "2:56:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 229, "total_steps": 560, "loss": 0.1774, "learning_rate": 7.363852439959135e-05, "epoch": 4.071111111111111, "percentage": 40.89, "elapsed_time": "2:01:48", "remaining_time": "2:56:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 230, "total_steps": 560, "loss": 0.2156, "learning_rate": 7.33634314136531e-05, "epoch": 4.088888888888889, "percentage": 41.07, "elapsed_time": "2:02:14", "remaining_time": "2:55:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 231, "total_steps": 560, "loss": 0.2006, "learning_rate": 7.308743066175172e-05, "epoch": 4.1066666666666665, "percentage": 41.25, "elapsed_time": "2:02:36", "remaining_time": "2:54:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 232, "total_steps": 560, "loss": 0.2195, "learning_rate": 7.281053286765815e-05, "epoch": 4.124444444444444, "percentage": 41.43, "elapsed_time": "2:03:17", "remaining_time": "2:54:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 233, "total_steps": 560, "loss": 0.2268, "learning_rate": 7.253274878999727e-05, "epoch": 4.142222222222222, "percentage": 41.61, "elapsed_time": "2:03:52", "remaining_time": "2:53:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 234, "total_steps": 560, "loss": 0.2186, "learning_rate": 7.225408922182961e-05, "epoch": 4.16, "percentage": 41.79, "elapsed_time": "2:04:25", "remaining_time": "2:53:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 235, "total_steps": 560, "loss": 0.2039, "learning_rate": 7.197456499023225e-05, "epoch": 4.177777777777778, "percentage": 41.96, "elapsed_time": "2:04:48", "remaining_time": "2:52:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 236, "total_steps": 560, "loss": 0.2107, "learning_rate": 7.169418695587791e-05, "epoch": 4.195555555555556, "percentage": 42.14, "elapsed_time": "2:05:25", "remaining_time": "2:52:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 237, "total_steps": 560, "loss": 0.2387, "learning_rate": 7.141296601261314e-05, "epoch": 4.213333333333333, "percentage": 42.32, "elapsed_time": "2:05:49", "remaining_time": "2:51:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 238, "total_steps": 560, "loss": 0.1914, "learning_rate": 7.113091308703498e-05, "epoch": 4.231111111111111, "percentage": 42.5, "elapsed_time": "2:06:18", "remaining_time": "2:50:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 239, "total_steps": 560, "loss": 0.2192, "learning_rate": 7.084803913806641e-05, "epoch": 4.248888888888889, "percentage": 42.68, "elapsed_time": "2:06:46", "remaining_time": "2:50:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 240, "total_steps": 560, "loss": 0.2406, "learning_rate": 7.056435515653059e-05, "epoch": 4.266666666666667, "percentage": 42.86, "elapsed_time": "2:07:08", "remaining_time": "2:49:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 241, "total_steps": 560, "loss": 0.2102, "learning_rate": 7.027987216472377e-05, "epoch": 4.2844444444444445, "percentage": 43.04, "elapsed_time": "2:07:42", "remaining_time": "2:49:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 242, "total_steps": 560, "loss": 0.1943, "learning_rate": 6.999460121598704e-05, "epoch": 4.302222222222222, "percentage": 43.21, "elapsed_time": "2:08:11", "remaining_time": "2:48:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 243, "total_steps": 560, "loss": 0.1955, "learning_rate": 6.970855339427698e-05, "epoch": 4.32, "percentage": 43.39, "elapsed_time": "2:08:33", "remaining_time": "2:47:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 244, "total_steps": 560, "loss": 0.2316, "learning_rate": 6.942173981373474e-05, "epoch": 4.337777777777778, "percentage": 43.57, "elapsed_time": "2:09:09", "remaining_time": "2:47:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 245, "total_steps": 560, "loss": 0.2038, "learning_rate": 6.91341716182545e-05, "epoch": 4.355555555555555, "percentage": 43.75, "elapsed_time": "2:09:40", "remaining_time": "2:46:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 246, "total_steps": 560, "loss": 0.2137, "learning_rate": 6.884585998105026e-05, "epoch": 4.373333333333333, "percentage": 43.93, "elapsed_time": "2:10:02", "remaining_time": "2:45:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 247, "total_steps": 560, "loss": 0.2059, "learning_rate": 6.855681610422189e-05, "epoch": 4.391111111111111, "percentage": 44.11, "elapsed_time": "2:10:31", "remaining_time": "2:45:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 248, "total_steps": 560, "loss": 0.2213, "learning_rate": 6.826705121831976e-05, "epoch": 4.408888888888889, "percentage": 44.29, "elapsed_time": "2:11:20", "remaining_time": "2:45:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 249, "total_steps": 560, "loss": 0.2061, "learning_rate": 6.797657658190839e-05, "epoch": 4.426666666666667, "percentage": 44.46, "elapsed_time": "2:11:37", "remaining_time": "2:44:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 250, "total_steps": 560, "loss": 0.2185, "learning_rate": 6.768540348112907e-05, "epoch": 4.444444444444445, "percentage": 44.64, "elapsed_time": "2:12:23", "remaining_time": "2:44:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 251, "total_steps": 560, "loss": 0.1946, "learning_rate": 6.739354322926136e-05, "epoch": 4.4622222222222225, "percentage": 44.82, "elapsed_time": "2:12:53", "remaining_time": "2:43:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 252, "total_steps": 560, "loss": 0.2716, "learning_rate": 6.710100716628344e-05, "epoch": 4.48, "percentage": 45.0, "elapsed_time": "2:13:25", "remaining_time": "2:43:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 253, "total_steps": 560, "loss": 0.1893, "learning_rate": 6.680780665843155e-05, "epoch": 4.497777777777777, "percentage": 45.18, "elapsed_time": "2:13:49", "remaining_time": "2:42:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 254, "total_steps": 560, "loss": 0.216, "learning_rate": 6.651395309775837e-05, "epoch": 4.515555555555555, "percentage": 45.36, "elapsed_time": "2:14:34", "remaining_time": "2:42:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 255, "total_steps": 560, "loss": 0.1849, "learning_rate": 6.621945790169036e-05, "epoch": 4.533333333333333, "percentage": 45.54, "elapsed_time": "2:15:02", "remaining_time": "2:41:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 256, "total_steps": 560, "loss": 0.1977, "learning_rate": 6.592433251258423e-05, "epoch": 4.551111111111111, "percentage": 45.71, "elapsed_time": "2:15:30", "remaining_time": "2:40:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 257, "total_steps": 560, "loss": 0.2167, "learning_rate": 6.562858839728223e-05, "epoch": 4.568888888888889, "percentage": 45.89, "elapsed_time": "2:16:11", "remaining_time": "2:40:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 258, "total_steps": 560, "loss": 0.2128, "learning_rate": 6.533223704666672e-05, "epoch": 4.586666666666667, "percentage": 46.07, "elapsed_time": "2:16:45", "remaining_time": "2:40:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 259, "total_steps": 560, "loss": 0.1932, "learning_rate": 6.503528997521366e-05, "epoch": 4.604444444444445, "percentage": 46.25, "elapsed_time": "2:17:13", "remaining_time": "2:39:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 260, "total_steps": 560, "loss": 0.1991, "learning_rate": 6.473775872054521e-05, "epoch": 4.622222222222222, "percentage": 46.43, "elapsed_time": "2:18:04", "remaining_time": "2:39:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 261, "total_steps": 560, "loss": 0.179, "learning_rate": 6.44396548429815e-05, "epoch": 4.64, "percentage": 46.61, "elapsed_time": "2:18:28", "remaining_time": "2:38:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 262, "total_steps": 560, "loss": 0.2154, "learning_rate": 6.414098992509138e-05, "epoch": 4.657777777777778, "percentage": 46.79, "elapsed_time": "2:18:58", "remaining_time": "2:38:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 263, "total_steps": 560, "loss": 0.2024, "learning_rate": 6.384177557124247e-05, "epoch": 4.6755555555555555, "percentage": 46.96, "elapsed_time": "2:19:22", "remaining_time": "2:37:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 264, "total_steps": 560, "loss": 0.2264, "learning_rate": 6.354202340715026e-05, "epoch": 4.693333333333333, "percentage": 47.14, "elapsed_time": "2:20:03", "remaining_time": "2:37:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 265, "total_steps": 560, "loss": 0.2175, "learning_rate": 6.324174507942637e-05, "epoch": 4.711111111111111, "percentage": 47.32, "elapsed_time": "2:20:37", "remaining_time": "2:36:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 266, "total_steps": 560, "loss": 0.1969, "learning_rate": 6.294095225512603e-05, "epoch": 4.728888888888889, "percentage": 47.5, "elapsed_time": "2:21:17", "remaining_time": "2:36:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 267, "total_steps": 560, "loss": 0.2322, "learning_rate": 6.263965662129487e-05, "epoch": 4.746666666666667, "percentage": 47.68, "elapsed_time": "2:21:52", "remaining_time": "2:35:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 268, "total_steps": 560, "loss": 0.1617, "learning_rate": 6.233786988451468e-05, "epoch": 4.764444444444445, "percentage": 47.86, "elapsed_time": "2:22:25", "remaining_time": "2:35:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 269, "total_steps": 560, "loss": 0.2324, "learning_rate": 6.203560377044866e-05, "epoch": 4.782222222222222, "percentage": 48.04, "elapsed_time": "2:22:57", "remaining_time": "2:34:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 270, "total_steps": 560, "loss": 0.2213, "learning_rate": 6.173287002338577e-05, "epoch": 4.8, "percentage": 48.21, "elapsed_time": "2:23:31", "remaining_time": "2:34:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 271, "total_steps": 560, "loss": 0.2163, "learning_rate": 6.142968040578449e-05, "epoch": 4.817777777777778, "percentage": 48.39, "elapsed_time": "2:23:58", "remaining_time": "2:33:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 272, "total_steps": 560, "loss": 0.2014, "learning_rate": 6.112604669781572e-05, "epoch": 4.835555555555556, "percentage": 48.57, "elapsed_time": "2:24:22", "remaining_time": "2:32:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 273, "total_steps": 560, "loss": 0.2123, "learning_rate": 6.0821980696905146e-05, "epoch": 4.8533333333333335, "percentage": 48.75, "elapsed_time": "2:24:54", "remaining_time": "2:32:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 274, "total_steps": 560, "loss": 0.2008, "learning_rate": 6.0517494217274794e-05, "epoch": 4.871111111111111, "percentage": 48.93, "elapsed_time": "2:25:34", "remaining_time": "2:31:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 275, "total_steps": 560, "loss": 0.2011, "learning_rate": 6.021259908948402e-05, "epoch": 4.888888888888889, "percentage": 49.11, "elapsed_time": "2:25:58", "remaining_time": "2:31:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 276, "total_steps": 560, "loss": 0.2215, "learning_rate": 5.9907307159969884e-05, "epoch": 4.906666666666666, "percentage": 49.29, "elapsed_time": "2:26:40", "remaining_time": "2:30:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 277, "total_steps": 560, "loss": 0.1943, "learning_rate": 5.960163029058682e-05, "epoch": 4.924444444444444, "percentage": 49.46, "elapsed_time": "2:27:18", "remaining_time": "2:30:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 278, "total_steps": 560, "loss": 0.2132, "learning_rate": 5.9295580358145744e-05, "epoch": 4.942222222222222, "percentage": 49.64, "elapsed_time": "2:27:51", "remaining_time": "2:29:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 279, "total_steps": 560, "loss": 0.2227, "learning_rate": 5.898916925395264e-05, "epoch": 4.96, "percentage": 49.82, "elapsed_time": "2:28:22", "remaining_time": "2:29:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 280, "total_steps": 560, "loss": 0.2165, "learning_rate": 5.868240888334653e-05, "epoch": 4.977777777777778, "percentage": 50.0, "elapsed_time": "2:28:58", "remaining_time": "2:28:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 281, "total_steps": 560, "loss": 0.1669, "learning_rate": 5.837531116523682e-05, "epoch": 4.995555555555556, "percentage": 50.18, "elapsed_time": "2:29:33", "remaining_time": "2:28:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 282, "total_steps": 560, "loss": 0.1828, "learning_rate": 5.806788803164034e-05, "epoch": 5.013333333333334, "percentage": 50.36, "elapsed_time": "2:30:00", "remaining_time": "2:27:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 283, "total_steps": 560, "loss": 0.1957, "learning_rate": 5.7760151427217576e-05, "epoch": 5.0311111111111115, "percentage": 50.54, "elapsed_time": "2:30:31", "remaining_time": "2:27:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 284, "total_steps": 560, "loss": 0.2331, "learning_rate": 5.745211330880872e-05, "epoch": 5.0488888888888885, "percentage": 50.71, "elapsed_time": "2:31:07", "remaining_time": "2:26:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 285, "total_steps": 560, "loss": 0.2065, "learning_rate": 5.714378564496901e-05, "epoch": 5.066666666666666, "percentage": 50.89, "elapsed_time": "2:31:40", "remaining_time": "2:26:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 286, "total_steps": 560, "loss": 0.1657, "learning_rate": 5.683518041550368e-05, "epoch": 5.084444444444444, "percentage": 51.07, "elapsed_time": "2:32:01", "remaining_time": "2:25:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 287, "total_steps": 560, "loss": 0.1948, "learning_rate": 5.6526309611002594e-05, "epoch": 5.102222222222222, "percentage": 51.25, "elapsed_time": "2:32:27", "remaining_time": "2:25:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 288, "total_steps": 560, "loss": 0.1709, "learning_rate": 5.621718523237427e-05, "epoch": 5.12, "percentage": 51.43, "elapsed_time": "2:33:00", "remaining_time": "2:24:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 289, "total_steps": 560, "loss": 0.1662, "learning_rate": 5.590781929037965e-05, "epoch": 5.137777777777778, "percentage": 51.61, "elapsed_time": "2:33:34", "remaining_time": "2:24:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 290, "total_steps": 560, "loss": 0.1477, "learning_rate": 5.559822380516539e-05, "epoch": 5.155555555555556, "percentage": 51.79, "elapsed_time": "2:34:01", "remaining_time": "2:23:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 291, "total_steps": 560, "loss": 0.1802, "learning_rate": 5.5288410805796895e-05, "epoch": 5.173333333333334, "percentage": 51.96, "elapsed_time": "2:34:32", "remaining_time": "2:22:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 292, "total_steps": 560, "loss": 0.178, "learning_rate": 5.497839232979084e-05, "epoch": 5.191111111111111, "percentage": 52.14, "elapsed_time": "2:35:00", "remaining_time": "2:22:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 293, "total_steps": 560, "loss": 0.1453, "learning_rate": 5.466818042264753e-05, "epoch": 5.208888888888889, "percentage": 52.32, "elapsed_time": "2:35:19", "remaining_time": "2:21:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 294, "total_steps": 560, "loss": 0.212, "learning_rate": 5.435778713738292e-05, "epoch": 5.226666666666667, "percentage": 52.5, "elapsed_time": "2:35:57", "remaining_time": "2:21:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 295, "total_steps": 560, "loss": 0.1773, "learning_rate": 5.404722453406017e-05, "epoch": 5.2444444444444445, "percentage": 52.68, "elapsed_time": "2:36:33", "remaining_time": "2:20:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 296, "total_steps": 560, "loss": 0.1816, "learning_rate": 5.373650467932122e-05, "epoch": 5.262222222222222, "percentage": 52.86, "elapsed_time": "2:37:01", "remaining_time": "2:20:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 297, "total_steps": 560, "loss": 0.1544, "learning_rate": 5.3425639645917834e-05, "epoch": 5.28, "percentage": 53.04, "elapsed_time": "2:37:29", "remaining_time": "2:19:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 298, "total_steps": 560, "loss": 0.1381, "learning_rate": 5.311464151224261e-05, "epoch": 5.297777777777778, "percentage": 53.21, "elapsed_time": "2:37:56", "remaining_time": "2:18:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 299, "total_steps": 560, "loss": 0.1653, "learning_rate": 5.2803522361859594e-05, "epoch": 5.315555555555555, "percentage": 53.39, "elapsed_time": "2:38:26", "remaining_time": "2:18:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 300, "total_steps": 560, "loss": 0.167, "learning_rate": 5.249229428303486e-05, "epoch": 5.333333333333333, "percentage": 53.57, "elapsed_time": "2:38:56", "remaining_time": "2:17:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 301, "total_steps": 560, "loss": 0.2221, "learning_rate": 5.218096936826681e-05, "epoch": 5.351111111111111, "percentage": 53.75, "elapsed_time": "2:39:40", "remaining_time": "2:17:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 302, "total_steps": 560, "loss": 0.1932, "learning_rate": 5.18695597138163e-05, "epoch": 5.368888888888889, "percentage": 53.93, "elapsed_time": "2:40:20", "remaining_time": "2:16:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 303, "total_steps": 560, "loss": 0.1818, "learning_rate": 5.155807741923666e-05, "epoch": 5.386666666666667, "percentage": 54.11, "elapsed_time": "2:40:58", "remaining_time": "2:16:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 304, "total_steps": 560, "loss": 0.1924, "learning_rate": 5.124653458690365e-05, "epoch": 5.404444444444445, "percentage": 54.29, "elapsed_time": "2:41:32", "remaining_time": "2:16:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 305, "total_steps": 560, "loss": 0.1922, "learning_rate": 5.0934943321545115e-05, "epoch": 5.4222222222222225, "percentage": 54.46, "elapsed_time": "2:41:57", "remaining_time": "2:15:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 306, "total_steps": 560, "loss": 0.1828, "learning_rate": 5.062331572977076e-05, "epoch": 5.44, "percentage": 54.64, "elapsed_time": "2:42:34", "remaining_time": "2:14:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 307, "total_steps": 560, "loss": 0.2173, "learning_rate": 5.031166391960168e-05, "epoch": 5.457777777777777, "percentage": 54.82, "elapsed_time": "2:43:01", "remaining_time": "2:14:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 308, "total_steps": 560, "loss": 0.1703, "learning_rate": 5e-05, "epoch": 5.475555555555555, "percentage": 55.0, "elapsed_time": "2:43:33", "remaining_time": "2:13:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 309, "total_steps": 560, "loss": 0.1751, "learning_rate": 4.968833608039832e-05, "epoch": 5.493333333333333, "percentage": 55.18, "elapsed_time": "2:44:15", "remaining_time": "2:13:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 310, "total_steps": 560, "loss": 0.1835, "learning_rate": 4.9376684270229254e-05, "epoch": 5.511111111111111, "percentage": 55.36, "elapsed_time": "2:44:56", "remaining_time": "2:13:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 311, "total_steps": 560, "loss": 0.1892, "learning_rate": 4.9065056678454904e-05, "epoch": 5.528888888888889, "percentage": 55.54, "elapsed_time": "2:45:28", "remaining_time": "2:12:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 312, "total_steps": 560, "loss": 0.181, "learning_rate": 4.875346541309637e-05, "epoch": 5.546666666666667, "percentage": 55.71, "elapsed_time": "2:45:55", "remaining_time": "2:11:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 313, "total_steps": 560, "loss": 0.1723, "learning_rate": 4.844192258076336e-05, "epoch": 5.564444444444445, "percentage": 55.89, "elapsed_time": "2:46:19", "remaining_time": "2:11:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 314, "total_steps": 560, "loss": 0.1875, "learning_rate": 4.813044028618373e-05, "epoch": 5.582222222222223, "percentage": 56.07, "elapsed_time": "2:46:51", "remaining_time": "2:10:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 315, "total_steps": 560, "loss": 0.1903, "learning_rate": 4.781903063173321e-05, "epoch": 5.6, "percentage": 56.25, "elapsed_time": "2:47:33", "remaining_time": "2:10:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 316, "total_steps": 560, "loss": 0.1742, "learning_rate": 4.750770571696514e-05, "epoch": 5.6177777777777775, "percentage": 56.43, "elapsed_time": "2:48:21", "remaining_time": "2:10:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 317, "total_steps": 560, "loss": 0.1604, "learning_rate": 4.7196477638140404e-05, "epoch": 5.635555555555555, "percentage": 56.61, "elapsed_time": "2:48:50", "remaining_time": "2:09:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 318, "total_steps": 560, "loss": 0.2142, "learning_rate": 4.68853584877574e-05, "epoch": 5.653333333333333, "percentage": 56.79, "elapsed_time": "2:49:29", "remaining_time": "2:08:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 319, "total_steps": 560, "loss": 0.1902, "learning_rate": 4.657436035408217e-05, "epoch": 5.671111111111111, "percentage": 56.96, "elapsed_time": "2:50:01", "remaining_time": "2:08:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 320, "total_steps": 560, "loss": 0.1604, "learning_rate": 4.626349532067879e-05, "epoch": 5.688888888888889, "percentage": 57.14, "elapsed_time": "2:50:30", "remaining_time": "2:07:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 321, "total_steps": 560, "loss": 0.2049, "learning_rate": 4.595277546593984e-05, "epoch": 5.706666666666667, "percentage": 57.32, "elapsed_time": "2:51:17", "remaining_time": "2:07:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 322, "total_steps": 560, "loss": 0.1715, "learning_rate": 4.564221286261709e-05, "epoch": 5.724444444444444, "percentage": 57.5, "elapsed_time": "2:51:49", "remaining_time": "2:07:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 323, "total_steps": 560, "loss": 0.1601, "learning_rate": 4.5331819577352474e-05, "epoch": 5.742222222222222, "percentage": 57.68, "elapsed_time": "2:52:12", "remaining_time": "2:06:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 324, "total_steps": 560, "loss": 0.1589, "learning_rate": 4.502160767020918e-05, "epoch": 5.76, "percentage": 57.86, "elapsed_time": "2:52:33", "remaining_time": "2:05:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 325, "total_steps": 560, "loss": 0.1656, "learning_rate": 4.471158919420312e-05, "epoch": 5.777777777777778, "percentage": 58.04, "elapsed_time": "2:53:00", "remaining_time": "2:05:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 326, "total_steps": 560, "loss": 0.1821, "learning_rate": 4.4401776194834613e-05, "epoch": 5.795555555555556, "percentage": 58.21, "elapsed_time": "2:53:23", "remaining_time": "2:04:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 327, "total_steps": 560, "loss": 0.1752, "learning_rate": 4.409218070962036e-05, "epoch": 5.8133333333333335, "percentage": 58.39, "elapsed_time": "2:53:58", "remaining_time": "2:03:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 328, "total_steps": 560, "loss": 0.204, "learning_rate": 4.378281476762576e-05, "epoch": 5.831111111111111, "percentage": 58.57, "elapsed_time": "2:54:38", "remaining_time": "2:03:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 329, "total_steps": 560, "loss": 0.1562, "learning_rate": 4.347369038899744e-05, "epoch": 5.848888888888889, "percentage": 58.75, "elapsed_time": "2:55:01", "remaining_time": "2:02:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 330, "total_steps": 560, "loss": 0.2376, "learning_rate": 4.316481958449634e-05, "epoch": 5.866666666666667, "percentage": 58.93, "elapsed_time": "2:55:29", "remaining_time": "2:02:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 331, "total_steps": 560, "loss": 0.1699, "learning_rate": 4.285621435503101e-05, "epoch": 5.884444444444444, "percentage": 59.11, "elapsed_time": "2:55:59", "remaining_time": "2:01:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 332, "total_steps": 560, "loss": 0.1652, "learning_rate": 4.254788669119127e-05, "epoch": 5.902222222222222, "percentage": 59.29, "elapsed_time": "2:56:31", "remaining_time": "2:01:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 333, "total_steps": 560, "loss": 0.1695, "learning_rate": 4.223984857278242e-05, "epoch": 5.92, "percentage": 59.46, "elapsed_time": "2:57:08", "remaining_time": "2:00:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 334, "total_steps": 560, "loss": 0.1673, "learning_rate": 4.1932111968359664e-05, "epoch": 5.937777777777778, "percentage": 59.64, "elapsed_time": "2:57:45", "remaining_time": "2:00:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 335, "total_steps": 560, "loss": 0.1852, "learning_rate": 4.162468883476319e-05, "epoch": 5.955555555555556, "percentage": 59.82, "elapsed_time": "2:58:11", "remaining_time": "1:59:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 336, "total_steps": 560, "loss": 0.1847, "learning_rate": 4.131759111665349e-05, "epoch": 5.973333333333334, "percentage": 60.0, "elapsed_time": "2:58:36", "remaining_time": "1:59:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 337, "total_steps": 560, "loss": 0.1709, "learning_rate": 4.101083074604737e-05, "epoch": 5.9911111111111115, "percentage": 60.18, "elapsed_time": "2:59:15", "remaining_time": "1:58:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 338, "total_steps": 560, "loss": 0.1476, "learning_rate": 4.0704419641854274e-05, "epoch": 6.0088888888888885, "percentage": 60.36, "elapsed_time": "2:59:38", "remaining_time": "1:57:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 339, "total_steps": 560, "loss": 0.1731, "learning_rate": 4.03983697094132e-05, "epoch": 6.026666666666666, "percentage": 60.54, "elapsed_time": "3:00:09", "remaining_time": "1:57:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 340, "total_steps": 560, "loss": 0.1625, "learning_rate": 4.0092692840030134e-05, "epoch": 6.044444444444444, "percentage": 60.71, "elapsed_time": "3:00:47", "remaining_time": "1:56:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 341, "total_steps": 560, "loss": 0.1718, "learning_rate": 3.978740091051599e-05, "epoch": 6.062222222222222, "percentage": 60.89, "elapsed_time": "3:01:20", "remaining_time": "1:56:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 342, "total_steps": 560, "loss": 0.1793, "learning_rate": 3.9482505782725224e-05, "epoch": 6.08, "percentage": 61.07, "elapsed_time": "3:02:00", "remaining_time": "1:56:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 343, "total_steps": 560, "loss": 0.1675, "learning_rate": 3.917801930309486e-05, "epoch": 6.097777777777778, "percentage": 61.25, "elapsed_time": "3:02:35", "remaining_time": "1:55:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 344, "total_steps": 560, "loss": 0.1528, "learning_rate": 3.887395330218429e-05, "epoch": 6.115555555555556, "percentage": 61.43, "elapsed_time": "3:03:05", "remaining_time": "1:54:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 345, "total_steps": 560, "loss": 0.1437, "learning_rate": 3.857031959421553e-05, "epoch": 6.133333333333334, "percentage": 61.61, "elapsed_time": "3:03:32", "remaining_time": "1:54:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 346, "total_steps": 560, "loss": 0.1647, "learning_rate": 3.8267129976614254e-05, "epoch": 6.151111111111111, "percentage": 61.79, "elapsed_time": "3:04:10", "remaining_time": "1:53:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 347, "total_steps": 560, "loss": 0.1436, "learning_rate": 3.7964396229551364e-05, "epoch": 6.168888888888889, "percentage": 61.96, "elapsed_time": "3:04:41", "remaining_time": "1:53:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 348, "total_steps": 560, "loss": 0.148, "learning_rate": 3.7662130115485314e-05, "epoch": 6.1866666666666665, "percentage": 62.14, "elapsed_time": "3:05:12", "remaining_time": "1:52:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 349, "total_steps": 560, "loss": 0.1413, "learning_rate": 3.7360343378705124e-05, "epoch": 6.204444444444444, "percentage": 62.32, "elapsed_time": "3:05:40", "remaining_time": "1:52:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 350, "total_steps": 560, "loss": 0.1528, "learning_rate": 3.705904774487396e-05, "epoch": 6.222222222222222, "percentage": 62.5, "elapsed_time": "3:06:11", "remaining_time": "1:51:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 351, "total_steps": 560, "loss": 0.1639, "learning_rate": 3.675825492057364e-05, "epoch": 6.24, "percentage": 62.68, "elapsed_time": "3:06:39", "remaining_time": "1:51:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 352, "total_steps": 560, "loss": 0.2024, "learning_rate": 3.6457976592849754e-05, "epoch": 6.257777777777778, "percentage": 62.86, "elapsed_time": "3:07:18", "remaining_time": "1:50:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 353, "total_steps": 560, "loss": 0.1443, "learning_rate": 3.6158224428757535e-05, "epoch": 6.275555555555556, "percentage": 63.04, "elapsed_time": "3:07:41", "remaining_time": "1:50:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 354, "total_steps": 560, "loss": 0.1314, "learning_rate": 3.585901007490863e-05, "epoch": 6.293333333333333, "percentage": 63.21, "elapsed_time": "3:08:04", "remaining_time": "1:49:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 355, "total_steps": 560, "loss": 0.1495, "learning_rate": 3.556034515701852e-05, "epoch": 6.311111111111111, "percentage": 63.39, "elapsed_time": "3:08:37", "remaining_time": "1:48:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 356, "total_steps": 560, "loss": 0.1571, "learning_rate": 3.5262241279454785e-05, "epoch": 6.328888888888889, "percentage": 63.57, "elapsed_time": "3:09:14", "remaining_time": "1:48:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 357, "total_steps": 560, "loss": 0.1413, "learning_rate": 3.4964710024786354e-05, "epoch": 6.346666666666667, "percentage": 63.75, "elapsed_time": "3:09:41", "remaining_time": "1:47:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 358, "total_steps": 560, "loss": 0.1643, "learning_rate": 3.4667762953333295e-05, "epoch": 6.364444444444445, "percentage": 63.93, "elapsed_time": "3:10:06", "remaining_time": "1:47:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 359, "total_steps": 560, "loss": 0.1716, "learning_rate": 3.4371411602717784e-05, "epoch": 6.3822222222222225, "percentage": 64.11, "elapsed_time": "3:10:37", "remaining_time": "1:46:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 360, "total_steps": 560, "loss": 0.1671, "learning_rate": 3.4075667487415785e-05, "epoch": 6.4, "percentage": 64.29, "elapsed_time": "3:11:17", "remaining_time": "1:46:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 361, "total_steps": 560, "loss": 0.167, "learning_rate": 3.3780542098309654e-05, "epoch": 6.417777777777777, "percentage": 64.46, "elapsed_time": "3:11:54", "remaining_time": "1:45:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 362, "total_steps": 560, "loss": 0.1518, "learning_rate": 3.3486046902241664e-05, "epoch": 6.435555555555555, "percentage": 64.64, "elapsed_time": "3:12:22", "remaining_time": "1:45:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 363, "total_steps": 560, "loss": 0.1888, "learning_rate": 3.319219334156847e-05, "epoch": 6.453333333333333, "percentage": 64.82, "elapsed_time": "3:12:56", "remaining_time": "1:44:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 364, "total_steps": 560, "loss": 0.1374, "learning_rate": 3.289899283371657e-05, "epoch": 6.471111111111111, "percentage": 65.0, "elapsed_time": "3:13:23", "remaining_time": "1:44:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 365, "total_steps": 560, "loss": 0.1823, "learning_rate": 3.2606456770738636e-05, "epoch": 6.488888888888889, "percentage": 65.18, "elapsed_time": "3:14:04", "remaining_time": "1:43:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 366, "total_steps": 560, "loss": 0.1424, "learning_rate": 3.231459651887093e-05, "epoch": 6.506666666666667, "percentage": 65.36, "elapsed_time": "3:14:45", "remaining_time": "1:43:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 367, "total_steps": 560, "loss": 0.1354, "learning_rate": 3.2023423418091626e-05, "epoch": 6.524444444444445, "percentage": 65.54, "elapsed_time": "3:15:13", "remaining_time": "1:42:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 368, "total_steps": 560, "loss": 0.1658, "learning_rate": 3.173294878168025e-05, "epoch": 6.542222222222223, "percentage": 65.71, "elapsed_time": "3:15:42", "remaining_time": "1:42:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 369, "total_steps": 560, "loss": 0.1341, "learning_rate": 3.1443183895778105e-05, "epoch": 6.5600000000000005, "percentage": 65.89, "elapsed_time": "3:16:05", "remaining_time": "1:41:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 370, "total_steps": 560, "loss": 0.1746, "learning_rate": 3.115414001894974e-05, "epoch": 6.5777777777777775, "percentage": 66.07, "elapsed_time": "3:16:30", "remaining_time": "1:40:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 371, "total_steps": 560, "loss": 0.1655, "learning_rate": 3.086582838174551e-05, "epoch": 6.595555555555555, "percentage": 66.25, "elapsed_time": "3:17:03", "remaining_time": "1:40:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 372, "total_steps": 560, "loss": 0.1489, "learning_rate": 3.0578260186265265e-05, "epoch": 6.613333333333333, "percentage": 66.43, "elapsed_time": "3:17:32", "remaining_time": "1:39:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 373, "total_steps": 560, "loss": 0.1327, "learning_rate": 3.029144660572304e-05, "epoch": 6.631111111111111, "percentage": 66.61, "elapsed_time": "3:17:54", "remaining_time": "1:39:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 374, "total_steps": 560, "loss": 0.1593, "learning_rate": 3.000539878401296e-05, "epoch": 6.648888888888889, "percentage": 66.79, "elapsed_time": "3:18:30", "remaining_time": "1:38:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 375, "total_steps": 560, "loss": 0.1551, "learning_rate": 2.9720127835276256e-05, "epoch": 6.666666666666667, "percentage": 66.96, "elapsed_time": "3:19:05", "remaining_time": "1:38:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 376, "total_steps": 560, "loss": 0.1526, "learning_rate": 2.9435644843469436e-05, "epoch": 6.684444444444445, "percentage": 67.14, "elapsed_time": "3:19:36", "remaining_time": "1:37:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 377, "total_steps": 560, "loss": 0.183, "learning_rate": 2.9151960861933614e-05, "epoch": 6.702222222222222, "percentage": 67.32, "elapsed_time": "3:20:14", "remaining_time": "1:37:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 378, "total_steps": 560, "loss": 0.1624, "learning_rate": 2.886908691296504e-05, "epoch": 6.72, "percentage": 67.5, "elapsed_time": "3:20:39", "remaining_time": "1:36:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 379, "total_steps": 560, "loss": 0.1373, "learning_rate": 2.858703398738686e-05, "epoch": 6.737777777777778, "percentage": 67.68, "elapsed_time": "3:21:07", "remaining_time": "1:36:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 380, "total_steps": 560, "loss": 0.1786, "learning_rate": 2.8305813044122097e-05, "epoch": 6.7555555555555555, "percentage": 67.86, "elapsed_time": "3:21:42", "remaining_time": "1:35:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 381, "total_steps": 560, "loss": 0.1432, "learning_rate": 2.8025435009767747e-05, "epoch": 6.773333333333333, "percentage": 68.04, "elapsed_time": "3:22:12", "remaining_time": "1:35:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 382, "total_steps": 560, "loss": 0.1483, "learning_rate": 2.774591077817038e-05, "epoch": 6.791111111111111, "percentage": 68.21, "elapsed_time": "3:22:33", "remaining_time": "1:34:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 383, "total_steps": 560, "loss": 0.1709, "learning_rate": 2.746725121000273e-05, "epoch": 6.808888888888889, "percentage": 68.39, "elapsed_time": "3:23:10", "remaining_time": "1:33:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 384, "total_steps": 560, "loss": 0.1944, "learning_rate": 2.718946713234185e-05, "epoch": 6.826666666666666, "percentage": 68.57, "elapsed_time": "3:23:51", "remaining_time": "1:33:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 385, "total_steps": 560, "loss": 0.1471, "learning_rate": 2.6912569338248315e-05, "epoch": 6.844444444444444, "percentage": 68.75, "elapsed_time": "3:24:22", "remaining_time": "1:32:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 386, "total_steps": 560, "loss": 0.1755, "learning_rate": 2.66365685863469e-05, "epoch": 6.862222222222222, "percentage": 68.93, "elapsed_time": "3:24:57", "remaining_time": "1:32:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 387, "total_steps": 560, "loss": 0.1354, "learning_rate": 2.636147560040866e-05, "epoch": 6.88, "percentage": 69.11, "elapsed_time": "3:25:27", "remaining_time": "1:31:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 388, "total_steps": 560, "loss": 0.1803, "learning_rate": 2.6087301068934106e-05, "epoch": 6.897777777777778, "percentage": 69.29, "elapsed_time": "3:26:02", "remaining_time": "1:31:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 389, "total_steps": 560, "loss": 0.1762, "learning_rate": 2.581405564473801e-05, "epoch": 6.915555555555556, "percentage": 69.46, "elapsed_time": "3:26:47", "remaining_time": "1:30:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 390, "total_steps": 560, "loss": 0.1644, "learning_rate": 2.5541749944535554e-05, "epoch": 6.933333333333334, "percentage": 69.64, "elapsed_time": "3:27:28", "remaining_time": "1:30:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 391, "total_steps": 560, "loss": 0.1719, "learning_rate": 2.527039454852963e-05, "epoch": 6.9511111111111115, "percentage": 69.82, "elapsed_time": "3:28:01", "remaining_time": "1:29:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 392, "total_steps": 560, "loss": 0.1366, "learning_rate": 2.500000000000001e-05, "epoch": 6.968888888888889, "percentage": 70.0, "elapsed_time": "3:28:29", "remaining_time": "1:29:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 393, "total_steps": 560, "loss": 0.155, "learning_rate": 2.473057680489348e-05, "epoch": 6.986666666666666, "percentage": 70.18, "elapsed_time": "3:28:57", "remaining_time": "1:28:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 394, "total_steps": 560, "loss": 0.1627, "learning_rate": 2.4462135431415733e-05, "epoch": 7.004444444444444, "percentage": 70.36, "elapsed_time": "3:29:38", "remaining_time": "1:28:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 395, "total_steps": 560, "loss": 0.1384, "learning_rate": 2.4194686309624663e-05, "epoch": 7.022222222222222, "percentage": 70.54, "elapsed_time": "3:30:05", "remaining_time": "1:27:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 396, "total_steps": 560, "loss": 0.1731, "learning_rate": 2.39282398310251e-05, "epoch": 7.04, "percentage": 70.71, "elapsed_time": "3:30:40", "remaining_time": "1:27:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 397, "total_steps": 560, "loss": 0.1471, "learning_rate": 2.366280634816496e-05, "epoch": 7.057777777777778, "percentage": 70.89, "elapsed_time": "3:31:13", "remaining_time": "1:26:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 398, "total_steps": 560, "loss": 0.1066, "learning_rate": 2.3398396174233178e-05, "epoch": 7.075555555555556, "percentage": 71.07, "elapsed_time": "3:31:29", "remaining_time": "1:26:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 399, "total_steps": 560, "loss": 0.1201, "learning_rate": 2.3135019582658802e-05, "epoch": 7.093333333333334, "percentage": 71.25, "elapsed_time": "3:31:55", "remaining_time": "1:25:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 400, "total_steps": 560, "loss": 0.1401, "learning_rate": 2.2872686806712035e-05, "epoch": 7.111111111111111, "percentage": 71.43, "elapsed_time": "3:32:35", "remaining_time": "1:25:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 401, "total_steps": 560, "loss": 0.1096, "learning_rate": 2.261140803910644e-05, "epoch": 7.128888888888889, "percentage": 71.61, "elapsed_time": "3:33:02", "remaining_time": "1:24:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 402, "total_steps": 560, "loss": 0.1555, "learning_rate": 2.235119343160303e-05, "epoch": 7.1466666666666665, "percentage": 71.79, "elapsed_time": "3:33:42", "remaining_time": "1:23:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 403, "total_steps": 560, "loss": 0.1301, "learning_rate": 2.2092053094615813e-05, "epoch": 7.164444444444444, "percentage": 71.96, "elapsed_time": "3:34:04", "remaining_time": "1:23:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 404, "total_steps": 560, "loss": 0.1345, "learning_rate": 2.1833997096818898e-05, "epoch": 7.182222222222222, "percentage": 72.14, "elapsed_time": "3:34:30", "remaining_time": "1:22:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 405, "total_steps": 560, "loss": 0.1733, "learning_rate": 2.157703546475539e-05, "epoch": 7.2, "percentage": 72.32, "elapsed_time": "3:35:12", "remaining_time": "1:22:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 406, "total_steps": 560, "loss": 0.1491, "learning_rate": 2.132117818244771e-05, "epoch": 7.217777777777778, "percentage": 72.5, "elapsed_time": "3:35:55", "remaining_time": "1:21:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 407, "total_steps": 560, "loss": 0.1226, "learning_rate": 2.1066435191009715e-05, "epoch": 7.235555555555556, "percentage": 72.68, "elapsed_time": "3:36:20", "remaining_time": "1:21:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 408, "total_steps": 560, "loss": 0.1455, "learning_rate": 2.0812816388260518e-05, "epoch": 7.253333333333333, "percentage": 72.86, "elapsed_time": "3:36:52", "remaining_time": "1:20:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 409, "total_steps": 560, "loss": 0.1176, "learning_rate": 2.056033162833977e-05, "epoch": 7.271111111111111, "percentage": 73.04, "elapsed_time": "3:37:18", "remaining_time": "1:20:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 410, "total_steps": 560, "loss": 0.1654, "learning_rate": 2.0308990721324927e-05, "epoch": 7.288888888888889, "percentage": 73.21, "elapsed_time": "3:37:51", "remaining_time": "1:19:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 411, "total_steps": 560, "loss": 0.1741, "learning_rate": 2.0058803432849987e-05, "epoch": 7.306666666666667, "percentage": 73.39, "elapsed_time": "3:38:26", "remaining_time": "1:19:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 412, "total_steps": 560, "loss": 0.1198, "learning_rate": 1.980977948372612e-05, "epoch": 7.3244444444444445, "percentage": 73.57, "elapsed_time": "3:38:50", "remaining_time": "1:18:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 413, "total_steps": 560, "loss": 0.1176, "learning_rate": 1.9561928549563968e-05, "epoch": 7.342222222222222, "percentage": 73.75, "elapsed_time": "3:39:16", "remaining_time": "1:18:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 414, "total_steps": 560, "loss": 0.1487, "learning_rate": 1.931526026039764e-05, "epoch": 7.36, "percentage": 73.93, "elapsed_time": "3:39:44", "remaining_time": "1:17:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 415, "total_steps": 560, "loss": 0.1809, "learning_rate": 1.906978420031059e-05, "epoch": 7.377777777777778, "percentage": 74.11, "elapsed_time": "3:40:14", "remaining_time": "1:16:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 416, "total_steps": 560, "loss": 0.1134, "learning_rate": 1.8825509907063327e-05, "epoch": 7.395555555555555, "percentage": 74.29, "elapsed_time": "3:40:32", "remaining_time": "1:16:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 417, "total_steps": 560, "loss": 0.1467, "learning_rate": 1.8582446871722636e-05, "epoch": 7.413333333333333, "percentage": 74.46, "elapsed_time": "3:41:08", "remaining_time": "1:15:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 418, "total_steps": 560, "loss": 0.1813, "learning_rate": 1.8340604538293015e-05, "epoch": 7.431111111111111, "percentage": 74.64, "elapsed_time": "3:41:55", "remaining_time": "1:15:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 419, "total_steps": 560, "loss": 0.1514, "learning_rate": 1.8099992303349577e-05, "epoch": 7.448888888888889, "percentage": 74.82, "elapsed_time": "3:42:15", "remaining_time": "1:14:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 420, "total_steps": 560, "loss": 0.1348, "learning_rate": 1.7860619515673033e-05, "epoch": 7.466666666666667, "percentage": 75.0, "elapsed_time": "3:42:41", "remaining_time": "1:14:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 421, "total_steps": 560, "loss": 0.127, "learning_rate": 1.7622495475886487e-05, "epoch": 7.484444444444445, "percentage": 75.18, "elapsed_time": "3:43:09", "remaining_time": "1:13:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 422, "total_steps": 560, "loss": 0.1081, "learning_rate": 1.738562943609396e-05, "epoch": 7.502222222222223, "percentage": 75.36, "elapsed_time": "3:43:35", "remaining_time": "1:13:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 423, "total_steps": 560, "loss": 0.1875, "learning_rate": 1.7150030599520984e-05, "epoch": 7.52, "percentage": 75.54, "elapsed_time": "3:44:09", "remaining_time": "1:12:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 424, "total_steps": 560, "loss": 0.1278, "learning_rate": 1.691570812015704e-05, "epoch": 7.5377777777777775, "percentage": 75.71, "elapsed_time": "3:44:35", "remaining_time": "1:12:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 425, "total_steps": 560, "loss": 0.1391, "learning_rate": 1.6682671102399805e-05, "epoch": 7.555555555555555, "percentage": 75.89, "elapsed_time": "3:45:07", "remaining_time": "1:11:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 426, "total_steps": 560, "loss": 0.1568, "learning_rate": 1.6450928600701504e-05, "epoch": 7.573333333333333, "percentage": 76.07, "elapsed_time": "3:45:57", "remaining_time": "1:11:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 427, "total_steps": 560, "loss": 0.1352, "learning_rate": 1.622048961921699e-05, "epoch": 7.591111111111111, "percentage": 76.25, "elapsed_time": "3:46:33", "remaining_time": "1:10:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 428, "total_steps": 560, "loss": 0.1635, "learning_rate": 1.599136311145402e-05, "epoch": 7.608888888888889, "percentage": 76.43, "elapsed_time": "3:47:14", "remaining_time": "1:10:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 429, "total_steps": 560, "loss": 0.1637, "learning_rate": 1.5763557979925324e-05, "epoch": 7.626666666666667, "percentage": 76.61, "elapsed_time": "3:47:52", "remaining_time": "1:09:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 430, "total_steps": 560, "loss": 0.1537, "learning_rate": 1.553708307580265e-05, "epoch": 7.644444444444445, "percentage": 76.79, "elapsed_time": "3:48:30", "remaining_time": "1:09:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 431, "total_steps": 560, "loss": 0.1205, "learning_rate": 1.531194719857292e-05, "epoch": 7.662222222222223, "percentage": 76.96, "elapsed_time": "3:48:52", "remaining_time": "1:08:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 432, "total_steps": 560, "loss": 0.128, "learning_rate": 1.5088159095696363e-05, "epoch": 7.68, "percentage": 77.14, "elapsed_time": "3:49:23", "remaining_time": "1:07:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 433, "total_steps": 560, "loss": 0.1254, "learning_rate": 1.4865727462266543e-05, "epoch": 7.697777777777778, "percentage": 77.32, "elapsed_time": "3:49:50", "remaining_time": "1:07:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 434, "total_steps": 560, "loss": 0.1451, "learning_rate": 1.4644660940672627e-05, "epoch": 7.7155555555555555, "percentage": 77.5, "elapsed_time": "3:50:25", "remaining_time": "1:06:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 435, "total_steps": 560, "loss": 0.1285, "learning_rate": 1.4424968120263504e-05, "epoch": 7.733333333333333, "percentage": 77.68, "elapsed_time": "3:50:52", "remaining_time": "1:06:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 436, "total_steps": 560, "loss": 0.1817, "learning_rate": 1.4206657537014079e-05, "epoch": 7.751111111111111, "percentage": 77.86, "elapsed_time": "3:51:24", "remaining_time": "1:05:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 437, "total_steps": 560, "loss": 0.1569, "learning_rate": 1.398973767319368e-05, "epoch": 7.768888888888889, "percentage": 78.04, "elapsed_time": "3:51:59", "remaining_time": "1:05:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 438, "total_steps": 560, "loss": 0.1493, "learning_rate": 1.3774216957036367e-05, "epoch": 7.786666666666667, "percentage": 78.21, "elapsed_time": "3:52:32", "remaining_time": "1:04:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 439, "total_steps": 560, "loss": 0.1215, "learning_rate": 1.3560103762413584e-05, "epoch": 7.804444444444444, "percentage": 78.39, "elapsed_time": "3:52:54", "remaining_time": "1:04:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 440, "total_steps": 560, "loss": 0.1389, "learning_rate": 1.3347406408508695e-05, "epoch": 7.822222222222222, "percentage": 78.57, "elapsed_time": "3:53:34", "remaining_time": "1:03:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 441, "total_steps": 560, "loss": 0.113, "learning_rate": 1.3136133159493802e-05, "epoch": 7.84, "percentage": 78.75, "elapsed_time": "3:53:51", "remaining_time": "1:03:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 442, "total_steps": 560, "loss": 0.1344, "learning_rate": 1.2926292224208664e-05, "epoch": 7.857777777777778, "percentage": 78.93, "elapsed_time": "3:54:21", "remaining_time": "1:02:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 443, "total_steps": 560, "loss": 0.1363, "learning_rate": 1.2717891755841722e-05, "epoch": 7.875555555555556, "percentage": 79.11, "elapsed_time": "3:54:53", "remaining_time": "1:02:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 444, "total_steps": 560, "loss": 0.1293, "learning_rate": 1.2510939851613285e-05, "epoch": 7.8933333333333335, "percentage": 79.29, "elapsed_time": "3:55:23", "remaining_time": "1:01:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 445, "total_steps": 560, "loss": 0.161, "learning_rate": 1.230544455246101e-05, "epoch": 7.911111111111111, "percentage": 79.46, "elapsed_time": "3:56:03", "remaining_time": "1:01:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 446, "total_steps": 560, "loss": 0.1336, "learning_rate": 1.2101413842727345e-05, "epoch": 7.928888888888888, "percentage": 79.64, "elapsed_time": "3:56:37", "remaining_time": "1:00:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 447, "total_steps": 560, "loss": 0.177, "learning_rate": 1.1898855649849461e-05, "epoch": 7.946666666666666, "percentage": 79.82, "elapsed_time": "3:57:29", "remaining_time": "1:00:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 448, "total_steps": 560, "loss": 0.1431, "learning_rate": 1.1697777844051105e-05, "epoch": 7.964444444444444, "percentage": 80.0, "elapsed_time": "3:58:11", "remaining_time": "0:59:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 449, "total_steps": 560, "loss": 0.1503, "learning_rate": 1.1498188238036861e-05, "epoch": 7.982222222222222, "percentage": 80.18, "elapsed_time": "3:58:50", "remaining_time": "0:59:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 450, "total_steps": 560, "loss": 0.1328, "learning_rate": 1.130009458668863e-05, "epoch": 8.0, "percentage": 80.36, "elapsed_time": "3:59:22", "remaining_time": "0:58:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 451, "total_steps": 560, "loss": 0.1182, "learning_rate": 1.1103504586764263e-05, "epoch": 8.017777777777777, "percentage": 80.54, "elapsed_time": "3:59:50", "remaining_time": "0:57:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 452, "total_steps": 560, "loss": 0.1369, "learning_rate": 1.090842587659851e-05, "epoch": 8.035555555555556, "percentage": 80.71, "elapsed_time": "4:00:30", "remaining_time": "0:57:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 453, "total_steps": 560, "loss": 0.1346, "learning_rate": 1.0714866035806326e-05, "epoch": 8.053333333333333, "percentage": 80.89, "elapsed_time": "4:00:58", "remaining_time": "0:56:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 454, "total_steps": 560, "loss": 0.144, "learning_rate": 1.0522832584988234e-05, "epoch": 8.071111111111112, "percentage": 81.07, "elapsed_time": "4:01:37", "remaining_time": "0:56:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 455, "total_steps": 560, "loss": 0.1522, "learning_rate": 1.0332332985438248e-05, "epoch": 8.088888888888889, "percentage": 81.25, "elapsed_time": "4:02:20", "remaining_time": "0:55:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 456, "total_steps": 560, "loss": 0.1347, "learning_rate": 1.0143374638853891e-05, "epoch": 8.106666666666667, "percentage": 81.43, "elapsed_time": "4:02:51", "remaining_time": "0:55:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 457, "total_steps": 560, "loss": 0.1371, "learning_rate": 9.955964887048607e-06, "epoch": 8.124444444444444, "percentage": 81.61, "elapsed_time": "4:03:22", "remaining_time": "0:54:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 458, "total_steps": 560, "loss": 0.1247, "learning_rate": 9.770111011666583e-06, "epoch": 8.142222222222221, "percentage": 81.79, "elapsed_time": "4:03:59", "remaining_time": "0:54:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 459, "total_steps": 560, "loss": 0.1328, "learning_rate": 9.58582023389974e-06, "epoch": 8.16, "percentage": 81.96, "elapsed_time": "4:04:39", "remaining_time": "0:53:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 460, "total_steps": 560, "loss": 0.1485, "learning_rate": 9.403099714207175e-06, "epoch": 8.177777777777777, "percentage": 82.14, "elapsed_time": "4:05:07", "remaining_time": "0:53:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 461, "total_steps": 560, "loss": 0.1226, "learning_rate": 9.221956552036992e-06, "epoch": 8.195555555555556, "percentage": 82.32, "elapsed_time": "4:05:40", "remaining_time": "0:52:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 462, "total_steps": 560, "loss": 0.1297, "learning_rate": 9.042397785550405e-06, "epoch": 8.213333333333333, "percentage": 82.5, "elapsed_time": "4:06:15", "remaining_time": "0:52:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 463, "total_steps": 560, "loss": 0.1209, "learning_rate": 8.864430391348332e-06, "epoch": 8.231111111111112, "percentage": 82.68, "elapsed_time": "4:06:49", "remaining_time": "0:51:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 464, "total_steps": 560, "loss": 0.0914, "learning_rate": 8.688061284200266e-06, "epoch": 8.248888888888889, "percentage": 82.86, "elapsed_time": "4:07:13", "remaining_time": "0:51:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 465, "total_steps": 560, "loss": 0.1514, "learning_rate": 8.513297316775625e-06, "epoch": 8.266666666666667, "percentage": 83.04, "elapsed_time": "4:07:47", "remaining_time": "0:50:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 466, "total_steps": 560, "loss": 0.1336, "learning_rate": 8.34014527937756e-06, "epoch": 8.284444444444444, "percentage": 83.21, "elapsed_time": "4:08:15", "remaining_time": "0:50:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 467, "total_steps": 560, "loss": 0.1287, "learning_rate": 8.168611899679013e-06, "epoch": 8.302222222222222, "percentage": 83.39, "elapsed_time": "4:08:46", "remaining_time": "0:49:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 468, "total_steps": 560, "loss": 0.1336, "learning_rate": 7.998703842461431e-06, "epoch": 8.32, "percentage": 83.57, "elapsed_time": "4:09:11", "remaining_time": "0:48:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 469, "total_steps": 560, "loss": 0.1321, "learning_rate": 7.830427709355725e-06, "epoch": 8.337777777777777, "percentage": 83.75, "elapsed_time": "4:09:53", "remaining_time": "0:48:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 470, "total_steps": 560, "loss": 0.1072, "learning_rate": 7.663790038585793e-06, "epoch": 8.355555555555556, "percentage": 83.93, "elapsed_time": "4:10:12", "remaining_time": "0:47:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 471, "total_steps": 560, "loss": 0.1336, "learning_rate": 7.498797304714544e-06, "epoch": 8.373333333333333, "percentage": 84.11, "elapsed_time": "4:10:48", "remaining_time": "0:47:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 472, "total_steps": 560, "loss": 0.1141, "learning_rate": 7.33545591839222e-06, "epoch": 8.391111111111112, "percentage": 84.29, "elapsed_time": "4:11:19", "remaining_time": "0:46:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 473, "total_steps": 560, "loss": 0.1143, "learning_rate": 7.173772226107434e-06, "epoch": 8.408888888888889, "percentage": 84.46, "elapsed_time": "4:11:45", "remaining_time": "0:46:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 474, "total_steps": 560, "loss": 0.1242, "learning_rate": 7.013752509940485e-06, "epoch": 8.426666666666666, "percentage": 84.64, "elapsed_time": "4:12:26", "remaining_time": "0:45:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 475, "total_steps": 560, "loss": 0.1302, "learning_rate": 6.855402987319348e-06, "epoch": 8.444444444444445, "percentage": 84.82, "elapsed_time": "4:12:54", "remaining_time": "0:45:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 476, "total_steps": 560, "loss": 0.1245, "learning_rate": 6.698729810778065e-06, "epoch": 8.462222222222222, "percentage": 85.0, "elapsed_time": "4:13:24", "remaining_time": "0:44:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 477, "total_steps": 560, "loss": 0.134, "learning_rate": 6.54373906771768e-06, "epoch": 8.48, "percentage": 85.18, "elapsed_time": "4:13:59", "remaining_time": "0:44:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 478, "total_steps": 560, "loss": 0.1106, "learning_rate": 6.390436780169734e-06, "epoch": 8.497777777777777, "percentage": 85.36, "elapsed_time": "4:14:25", "remaining_time": "0:43:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 479, "total_steps": 560, "loss": 0.1309, "learning_rate": 6.238828904562316e-06, "epoch": 8.515555555555556, "percentage": 85.54, "elapsed_time": "4:15:03", "remaining_time": "0:43:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 480, "total_steps": 560, "loss": 0.1263, "learning_rate": 6.088921331488568e-06, "epoch": 8.533333333333333, "percentage": 85.71, "elapsed_time": "4:15:25", "remaining_time": "0:42:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 481, "total_steps": 560, "loss": 0.1018, "learning_rate": 5.94071988547788e-06, "epoch": 8.551111111111112, "percentage": 85.89, "elapsed_time": "4:15:53", "remaining_time": "0:42:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 482, "total_steps": 560, "loss": 0.1568, "learning_rate": 5.794230324769517e-06, "epoch": 8.568888888888889, "percentage": 86.07, "elapsed_time": "4:16:33", "remaining_time": "0:41:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 483, "total_steps": 560, "loss": 0.1537, "learning_rate": 5.649458341088915e-06, "epoch": 8.586666666666666, "percentage": 86.25, "elapsed_time": "4:17:08", "remaining_time": "0:40:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 484, "total_steps": 560, "loss": 0.1364, "learning_rate": 5.506409559426573e-06, "epoch": 8.604444444444445, "percentage": 86.43, "elapsed_time": "4:17:45", "remaining_time": "0:40:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 485, "total_steps": 560, "loss": 0.1214, "learning_rate": 5.365089537819434e-06, "epoch": 8.622222222222222, "percentage": 86.61, "elapsed_time": "4:18:07", "remaining_time": "0:39:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 486, "total_steps": 560, "loss": 0.1029, "learning_rate": 5.2255037671349535e-06, "epoch": 8.64, "percentage": 86.79, "elapsed_time": "4:18:30", "remaining_time": "0:39:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 487, "total_steps": 560, "loss": 0.1279, "learning_rate": 5.087657670857798e-06, "epoch": 8.657777777777778, "percentage": 86.96, "elapsed_time": "4:19:03", "remaining_time": "0:38:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 488, "total_steps": 560, "loss": 0.1055, "learning_rate": 4.951556604879048e-06, "epoch": 8.675555555555556, "percentage": 87.14, "elapsed_time": "4:19:20", "remaining_time": "0:38:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 489, "total_steps": 560, "loss": 0.1115, "learning_rate": 4.8172058572881765e-06, "epoch": 8.693333333333333, "percentage": 87.32, "elapsed_time": "4:19:40", "remaining_time": "0:37:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 490, "total_steps": 560, "loss": 0.1337, "learning_rate": 4.684610648167503e-06, "epoch": 8.71111111111111, "percentage": 87.5, "elapsed_time": "4:20:17", "remaining_time": "0:37:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 491, "total_steps": 560, "loss": 0.1677, "learning_rate": 4.5537761293894535e-06, "epoch": 8.72888888888889, "percentage": 87.68, "elapsed_time": "4:21:01", "remaining_time": "0:36:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 492, "total_steps": 560, "loss": 0.1281, "learning_rate": 4.424707384416344e-06, "epoch": 8.746666666666666, "percentage": 87.86, "elapsed_time": "4:21:32", "remaining_time": "0:36:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 493, "total_steps": 560, "loss": 0.1464, "learning_rate": 4.29740942810285e-06, "epoch": 8.764444444444445, "percentage": 88.04, "elapsed_time": "4:22:09", "remaining_time": "0:35:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 494, "total_steps": 560, "loss": 0.1266, "learning_rate": 4.1718872065011904e-06, "epoch": 8.782222222222222, "percentage": 88.21, "elapsed_time": "4:22:45", "remaining_time": "0:35:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 495, "total_steps": 560, "loss": 0.1355, "learning_rate": 4.048145596668967e-06, "epoch": 8.8, "percentage": 88.39, "elapsed_time": "4:23:27", "remaining_time": "0:34:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 496, "total_steps": 560, "loss": 0.144, "learning_rate": 3.9261894064796135e-06, "epoch": 8.817777777777778, "percentage": 88.57, "elapsed_time": "4:23:59", "remaining_time": "0:34:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 497, "total_steps": 560, "loss": 0.1422, "learning_rate": 3.8060233744356633e-06, "epoch": 8.835555555555555, "percentage": 88.75, "elapsed_time": "4:24:37", "remaining_time": "0:33:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 498, "total_steps": 560, "loss": 0.1472, "learning_rate": 3.687652169484568e-06, "epoch": 8.853333333333333, "percentage": 88.93, "elapsed_time": "4:25:11", "remaining_time": "0:33:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 499, "total_steps": 560, "loss": 0.1145, "learning_rate": 3.5710803908373224e-06, "epoch": 8.87111111111111, "percentage": 89.11, "elapsed_time": "4:25:45", "remaining_time": "0:32:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 500, "total_steps": 560, "loss": 0.1145, "learning_rate": 3.4563125677897932e-06, "epoch": 8.88888888888889, "percentage": 89.29, "elapsed_time": "4:26:14", "remaining_time": "0:31:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 500, "total_steps": 560, "eval_loss": 0.3872971832752228, "epoch": 8.88888888888889, "percentage": 89.29, "elapsed_time": "4:26:58", "remaining_time": "0:32:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 501, "total_steps": 560, "loss": 0.1311, "learning_rate": 3.343353159546675e-06, "epoch": 8.906666666666666, "percentage": 89.46, "elapsed_time": "4:27:31", "remaining_time": "0:31:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 502, "total_steps": 560, "loss": 0.1346, "learning_rate": 3.2322065550483007e-06, "epoch": 8.924444444444445, "percentage": 89.64, "elapsed_time": "4:27:53", "remaining_time": "0:30:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 503, "total_steps": 560, "loss": 0.1145, "learning_rate": 3.1228770728000455e-06, "epoch": 8.942222222222222, "percentage": 89.82, "elapsed_time": "4:28:25", "remaining_time": "0:30:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 504, "total_steps": 560, "loss": 0.1122, "learning_rate": 3.0153689607045845e-06, "epoch": 8.96, "percentage": 90.0, "elapsed_time": "4:28:48", "remaining_time": "0:29:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 505, "total_steps": 560, "loss": 0.155, "learning_rate": 2.9096863958968268e-06, "epoch": 8.977777777777778, "percentage": 90.18, "elapsed_time": "4:29:23", "remaining_time": "0:29:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 506, "total_steps": 560, "loss": 0.1568, "learning_rate": 2.8058334845816213e-06, "epoch": 8.995555555555555, "percentage": 90.36, "elapsed_time": "4:30:08", "remaining_time": "0:28:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 507, "total_steps": 560, "loss": 0.129, "learning_rate": 2.7038142618741992e-06, "epoch": 9.013333333333334, "percentage": 90.54, "elapsed_time": "4:30:43", "remaining_time": "0:28:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 508, "total_steps": 560, "loss": 0.1233, "learning_rate": 2.603632691643415e-06, "epoch": 9.03111111111111, "percentage": 90.71, "elapsed_time": "4:31:10", "remaining_time": "0:27:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 509, "total_steps": 560, "loss": 0.1235, "learning_rate": 2.5052926663577e-06, "epoch": 9.04888888888889, "percentage": 90.89, "elapsed_time": "4:31:44", "remaining_time": "0:27:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 510, "total_steps": 560, "loss": 0.1068, "learning_rate": 2.408798006933882e-06, "epoch": 9.066666666666666, "percentage": 91.07, "elapsed_time": "4:32:11", "remaining_time": "0:26:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 511, "total_steps": 560, "loss": 0.1364, "learning_rate": 2.314152462588659e-06, "epoch": 9.084444444444445, "percentage": 91.25, "elapsed_time": "4:32:37", "remaining_time": "0:26:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 512, "total_steps": 560, "loss": 0.1492, "learning_rate": 2.221359710692961e-06, "epoch": 9.102222222222222, "percentage": 91.43, "elapsed_time": "4:33:06", "remaining_time": "0:25:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 513, "total_steps": 560, "loss": 0.1079, "learning_rate": 2.1304233566290964e-06, "epoch": 9.12, "percentage": 91.61, "elapsed_time": "4:33:45", "remaining_time": "0:25:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 514, "total_steps": 560, "loss": 0.1298, "learning_rate": 2.041346933650612e-06, "epoch": 9.137777777777778, "percentage": 91.79, "elapsed_time": "4:34:15", "remaining_time": "0:24:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 515, "total_steps": 560, "loss": 0.1046, "learning_rate": 1.9541339027450256e-06, "epoch": 9.155555555555555, "percentage": 91.96, "elapsed_time": "4:34:41", "remaining_time": "0:24:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 516, "total_steps": 560, "loss": 0.1129, "learning_rate": 1.8687876524993987e-06, "epoch": 9.173333333333334, "percentage": 92.14, "elapsed_time": "4:35:13", "remaining_time": "0:23:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 517, "total_steps": 560, "loss": 0.1036, "learning_rate": 1.785311498968617e-06, "epoch": 9.19111111111111, "percentage": 92.32, "elapsed_time": "4:35:33", "remaining_time": "0:22:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 518, "total_steps": 560, "loss": 0.1266, "learning_rate": 1.70370868554659e-06, "epoch": 9.20888888888889, "percentage": 92.5, "elapsed_time": "4:36:07", "remaining_time": "0:22:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 519, "total_steps": 560, "loss": 0.1162, "learning_rate": 1.6239823828401945e-06, "epoch": 9.226666666666667, "percentage": 92.68, "elapsed_time": "4:36:34", "remaining_time": "0:21:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 520, "total_steps": 560, "loss": 0.1179, "learning_rate": 1.5461356885461075e-06, "epoch": 9.244444444444444, "percentage": 92.86, "elapsed_time": "4:37:01", "remaining_time": "0:21:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 521, "total_steps": 560, "loss": 0.1342, "learning_rate": 1.4701716273304521e-06, "epoch": 9.262222222222222, "percentage": 93.04, "elapsed_time": "4:37:42", "remaining_time": "0:20:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 522, "total_steps": 560, "loss": 0.1196, "learning_rate": 1.3960931507112752e-06, "epoch": 9.28, "percentage": 93.21, "elapsed_time": "4:38:20", "remaining_time": "0:20:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 523, "total_steps": 560, "loss": 0.1205, "learning_rate": 1.3239031369438326e-06, "epoch": 9.297777777777778, "percentage": 93.39, "elapsed_time": "4:38:42", "remaining_time": "0:19:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 524, "total_steps": 560, "loss": 0.1159, "learning_rate": 1.2536043909088191e-06, "epoch": 9.315555555555555, "percentage": 93.57, "elapsed_time": "4:39:07", "remaining_time": "0:19:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 525, "total_steps": 560, "loss": 0.1529, "learning_rate": 1.1851996440033319e-06, "epoch": 9.333333333333334, "percentage": 93.75, "elapsed_time": "4:39:53", "remaining_time": "0:18:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 526, "total_steps": 560, "loss": 0.1398, "learning_rate": 1.118691554034773e-06, "epoch": 9.351111111111111, "percentage": 93.93, "elapsed_time": "4:40:24", "remaining_time": "0:18:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 527, "total_steps": 560, "loss": 0.1054, "learning_rate": 1.0540827051175818e-06, "epoch": 9.36888888888889, "percentage": 94.11, "elapsed_time": "4:40:53", "remaining_time": "0:17:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 528, "total_steps": 560, "loss": 0.1361, "learning_rate": 9.913756075728087e-07, "epoch": 9.386666666666667, "percentage": 94.29, "elapsed_time": "4:41:32", "remaining_time": "0:17:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 529, "total_steps": 560, "loss": 0.0994, "learning_rate": 9.305726978306173e-07, "epoch": 9.404444444444444, "percentage": 94.46, "elapsed_time": "4:42:01", "remaining_time": "0:16:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 530, "total_steps": 560, "loss": 0.1426, "learning_rate": 8.716763383355864e-07, "epoch": 9.422222222222222, "percentage": 94.64, "elapsed_time": "4:42:41", "remaining_time": "0:16:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 531, "total_steps": 560, "loss": 0.1543, "learning_rate": 8.146888174549339e-07, "epoch": 9.44, "percentage": 94.82, "elapsed_time": "4:43:21", "remaining_time": "0:15:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 532, "total_steps": 560, "loss": 0.124, "learning_rate": 7.596123493895991e-07, "epoch": 9.457777777777778, "percentage": 95.0, "elapsed_time": "4:43:57", "remaining_time": "0:14:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 533, "total_steps": 560, "loss": 0.1438, "learning_rate": 7.064490740882057e-07, "epoch": 9.475555555555555, "percentage": 95.18, "elapsed_time": "4:44:36", "remaining_time": "0:14:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 534, "total_steps": 560, "loss": 0.1099, "learning_rate": 6.552010571639456e-07, "epoch": 9.493333333333334, "percentage": 95.36, "elapsed_time": "4:45:03", "remaining_time": "0:13:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 535, "total_steps": 560, "loss": 0.1444, "learning_rate": 6.058702898142643e-07, "epoch": 9.511111111111111, "percentage": 95.54, "elapsed_time": "4:45:41", "remaining_time": "0:13:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 536, "total_steps": 560, "loss": 0.1354, "learning_rate": 5.584586887435739e-07, "epoch": 9.528888888888888, "percentage": 95.71, "elapsed_time": "4:46:24", "remaining_time": "0:12:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 537, "total_steps": 560, "loss": 0.1367, "learning_rate": 5.129680960887007e-07, "epoch": 9.546666666666667, "percentage": 95.89, "elapsed_time": "4:46:59", "remaining_time": "0:12:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 538, "total_steps": 560, "loss": 0.1215, "learning_rate": 4.6940027934735954e-07, "epoch": 9.564444444444444, "percentage": 96.07, "elapsed_time": "4:47:25", "remaining_time": "0:11:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 539, "total_steps": 560, "loss": 0.0906, "learning_rate": 4.277569313094809e-07, "epoch": 9.582222222222223, "percentage": 96.25, "elapsed_time": "4:47:49", "remaining_time": "0:11:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 540, "total_steps": 560, "loss": 0.0995, "learning_rate": 3.8803966999139684e-07, "epoch": 9.6, "percentage": 96.43, "elapsed_time": "4:48:15", "remaining_time": "0:10:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 541, "total_steps": 560, "loss": 0.1209, "learning_rate": 3.50250038573019e-07, "epoch": 9.617777777777778, "percentage": 96.61, "elapsed_time": "4:48:43", "remaining_time": "0:10:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 542, "total_steps": 560, "loss": 0.1201, "learning_rate": 3.143895053378698e-07, "epoch": 9.635555555555555, "percentage": 96.79, "elapsed_time": "4:49:18", "remaining_time": "0:09:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 543, "total_steps": 560, "loss": 0.1151, "learning_rate": 2.8045946361601183e-07, "epoch": 9.653333333333332, "percentage": 96.96, "elapsed_time": "4:49:48", "remaining_time": "0:09:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 544, "total_steps": 560, "loss": 0.1356, "learning_rate": 2.4846123172992954e-07, "epoch": 9.671111111111111, "percentage": 97.14, "elapsed_time": "4:50:21", "remaining_time": "0:08:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 545, "total_steps": 560, "loss": 0.1461, "learning_rate": 2.1839605294330933e-07, "epoch": 9.688888888888888, "percentage": 97.32, "elapsed_time": "4:50:58", "remaining_time": "0:08:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 546, "total_steps": 560, "loss": 0.1065, "learning_rate": 1.9026509541272275e-07, "epoch": 9.706666666666667, "percentage": 97.5, "elapsed_time": "4:51:32", "remaining_time": "0:07:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 547, "total_steps": 560, "loss": 0.1043, "learning_rate": 1.640694521422459e-07, "epoch": 9.724444444444444, "percentage": 97.68, "elapsed_time": "4:51:57", "remaining_time": "0:06:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 548, "total_steps": 560, "loss": 0.1214, "learning_rate": 1.3981014094099353e-07, "epoch": 9.742222222222223, "percentage": 97.86, "elapsed_time": "4:52:27", "remaining_time": "0:06:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 549, "total_steps": 560, "loss": 0.1368, "learning_rate": 1.1748810438355628e-07, "epoch": 9.76, "percentage": 98.04, "elapsed_time": "4:53:01", "remaining_time": "0:05:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 550, "total_steps": 560, "loss": 0.136, "learning_rate": 9.710420977340762e-08, "epoch": 9.777777777777779, "percentage": 98.21, "elapsed_time": "4:53:36", "remaining_time": "0:05:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 551, "total_steps": 560, "loss": 0.126, "learning_rate": 7.865924910916977e-08, "epoch": 9.795555555555556, "percentage": 98.39, "elapsed_time": "4:54:13", "remaining_time": "0:04:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 552, "total_steps": 560, "loss": 0.1457, "learning_rate": 6.215393905388278e-08, "epoch": 9.813333333333333, "percentage": 98.57, "elapsed_time": "4:54:51", "remaining_time": "0:04:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 553, "total_steps": 560, "loss": 0.1103, "learning_rate": 4.7588920907110094e-08, "epoch": 9.831111111111111, "percentage": 98.75, "elapsed_time": "4:55:18", "remaining_time": "0:03:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 554, "total_steps": 560, "loss": 0.1487, "learning_rate": 3.496476058006959e-08, "epoch": 9.848888888888888, "percentage": 98.93, "elapsed_time": "4:55:54", "remaining_time": "0:03:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 555, "total_steps": 560, "loss": 0.1124, "learning_rate": 2.4281948573617874e-08, "epoch": 9.866666666666667, "percentage": 99.11, "elapsed_time": "4:56:26", "remaining_time": "0:02:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 556, "total_steps": 560, "loss": 0.1004, "learning_rate": 1.5540899959187727e-08, "epoch": 9.884444444444444, "percentage": 99.29, "elapsed_time": "4:56:50", "remaining_time": "0:02:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 557, "total_steps": 560, "loss": 0.1479, "learning_rate": 8.741954362678772e-09, "epoch": 9.902222222222223, "percentage": 99.46, "elapsed_time": "4:57:22", "remaining_time": "0:01:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 558, "total_steps": 560, "loss": 0.1138, "learning_rate": 3.885375951256931e-09, "epoch": 9.92, "percentage": 99.64, "elapsed_time": "4:57:52", "remaining_time": "0:01:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 559, "total_steps": 560, "loss": 0.1207, "learning_rate": 9.713534230904041e-10, "epoch": 9.937777777777779, "percentage": 99.82, "elapsed_time": "4:58:15", "remaining_time": "0:00:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 560, "total_steps": 560, "loss": 0.1334, "learning_rate": 0.0, "epoch": 9.955555555555556, "percentage": 100.0, "elapsed_time": "4:58:48", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 560, "total_steps": 560, "epoch": 9.955555555555556, "percentage": 100.0, "elapsed_time": "4:58:50", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0}