{"current_steps": 10, "total_steps": 10000, "loss": 0.8354, "accuracy": 0.5, "learning_rate": 5.0000000000000004e-08, "epoch": 0.001, "percentage": 0.1, "elapsed_time": "0:00:20", "remaining_time": "5:41:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20, "total_steps": 10000, "loss": 1.0858, "accuracy": 0.699999988079071, "learning_rate": 1.0000000000000001e-07, "epoch": 0.002, "percentage": 0.2, "elapsed_time": "0:00:37", "remaining_time": "5:15:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 30, "total_steps": 10000, "loss": 1.3177, "accuracy": 0.5, "learning_rate": 1.5000000000000002e-07, "epoch": 0.003, "percentage": 0.3, "elapsed_time": "0:02:28", "remaining_time": "13:40:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 40, "total_steps": 10000, "loss": 0.6804, "accuracy": 0.699999988079071, "learning_rate": 2.0000000000000002e-07, "epoch": 0.004, "percentage": 0.4, "elapsed_time": "0:02:40", "remaining_time": "11:05:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 50, "total_steps": 10000, "loss": 1.0372, "accuracy": 0.4000000059604645, "learning_rate": 2.5000000000000004e-07, "epoch": 0.005, "percentage": 0.5, "elapsed_time": "0:02:50", "remaining_time": "9:25:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 60, "total_steps": 10000, "loss": 1.6069, "accuracy": 0.30000001192092896, "learning_rate": 3.0000000000000004e-07, "epoch": 0.006, "percentage": 0.6, "elapsed_time": "0:03:00", "remaining_time": "8:18:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 70, "total_steps": 10000, "loss": 1.3632, "accuracy": 0.5, "learning_rate": 3.5000000000000004e-07, "epoch": 0.007, "percentage": 0.7, "elapsed_time": "0:03:10", "remaining_time": "7:30:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 80, "total_steps": 10000, "loss": 0.5711, "accuracy": 0.800000011920929, "learning_rate": 4.0000000000000003e-07, "epoch": 0.008, "percentage": 0.8, "elapsed_time": "0:03:21", "remaining_time": "6:56:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 90, "total_steps": 10000, "loss": 0.3843, "accuracy": 0.800000011920929, "learning_rate": 4.5000000000000003e-07, "epoch": 0.009, "percentage": 0.9, "elapsed_time": "0:03:31", "remaining_time": "6:28:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 100, "total_steps": 10000, "loss": 1.0243, "accuracy": 0.6000000238418579, "learning_rate": 5.000000000000001e-07, "epoch": 0.01, "percentage": 1.0, "elapsed_time": "0:03:42", "remaining_time": "6:06:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 110, "total_steps": 10000, "loss": 0.579, "accuracy": 0.800000011920929, "learning_rate": 5.5e-07, "epoch": 0.011, "percentage": 1.1, "elapsed_time": "0:03:58", "remaining_time": "5:56:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 120, "total_steps": 10000, "loss": 1.1696, "accuracy": 0.4000000059604645, "learning_rate": 6.000000000000001e-07, "epoch": 0.012, "percentage": 1.2, "elapsed_time": "0:04:07", "remaining_time": "5:39:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 130, "total_steps": 10000, "loss": 0.7542, "accuracy": 0.699999988079071, "learning_rate": 6.5e-07, "epoch": 0.013, "percentage": 1.3, "elapsed_time": "0:04:17", "remaining_time": "5:25:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 140, "total_steps": 10000, "loss": 0.2059, "accuracy": 0.8999999761581421, "learning_rate": 7.000000000000001e-07, "epoch": 0.014, "percentage": 1.4, "elapsed_time": "0:04:29", "remaining_time": "5:15:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 150, "total_steps": 10000, "loss": 0.1128, "accuracy": 1.0, "learning_rate": 7.5e-07, "epoch": 0.015, "percentage": 1.5, "elapsed_time": "0:04:40", "remaining_time": "5:06:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 160, "total_steps": 10000, "loss": 0.9627, "accuracy": 0.5, "learning_rate": 8.000000000000001e-07, "epoch": 0.016, "percentage": 1.6, "elapsed_time": "0:04:50", "remaining_time": "4:57:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 170, "total_steps": 10000, "loss": 0.122, "accuracy": 1.0, "learning_rate": 8.500000000000001e-07, "epoch": 0.017, "percentage": 1.7, "elapsed_time": "0:05:01", "remaining_time": "4:50:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 180, "total_steps": 10000, "loss": 0.3737, "accuracy": 0.8999999761581421, "learning_rate": 9.000000000000001e-07, "epoch": 0.018, "percentage": 1.8, "elapsed_time": "0:05:11", "remaining_time": "4:42:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 190, "total_steps": 10000, "loss": 0.806, "accuracy": 0.699999988079071, "learning_rate": 9.500000000000001e-07, "epoch": 0.019, "percentage": 1.9, "elapsed_time": "0:05:22", "remaining_time": "4:37:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 200, "total_steps": 10000, "loss": 0.2169, "accuracy": 0.8999999761581421, "learning_rate": 1.0000000000000002e-06, "epoch": 0.02, "percentage": 2.0, "elapsed_time": "0:05:33", "remaining_time": "4:32:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 210, "total_steps": 10000, "loss": 0.136, "accuracy": 1.0, "learning_rate": 1.0500000000000001e-06, "epoch": 0.021, "percentage": 2.1, "elapsed_time": "0:05:44", "remaining_time": "4:27:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 220, "total_steps": 10000, "loss": 1.2207, "accuracy": 0.6000000238418579, "learning_rate": 1.1e-06, "epoch": 0.022, "percentage": 2.2, "elapsed_time": "0:05:54", "remaining_time": "4:22:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 230, "total_steps": 10000, "loss": 0.8165, "accuracy": 0.8999999761581421, "learning_rate": 1.1500000000000002e-06, "epoch": 0.023, "percentage": 2.3, "elapsed_time": "0:06:04", "remaining_time": "4:18:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 240, "total_steps": 10000, "loss": 0.2748, "accuracy": 0.8999999761581421, "learning_rate": 1.2000000000000002e-06, "epoch": 0.024, "percentage": 2.4, "elapsed_time": "0:06:15", "remaining_time": "4:14:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 250, "total_steps": 10000, "loss": 0.6446, "accuracy": 0.800000011920929, "learning_rate": 1.25e-06, "epoch": 0.025, "percentage": 2.5, "elapsed_time": "0:06:26", "remaining_time": "4:11:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 260, "total_steps": 10000, "loss": 0.3227, "accuracy": 0.800000011920929, "learning_rate": 1.3e-06, "epoch": 0.026, "percentage": 2.6, "elapsed_time": "0:06:37", "remaining_time": "4:08:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 270, "total_steps": 10000, "loss": 0.631, "accuracy": 0.6000000238418579, "learning_rate": 1.3500000000000002e-06, "epoch": 0.027, "percentage": 2.7, "elapsed_time": "0:06:47", "remaining_time": "4:04:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 280, "total_steps": 10000, "loss": 0.0141, "accuracy": 1.0, "learning_rate": 1.4000000000000001e-06, "epoch": 0.028, "percentage": 2.8, "elapsed_time": "0:07:00", "remaining_time": "4:03:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 290, "total_steps": 10000, "loss": 0.0695, "accuracy": 1.0, "learning_rate": 1.45e-06, "epoch": 0.029, "percentage": 2.9, "elapsed_time": "0:07:11", "remaining_time": "4:00:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 300, "total_steps": 10000, "loss": 0.0554, "accuracy": 1.0, "learning_rate": 1.5e-06, "epoch": 0.03, "percentage": 3.0, "elapsed_time": "0:07:21", "remaining_time": "3:57:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 310, "total_steps": 10000, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 1.5500000000000002e-06, "epoch": 0.031, "percentage": 3.1, "elapsed_time": "0:07:32", "remaining_time": "3:55:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 320, "total_steps": 10000, "loss": 0.0029, "accuracy": 1.0, "learning_rate": 1.6000000000000001e-06, "epoch": 0.032, "percentage": 3.2, "elapsed_time": "0:07:42", "remaining_time": "3:53:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 330, "total_steps": 10000, "loss": 0.027, "accuracy": 1.0, "learning_rate": 1.6500000000000003e-06, "epoch": 0.033, "percentage": 3.3, "elapsed_time": "0:07:54", "remaining_time": "3:51:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 340, "total_steps": 10000, "loss": 0.8495, "accuracy": 0.8999999761581421, "learning_rate": 1.7000000000000002e-06, "epoch": 0.034, "percentage": 3.4, "elapsed_time": "0:08:04", "remaining_time": "3:49:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 350, "total_steps": 10000, "loss": 0.0637, "accuracy": 1.0, "learning_rate": 1.75e-06, "epoch": 0.035, "percentage": 3.5, "elapsed_time": "0:08:15", "remaining_time": "3:47:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 360, "total_steps": 10000, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 1.8000000000000001e-06, "epoch": 0.036, "percentage": 3.6, "elapsed_time": "0:08:26", "remaining_time": "3:45:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 370, "total_steps": 10000, "loss": 0.0656, "accuracy": 1.0, "learning_rate": 1.85e-06, "epoch": 0.037, "percentage": 3.7, "elapsed_time": "0:08:39", "remaining_time": "3:45:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 380, "total_steps": 10000, "loss": 0.037, "accuracy": 1.0, "learning_rate": 1.9000000000000002e-06, "epoch": 0.038, "percentage": 3.8, "elapsed_time": "0:08:50", "remaining_time": "3:43:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 390, "total_steps": 10000, "loss": 0.9008, "accuracy": 0.699999988079071, "learning_rate": 1.9500000000000004e-06, "epoch": 0.039, "percentage": 3.9, "elapsed_time": "0:09:00", "remaining_time": "3:42:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 400, "total_steps": 10000, "loss": 0.0888, "accuracy": 1.0, "learning_rate": 2.0000000000000003e-06, "epoch": 0.04, "percentage": 4.0, "elapsed_time": "0:09:09", "remaining_time": "3:39:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 410, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.05e-06, "epoch": 0.041, "percentage": 4.1, "elapsed_time": "0:09:19", "remaining_time": "3:37:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 420, "total_steps": 10000, "loss": 0.5212, "accuracy": 0.800000011920929, "learning_rate": 2.1000000000000002e-06, "epoch": 0.042, "percentage": 4.2, "elapsed_time": "0:09:28", "remaining_time": "3:35:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 430, "total_steps": 10000, "loss": 0.5238, "accuracy": 0.800000011920929, "learning_rate": 2.15e-06, "epoch": 0.043, "percentage": 4.3, "elapsed_time": "0:09:38", "remaining_time": "3:34:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 440, "total_steps": 10000, "loss": 0.1815, "accuracy": 0.8999999761581421, "learning_rate": 2.2e-06, "epoch": 0.044, "percentage": 4.4, "elapsed_time": "0:09:47", "remaining_time": "3:32:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 450, "total_steps": 10000, "loss": 0.0933, "accuracy": 0.8999999761581421, "learning_rate": 2.25e-06, "epoch": 0.045, "percentage": 4.5, "elapsed_time": "0:09:58", "remaining_time": "3:31:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 460, "total_steps": 10000, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 2.3000000000000004e-06, "epoch": 0.046, "percentage": 4.6, "elapsed_time": "0:10:07", "remaining_time": "3:30:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 470, "total_steps": 10000, "loss": 0.1292, "accuracy": 0.8999999761581421, "learning_rate": 2.35e-06, "epoch": 0.047, "percentage": 4.7, "elapsed_time": "0:10:18", "remaining_time": "3:29:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 480, "total_steps": 10000, "loss": 0.3037, "accuracy": 0.8999999761581421, "learning_rate": 2.4000000000000003e-06, "epoch": 0.048, "percentage": 4.8, "elapsed_time": "0:10:31", "remaining_time": "3:28:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 490, "total_steps": 10000, "loss": 0.6083, "accuracy": 0.8999999761581421, "learning_rate": 2.4500000000000003e-06, "epoch": 0.049, "percentage": 4.9, "elapsed_time": "0:10:41", "remaining_time": "3:27:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 500, "total_steps": 10000, "loss": 0.024, "accuracy": 1.0, "learning_rate": 2.5e-06, "epoch": 0.05, "percentage": 5.0, "elapsed_time": "0:10:51", "remaining_time": "3:26:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 510, "total_steps": 10000, "loss": 0.0038, "accuracy": 1.0, "learning_rate": 2.55e-06, "epoch": 0.051, "percentage": 5.1, "elapsed_time": "0:11:01", "remaining_time": "3:25:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 520, "total_steps": 10000, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 2.6e-06, "epoch": 0.052, "percentage": 5.2, "elapsed_time": "0:11:11", "remaining_time": "3:24:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 530, "total_steps": 10000, "loss": 0.1536, "accuracy": 0.8999999761581421, "learning_rate": 2.6500000000000005e-06, "epoch": 0.053, "percentage": 5.3, "elapsed_time": "0:11:20", "remaining_time": "3:22:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 540, "total_steps": 10000, "loss": 2.0321, "accuracy": 0.699999988079071, "learning_rate": 2.7000000000000004e-06, "epoch": 0.054, "percentage": 5.4, "elapsed_time": "0:11:30", "remaining_time": "3:21:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 550, "total_steps": 10000, "loss": 0.2331, "accuracy": 0.8999999761581421, "learning_rate": 2.7500000000000004e-06, "epoch": 0.055, "percentage": 5.5, "elapsed_time": "0:11:41", "remaining_time": "3:20:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 560, "total_steps": 10000, "loss": 0.9147, "accuracy": 0.800000011920929, "learning_rate": 2.8000000000000003e-06, "epoch": 0.056, "percentage": 5.6, "elapsed_time": "0:11:51", "remaining_time": "3:19:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 570, "total_steps": 10000, "loss": 0.5182, "accuracy": 0.8999999761581421, "learning_rate": 2.85e-06, "epoch": 0.057, "percentage": 5.7, "elapsed_time": "0:12:04", "remaining_time": "3:19:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 580, "total_steps": 10000, "loss": 0.0091, "accuracy": 1.0, "learning_rate": 2.9e-06, "epoch": 0.058, "percentage": 5.8, "elapsed_time": "0:12:14", "remaining_time": "3:18:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 590, "total_steps": 10000, "loss": 0.0496, "accuracy": 1.0, "learning_rate": 2.95e-06, "epoch": 0.059, "percentage": 5.9, "elapsed_time": "0:12:29", "remaining_time": "3:19:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 600, "total_steps": 10000, "loss": 0.5942, "accuracy": 0.8999999761581421, "learning_rate": 3e-06, "epoch": 0.06, "percentage": 6.0, "elapsed_time": "0:12:40", "remaining_time": "3:18:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 610, "total_steps": 10000, "loss": 0.5041, "accuracy": 0.8999999761581421, "learning_rate": 3.05e-06, "epoch": 0.061, "percentage": 6.1, "elapsed_time": "0:12:50", "remaining_time": "3:17:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 620, "total_steps": 10000, "loss": 0.1221, "accuracy": 0.8999999761581421, "learning_rate": 3.1000000000000004e-06, "epoch": 0.062, "percentage": 6.2, "elapsed_time": "0:13:00", "remaining_time": "3:16:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 630, "total_steps": 10000, "loss": 0.4131, "accuracy": 0.8999999761581421, "learning_rate": 3.1500000000000003e-06, "epoch": 0.063, "percentage": 6.3, "elapsed_time": "0:13:12", "remaining_time": "3:16:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 640, "total_steps": 10000, "loss": 0.0031, "accuracy": 1.0, "learning_rate": 3.2000000000000003e-06, "epoch": 0.064, "percentage": 6.4, "elapsed_time": "0:13:31", "remaining_time": "3:17:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 650, "total_steps": 10000, "loss": 0.0998, "accuracy": 0.8999999761581421, "learning_rate": 3.2500000000000002e-06, "epoch": 0.065, "percentage": 6.5, "elapsed_time": "0:13:41", "remaining_time": "3:16:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 660, "total_steps": 10000, "loss": 1.4947, "accuracy": 0.8999999761581421, "learning_rate": 3.3000000000000006e-06, "epoch": 0.066, "percentage": 6.6, "elapsed_time": "0:13:56", "remaining_time": "3:17:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 670, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.3500000000000005e-06, "epoch": 0.067, "percentage": 6.7, "elapsed_time": "0:14:08", "remaining_time": "3:16:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 680, "total_steps": 10000, "loss": 0.0185, "accuracy": 1.0, "learning_rate": 3.4000000000000005e-06, "epoch": 0.068, "percentage": 6.8, "elapsed_time": "0:14:24", "remaining_time": "3:17:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 690, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.45e-06, "epoch": 0.069, "percentage": 6.9, "elapsed_time": "0:14:34", "remaining_time": "3:16:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 700, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.5e-06, "epoch": 0.07, "percentage": 7.0, "elapsed_time": "0:14:45", "remaining_time": "3:16:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 710, "total_steps": 10000, "loss": 0.008, "accuracy": 1.0, "learning_rate": 3.5500000000000003e-06, "epoch": 0.071, "percentage": 7.1, "elapsed_time": "0:14:56", "remaining_time": "3:15:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 720, "total_steps": 10000, "loss": 0.1291, "accuracy": 0.8999999761581421, "learning_rate": 3.6000000000000003e-06, "epoch": 0.072, "percentage": 7.2, "elapsed_time": "0:15:05", "remaining_time": "3:14:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 730, "total_steps": 10000, "loss": 0.4251, "accuracy": 0.8999999761581421, "learning_rate": 3.65e-06, "epoch": 0.073, "percentage": 7.3, "elapsed_time": "0:15:13", "remaining_time": "3:13:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 740, "total_steps": 10000, "loss": 0.0822, "accuracy": 0.8999999761581421, "learning_rate": 3.7e-06, "epoch": 0.074, "percentage": 7.4, "elapsed_time": "0:15:23", "remaining_time": "3:12:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 750, "total_steps": 10000, "loss": 0.0146, "accuracy": 1.0, "learning_rate": 3.7500000000000005e-06, "epoch": 0.075, "percentage": 7.5, "elapsed_time": "0:15:35", "remaining_time": "3:12:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 760, "total_steps": 10000, "loss": 0.1328, "accuracy": 1.0, "learning_rate": 3.8000000000000005e-06, "epoch": 0.076, "percentage": 7.6, "elapsed_time": "0:15:45", "remaining_time": "3:11:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 770, "total_steps": 10000, "loss": 0.0194, "accuracy": 1.0, "learning_rate": 3.85e-06, "epoch": 0.077, "percentage": 7.7, "elapsed_time": "0:15:56", "remaining_time": "3:11:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 780, "total_steps": 10000, "loss": 0.0177, "accuracy": 1.0, "learning_rate": 3.900000000000001e-06, "epoch": 0.078, "percentage": 7.8, "elapsed_time": "0:16:05", "remaining_time": "3:10:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 790, "total_steps": 10000, "loss": 0.1973, "accuracy": 0.8999999761581421, "learning_rate": 3.95e-06, "epoch": 0.079, "percentage": 7.9, "elapsed_time": "0:16:18", "remaining_time": "3:10:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 800, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.000000000000001e-06, "epoch": 0.08, "percentage": 8.0, "elapsed_time": "0:16:29", "remaining_time": "3:09:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 810, "total_steps": 10000, "loss": 0.1291, "accuracy": 0.8999999761581421, "learning_rate": 4.05e-06, "epoch": 0.081, "percentage": 8.1, "elapsed_time": "0:16:40", "remaining_time": "3:09:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 820, "total_steps": 10000, "loss": 0.0028, "accuracy": 1.0, "learning_rate": 4.1e-06, "epoch": 0.082, "percentage": 8.2, "elapsed_time": "0:16:51", "remaining_time": "3:08:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 830, "total_steps": 10000, "loss": 0.0006, "accuracy": 1.0, "learning_rate": 4.15e-06, "epoch": 0.083, "percentage": 8.3, "elapsed_time": "0:17:01", "remaining_time": "3:08:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 840, "total_steps": 10000, "loss": 0.0019, "accuracy": 1.0, "learning_rate": 4.2000000000000004e-06, "epoch": 0.084, "percentage": 8.4, "elapsed_time": "0:17:11", "remaining_time": "3:07:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 850, "total_steps": 10000, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 4.25e-06, "epoch": 0.085, "percentage": 8.5, "elapsed_time": "0:17:21", "remaining_time": "3:06:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 860, "total_steps": 10000, "loss": 0.0026, "accuracy": 1.0, "learning_rate": 4.3e-06, "epoch": 0.086, "percentage": 8.6, "elapsed_time": "0:17:42", "remaining_time": "3:08:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 870, "total_steps": 10000, "loss": 0.0006, "accuracy": 1.0, "learning_rate": 4.350000000000001e-06, "epoch": 0.087, "percentage": 8.7, "elapsed_time": "0:17:52", "remaining_time": "3:07:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 880, "total_steps": 10000, "loss": 1.691, "accuracy": 0.8999999761581421, "learning_rate": 4.4e-06, "epoch": 0.088, "percentage": 8.8, "elapsed_time": "0:18:02", "remaining_time": "3:06:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 890, "total_steps": 10000, "loss": 1.6639, "accuracy": 0.800000011920929, "learning_rate": 4.450000000000001e-06, "epoch": 0.089, "percentage": 8.9, "elapsed_time": "0:18:13", "remaining_time": "3:06:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 900, "total_steps": 10000, "loss": 0.1378, "accuracy": 0.8999999761581421, "learning_rate": 4.5e-06, "epoch": 0.09, "percentage": 9.0, "elapsed_time": "0:18:23", "remaining_time": "3:05:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 910, "total_steps": 10000, "loss": 0.0008, "accuracy": 1.0, "learning_rate": 4.5500000000000005e-06, "epoch": 0.091, "percentage": 9.1, "elapsed_time": "0:18:34", "remaining_time": "3:05:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 920, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.600000000000001e-06, "epoch": 0.092, "percentage": 9.2, "elapsed_time": "0:18:45", "remaining_time": "3:05:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 930, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.65e-06, "epoch": 0.093, "percentage": 9.3, "elapsed_time": "0:18:55", "remaining_time": "3:04:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 940, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.7e-06, "epoch": 0.094, "percentage": 9.4, "elapsed_time": "0:19:06", "remaining_time": "3:04:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 950, "total_steps": 10000, "loss": 0.8787, "accuracy": 0.8999999761581421, "learning_rate": 4.75e-06, "epoch": 0.095, "percentage": 9.5, "elapsed_time": "0:19:15", "remaining_time": "3:03:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 960, "total_steps": 10000, "loss": 0.2883, "accuracy": 0.8999999761581421, "learning_rate": 4.800000000000001e-06, "epoch": 0.096, "percentage": 9.6, "elapsed_time": "0:19:34", "remaining_time": "3:04:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 970, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.85e-06, "epoch": 0.097, "percentage": 9.7, "elapsed_time": "0:19:53", "remaining_time": "3:05:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 980, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.9000000000000005e-06, "epoch": 0.098, "percentage": 9.8, "elapsed_time": "0:20:07", "remaining_time": "3:05:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 990, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.95e-06, "epoch": 0.099, "percentage": 9.9, "elapsed_time": "0:20:21", "remaining_time": "3:05:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1000, "total_steps": 10000, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 5e-06, "epoch": 0.1, "percentage": 10.0, "elapsed_time": "0:20:29", "remaining_time": "3:04:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1010, "total_steps": 10000, "loss": 0.3016, "accuracy": 0.8999999761581421, "learning_rate": 4.999984769144476e-06, "epoch": 0.101, "percentage": 10.1, "elapsed_time": "0:20:48", "remaining_time": "3:05:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1020, "total_steps": 10000, "loss": 0.0408, "accuracy": 1.0, "learning_rate": 4.999939076763487e-06, "epoch": 0.102, "percentage": 10.2, "elapsed_time": "0:20:59", "remaining_time": "3:04:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1030, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.999862923413781e-06, "epoch": 0.103, "percentage": 10.3, "elapsed_time": "0:21:11", "remaining_time": "3:04:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1040, "total_steps": 10000, "loss": 1.8217, "accuracy": 0.8999999761581421, "learning_rate": 4.999756310023261e-06, "epoch": 0.104, "percentage": 10.4, "elapsed_time": "0:21:24", "remaining_time": "3:04:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1050, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.9996192378909785e-06, "epoch": 0.105, "percentage": 10.5, "elapsed_time": "0:21:37", "remaining_time": "3:04:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1060, "total_steps": 10000, "loss": 1.0262, "accuracy": 0.8999999761581421, "learning_rate": 4.999451708687114e-06, "epoch": 0.106, "percentage": 10.6, "elapsed_time": "0:21:48", "remaining_time": "3:03:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1070, "total_steps": 10000, "loss": 0.0341, "accuracy": 1.0, "learning_rate": 4.9992537244529585e-06, "epoch": 0.107, "percentage": 10.7, "elapsed_time": "0:21:59", "remaining_time": "3:03:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1080, "total_steps": 10000, "loss": 0.0008, "accuracy": 1.0, "learning_rate": 4.999025287600886e-06, "epoch": 0.108, "percentage": 10.8, "elapsed_time": "0:22:10", "remaining_time": "3:03:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1090, "total_steps": 10000, "loss": 0.0734, "accuracy": 0.8999999761581421, "learning_rate": 4.998766400914329e-06, "epoch": 0.109, "percentage": 10.9, "elapsed_time": "0:22:19", "remaining_time": "3:02:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1100, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.99847706754774e-06, "epoch": 0.11, "percentage": 11.0, "elapsed_time": "0:22:29", "remaining_time": "3:02:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1110, "total_steps": 10000, "loss": 1.2719, "accuracy": 0.800000011920929, "learning_rate": 4.998157291026553e-06, "epoch": 0.111, "percentage": 11.1, "elapsed_time": "0:22:41", "remaining_time": "3:01:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1120, "total_steps": 10000, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.997807075247147e-06, "epoch": 0.112, "percentage": 11.2, "elapsed_time": "0:22:54", "remaining_time": "3:01:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1130, "total_steps": 10000, "loss": 0.0778, "accuracy": 0.8999999761581421, "learning_rate": 4.997426424476787e-06, "epoch": 0.113, "percentage": 11.3, "elapsed_time": "0:23:05", "remaining_time": "3:01:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1140, "total_steps": 10000, "loss": 0.0942, "accuracy": 0.8999999761581421, "learning_rate": 4.9970153433535855e-06, "epoch": 0.114, "percentage": 11.4, "elapsed_time": "0:23:13", "remaining_time": "3:00:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1150, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.9965738368864345e-06, "epoch": 0.115, "percentage": 11.5, "elapsed_time": "0:23:23", "remaining_time": "3:00:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1160, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.996101910454953e-06, "epoch": 0.116, "percentage": 11.6, "elapsed_time": "0:23:33", "remaining_time": "2:59:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1170, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.995599569809414e-06, "epoch": 0.117, "percentage": 11.7, "elapsed_time": "0:23:44", "remaining_time": "2:59:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1180, "total_steps": 10000, "loss": 0.268, "accuracy": 0.8999999761581421, "learning_rate": 4.9950668210706795e-06, "epoch": 0.118, "percentage": 11.8, "elapsed_time": "0:23:55", "remaining_time": "2:58:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1190, "total_steps": 10000, "loss": 0.2434, "accuracy": 0.8999999761581421, "learning_rate": 4.994503670730126e-06, "epoch": 0.119, "percentage": 11.9, "elapsed_time": "0:24:07", "remaining_time": "2:58:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1200, "total_steps": 10000, "loss": 0.0264, "accuracy": 1.0, "learning_rate": 4.993910125649561e-06, "epoch": 0.12, "percentage": 12.0, "elapsed_time": "0:24:17", "remaining_time": "2:58:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1210, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.993286193061145e-06, "epoch": 0.121, "percentage": 12.1, "elapsed_time": "0:24:26", "remaining_time": "2:57:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1220, "total_steps": 10000, "loss": 0.0834, "accuracy": 0.8999999761581421, "learning_rate": 4.992631880567301e-06, "epoch": 0.122, "percentage": 12.2, "elapsed_time": "0:24:38", "remaining_time": "2:57:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1230, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.991947196140619e-06, "epoch": 0.123, "percentage": 12.3, "elapsed_time": "0:24:49", "remaining_time": "2:56:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1240, "total_steps": 10000, "loss": 0.0135, "accuracy": 1.0, "learning_rate": 4.9912321481237616e-06, "epoch": 0.124, "percentage": 12.4, "elapsed_time": "0:25:00", "remaining_time": "2:56:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1250, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.990486745229364e-06, "epoch": 0.125, "percentage": 12.5, "elapsed_time": "0:25:11", "remaining_time": "2:56:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1260, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.989710996539926e-06, "epoch": 0.126, "percentage": 12.6, "elapsed_time": "0:25:21", "remaining_time": "2:55:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1270, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.9889049115077e-06, "epoch": 0.127, "percentage": 12.7, "elapsed_time": "0:25:32", "remaining_time": "2:55:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1280, "total_steps": 10000, "loss": 0.0027, "accuracy": 1.0, "learning_rate": 4.988068499954578e-06, "epoch": 0.128, "percentage": 12.8, "elapsed_time": "0:25:41", "remaining_time": "2:54:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1290, "total_steps": 10000, "loss": 0.0012, "accuracy": 1.0, "learning_rate": 4.987201772071971e-06, "epoch": 0.129, "percentage": 12.9, "elapsed_time": "0:25:53", "remaining_time": "2:54:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1300, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.986304738420684e-06, "epoch": 0.13, "percentage": 13.0, "elapsed_time": "0:26:03", "remaining_time": "2:54:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1310, "total_steps": 10000, "loss": 1.3087, "accuracy": 0.8999999761581421, "learning_rate": 4.985377409930789e-06, "epoch": 0.131, "percentage": 13.1, "elapsed_time": "0:26:13", "remaining_time": "2:54:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1320, "total_steps": 10000, "loss": 0.1654, "accuracy": 0.8999999761581421, "learning_rate": 4.984419797901491e-06, "epoch": 0.132, "percentage": 13.2, "elapsed_time": "0:26:25", "remaining_time": "2:53:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1330, "total_steps": 10000, "loss": 0.0457, "accuracy": 1.0, "learning_rate": 4.983431914000991e-06, "epoch": 0.133, "percentage": 13.3, "elapsed_time": "0:26:36", "remaining_time": "2:53:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1340, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.9824137702663424e-06, "epoch": 0.134, "percentage": 13.4, "elapsed_time": "0:26:48", "remaining_time": "2:53:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1350, "total_steps": 10000, "loss": 0.765, "accuracy": 0.8999999761581421, "learning_rate": 4.981365379103306e-06, "epoch": 0.135, "percentage": 13.5, "elapsed_time": "0:26:59", "remaining_time": "2:52:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1360, "total_steps": 10000, "loss": 0.2196, "accuracy": 0.8999999761581421, "learning_rate": 4.980286753286196e-06, "epoch": 0.136, "percentage": 13.6, "elapsed_time": "0:27:11", "remaining_time": "2:52:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1370, "total_steps": 10000, "loss": 0.4068, "accuracy": 0.8999999761581421, "learning_rate": 4.979177905957726e-06, "epoch": 0.137, "percentage": 13.7, "elapsed_time": "0:27:21", "remaining_time": "2:52:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1380, "total_steps": 10000, "loss": 1.068, "accuracy": 0.8999999761581421, "learning_rate": 4.978038850628855e-06, "epoch": 0.138, "percentage": 13.8, "elapsed_time": "0:27:33", "remaining_time": "2:52:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1390, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.9768696011786095e-06, "epoch": 0.139, "percentage": 13.9, "elapsed_time": "0:27:42", "remaining_time": "2:51:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1400, "total_steps": 10000, "loss": 0.0048, "accuracy": 1.0, "learning_rate": 4.975670171853926e-06, "epoch": 0.14, "percentage": 14.0, "elapsed_time": "0:27:53", "remaining_time": "2:51:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1410, "total_steps": 10000, "loss": 0.0006, "accuracy": 1.0, "learning_rate": 4.974440577269473e-06, "epoch": 0.141, "percentage": 14.1, "elapsed_time": "0:28:04", "remaining_time": "2:51:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1420, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.973180832407471e-06, "epoch": 0.142, "percentage": 14.2, "elapsed_time": "0:28:18", "remaining_time": "2:50:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1430, "total_steps": 10000, "loss": 0.399, "accuracy": 0.8999999761581421, "learning_rate": 4.971890952617515e-06, "epoch": 0.143, "percentage": 14.3, "elapsed_time": "0:28:27", "remaining_time": "2:50:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1440, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.970570953616383e-06, "epoch": 0.144, "percentage": 14.4, "elapsed_time": "0:28:38", "remaining_time": "2:50:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1450, "total_steps": 10000, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 4.9692208514878445e-06, "epoch": 0.145, "percentage": 14.5, "elapsed_time": "0:29:02", "remaining_time": "2:51:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1460, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.96784066268247e-06, "epoch": 0.146, "percentage": 14.6, "elapsed_time": "0:29:13", "remaining_time": "2:50:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1470, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.966430404017424e-06, "epoch": 0.147, "percentage": 14.7, "elapsed_time": "0:29:22", "remaining_time": "2:50:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1480, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.964990092676263e-06, "epoch": 0.148, "percentage": 14.8, "elapsed_time": "0:29:33", "remaining_time": "2:50:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1490, "total_steps": 10000, "loss": 0.0079, "accuracy": 1.0, "learning_rate": 4.963519746208726e-06, "epoch": 0.149, "percentage": 14.9, "elapsed_time": "0:29:49", "remaining_time": "2:50:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1500, "total_steps": 10000, "loss": 0.0013, "accuracy": 1.0, "learning_rate": 4.962019382530521e-06, "epoch": 0.15, "percentage": 15.0, "elapsed_time": "0:30:00", "remaining_time": "2:50:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1510, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.960489019923105e-06, "epoch": 0.151, "percentage": 15.1, "elapsed_time": "0:30:11", "remaining_time": "2:49:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1520, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.958928677033465e-06, "epoch": 0.152, "percentage": 15.2, "elapsed_time": "0:30:22", "remaining_time": "2:49:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1530, "total_steps": 10000, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.957338372873886e-06, "epoch": 0.153, "percentage": 15.3, "elapsed_time": "0:30:33", "remaining_time": "2:49:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1540, "total_steps": 10000, "loss": 1.0402, "accuracy": 0.8999999761581421, "learning_rate": 4.9557181268217225e-06, "epoch": 0.154, "percentage": 15.4, "elapsed_time": "0:30:44", "remaining_time": "2:48:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1550, "total_steps": 10000, "loss": 0.0013, "accuracy": 1.0, "learning_rate": 4.9540679586191605e-06, "epoch": 0.155, "percentage": 15.5, "elapsed_time": "0:30:56", "remaining_time": "2:48:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1560, "total_steps": 10000, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 4.9523878883729794e-06, "epoch": 0.156, "percentage": 15.6, "elapsed_time": "0:31:26", "remaining_time": "2:50:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1570, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.9506779365543054e-06, "epoch": 0.157, "percentage": 15.7, "elapsed_time": "0:31:38", "remaining_time": "2:49:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1580, "total_steps": 10000, "loss": 0.0242, "accuracy": 1.0, "learning_rate": 4.94893812399836e-06, "epoch": 0.158, "percentage": 15.8, "elapsed_time": "0:31:54", "remaining_time": "2:50:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1590, "total_steps": 10000, "loss": 0.0445, "accuracy": 1.0, "learning_rate": 4.947168471904213e-06, "epoch": 0.159, "percentage": 15.9, "elapsed_time": "0:32:11", "remaining_time": "2:50:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1600, "total_steps": 10000, "loss": 0.0661, "accuracy": 1.0, "learning_rate": 4.9453690018345144e-06, "epoch": 0.16, "percentage": 16.0, "elapsed_time": "0:32:46", "remaining_time": "2:52:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1610, "total_steps": 10000, "loss": 0.0506, "accuracy": 1.0, "learning_rate": 4.9435397357152406e-06, "epoch": 0.161, "percentage": 16.1, "elapsed_time": "0:33:19", "remaining_time": "2:53:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1620, "total_steps": 10000, "loss": 0.002, "accuracy": 1.0, "learning_rate": 4.9416806958354206e-06, "epoch": 0.162, "percentage": 16.2, "elapsed_time": "0:33:32", "remaining_time": "2:53:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1630, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.939791904846869e-06, "epoch": 0.163, "percentage": 16.3, "elapsed_time": "0:33:44", "remaining_time": "2:53:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1640, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.937873385763909e-06, "epoch": 0.164, "percentage": 16.4, "elapsed_time": "0:34:00", "remaining_time": "2:53:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1650, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.935925161963089e-06, "epoch": 0.165, "percentage": 16.5, "elapsed_time": "0:34:12", "remaining_time": "2:53:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1660, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.933947257182901e-06, "epoch": 0.166, "percentage": 16.6, "elapsed_time": "0:34:27", "remaining_time": "2:53:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1670, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.9319396955234925e-06, "epoch": 0.167, "percentage": 16.7, "elapsed_time": "0:34:46", "remaining_time": "2:53:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1680, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.9299025014463665e-06, "epoch": 0.168, "percentage": 16.8, "elapsed_time": "0:35:01", "remaining_time": "2:53:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1690, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.92783569977409e-06, "epoch": 0.169, "percentage": 16.9, "elapsed_time": "0:35:14", "remaining_time": "2:53:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1700, "total_steps": 10000, "loss": 0.1435, "accuracy": 0.8999999761581421, "learning_rate": 4.925739315689991e-06, "epoch": 0.17, "percentage": 17.0, "elapsed_time": "0:35:31", "remaining_time": "2:53:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1710, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.923613374737848e-06, "epoch": 0.171, "percentage": 17.1, "elapsed_time": "0:35:48", "remaining_time": "2:53:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1720, "total_steps": 10000, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 4.921457902821578e-06, "epoch": 0.172, "percentage": 17.2, "elapsed_time": "0:36:03", "remaining_time": "2:53:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1730, "total_steps": 10000, "loss": 0.0007, "accuracy": 1.0, "learning_rate": 4.9192729262049285e-06, "epoch": 0.173, "percentage": 17.3, "elapsed_time": "0:36:16", "remaining_time": "2:53:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1740, "total_steps": 10000, "loss": 0.006, "accuracy": 1.0, "learning_rate": 4.917058471511149e-06, "epoch": 0.174, "percentage": 17.4, "elapsed_time": "0:36:34", "remaining_time": "2:53:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1750, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.914814565722671e-06, "epoch": 0.175, "percentage": 17.5, "elapsed_time": "0:36:48", "remaining_time": "2:53:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1760, "total_steps": 10000, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 4.912541236180779e-06, "epoch": 0.176, "percentage": 17.6, "elapsed_time": "0:37:03", "remaining_time": "2:53:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1770, "total_steps": 10000, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.910238510585275e-06, "epoch": 0.177, "percentage": 17.7, "elapsed_time": "0:37:17", "remaining_time": "2:53:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1780, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.907906416994146e-06, "epoch": 0.178, "percentage": 17.8, "elapsed_time": "0:37:29", "remaining_time": "2:53:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1790, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.905544983823214e-06, "epoch": 0.179, "percentage": 17.9, "elapsed_time": "0:37:44", "remaining_time": "2:53:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1800, "total_steps": 10000, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 4.903154239845798e-06, "epoch": 0.18, "percentage": 18.0, "elapsed_time": "0:38:00", "remaining_time": "2:53:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1810, "total_steps": 10000, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.900734214192358e-06, "epoch": 0.181, "percentage": 18.1, "elapsed_time": "0:38:12", "remaining_time": "2:52:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1820, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.898284936350144e-06, "epoch": 0.182, "percentage": 18.2, "elapsed_time": "0:38:28", "remaining_time": "2:52:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1830, "total_steps": 10000, "loss": 0.0126, "accuracy": 1.0, "learning_rate": 4.8958064361628334e-06, "epoch": 0.183, "percentage": 18.3, "elapsed_time": "0:38:42", "remaining_time": "2:52:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1840, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.893298743830168e-06, "epoch": 0.184, "percentage": 18.4, "elapsed_time": "0:38:56", "remaining_time": "2:52:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1850, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.890761889907589e-06, "epoch": 0.185, "percentage": 18.5, "elapsed_time": "0:39:10", "remaining_time": "2:52:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1860, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.888195905305859e-06, "epoch": 0.186, "percentage": 18.6, "elapsed_time": "0:39:23", "remaining_time": "2:52:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1870, "total_steps": 10000, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.885600821290692e-06, "epoch": 0.187, "percentage": 18.7, "elapsed_time": "0:39:36", "remaining_time": "2:52:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1880, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.882976669482368e-06, "epoch": 0.188, "percentage": 18.8, "elapsed_time": "0:39:55", "remaining_time": "2:52:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1890, "total_steps": 10000, "loss": 0.0104, "accuracy": 1.0, "learning_rate": 4.880323481855347e-06, "epoch": 0.189, "percentage": 18.9, "elapsed_time": "0:40:08", "remaining_time": "2:52:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1900, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.8776412907378845e-06, "epoch": 0.19, "percentage": 19.0, "elapsed_time": "0:40:22", "remaining_time": "2:52:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1910, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.874930128811631e-06, "epoch": 0.191, "percentage": 19.1, "elapsed_time": "0:40:38", "remaining_time": "2:52:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1920, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.8721900291112415e-06, "epoch": 0.192, "percentage": 19.2, "elapsed_time": "0:40:51", "remaining_time": "2:51:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1930, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.869421025023965e-06, "epoch": 0.193, "percentage": 19.3, "elapsed_time": "0:41:02", "remaining_time": "2:51:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1940, "total_steps": 10000, "loss": 0.5865, "accuracy": 0.8999999761581421, "learning_rate": 4.866623150289241e-06, "epoch": 0.194, "percentage": 19.4, "elapsed_time": "0:41:14", "remaining_time": "2:51:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1950, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.863796438998293e-06, "epoch": 0.195, "percentage": 19.5, "elapsed_time": "0:41:27", "remaining_time": "2:51:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1960, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.860940925593703e-06, "epoch": 0.196, "percentage": 19.6, "elapsed_time": "0:41:42", "remaining_time": "2:51:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1970, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.858056644869002e-06, "epoch": 0.197, "percentage": 19.7, "elapsed_time": "0:41:57", "remaining_time": "2:51:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1980, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.855143631968242e-06, "epoch": 0.198, "percentage": 19.8, "elapsed_time": "0:42:12", "remaining_time": "2:50:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1990, "total_steps": 10000, "loss": 0.0053, "accuracy": 1.0, "learning_rate": 4.852201922385564e-06, "epoch": 0.199, "percentage": 19.9, "elapsed_time": "0:42:27", "remaining_time": "2:50:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2000, "total_steps": 10000, "loss": 0.0872, "accuracy": 0.8999999761581421, "learning_rate": 4.849231551964771e-06, "epoch": 0.2, "percentage": 20.0, "elapsed_time": "0:42:39", "remaining_time": "2:50:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2010, "total_steps": 10000, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 4.84623255689889e-06, "epoch": 0.201, "percentage": 20.1, "elapsed_time": "0:42:58", "remaining_time": "2:50:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2020, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.84320497372973e-06, "epoch": 0.202, "percentage": 20.2, "elapsed_time": "0:43:13", "remaining_time": "2:50:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2030, "total_steps": 10000, "loss": 0.0011, "accuracy": 1.0, "learning_rate": 4.840148839347434e-06, "epoch": 0.203, "percentage": 20.3, "elapsed_time": "0:43:26", "remaining_time": "2:50:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2040, "total_steps": 10000, "loss": 0.1777, "accuracy": 0.8999999761581421, "learning_rate": 4.837064190990036e-06, "epoch": 0.204, "percentage": 20.4, "elapsed_time": "0:43:42", "remaining_time": "2:50:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2050, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.833951066243004e-06, "epoch": 0.205, "percentage": 20.5, "elapsed_time": "0:43:55", "remaining_time": "2:50:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2060, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.830809503038781e-06, "epoch": 0.206, "percentage": 20.6, "elapsed_time": "0:44:08", "remaining_time": "2:50:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2070, "total_steps": 10000, "loss": 0.0424, "accuracy": 1.0, "learning_rate": 4.8276395396563215e-06, "epoch": 0.207, "percentage": 20.7, "elapsed_time": "0:44:22", "remaining_time": "2:50:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2080, "total_steps": 10000, "loss": 0.0042, "accuracy": 1.0, "learning_rate": 4.824441214720629e-06, "epoch": 0.208, "percentage": 20.8, "elapsed_time": "0:44:38", "remaining_time": "2:49:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2090, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.821214567202284e-06, "epoch": 0.209, "percentage": 20.9, "elapsed_time": "0:44:52", "remaining_time": "2:49:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2100, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.817959636416969e-06, "epoch": 0.21, "percentage": 21.0, "elapsed_time": "0:45:13", "remaining_time": "2:50:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2110, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.814676462024988e-06, "epoch": 0.211, "percentage": 21.1, "elapsed_time": "0:45:28", "remaining_time": "2:50:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2120, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.811365084030784e-06, "epoch": 0.212, "percentage": 21.2, "elapsed_time": "0:45:42", "remaining_time": "2:49:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2130, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.808025542782453e-06, "epoch": 0.213, "percentage": 21.3, "elapsed_time": "0:45:55", "remaining_time": "2:49:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2140, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.804657878971252e-06, "epoch": 0.214, "percentage": 21.4, "elapsed_time": "0:46:14", "remaining_time": "2:49:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2150, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.801262133631101e-06, "epoch": 0.215, "percentage": 21.5, "elapsed_time": "0:46:30", "remaining_time": "2:49:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2160, "total_steps": 10000, "loss": 0.0155, "accuracy": 1.0, "learning_rate": 4.7978383481380865e-06, "epoch": 0.216, "percentage": 21.6, "elapsed_time": "0:46:42", "remaining_time": "2:49:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2170, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.794386564209953e-06, "epoch": 0.217, "percentage": 21.7, "elapsed_time": "0:47:31", "remaining_time": "2:51:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2180, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.790906823905599e-06, "epoch": 0.218, "percentage": 21.8, "elapsed_time": "0:47:48", "remaining_time": "2:51:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2190, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.787399169624562e-06, "epoch": 0.219, "percentage": 21.9, "elapsed_time": "0:48:08", "remaining_time": "2:51:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2200, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.783863644106502e-06, "epoch": 0.22, "percentage": 22.0, "elapsed_time": "0:48:27", "remaining_time": "2:51:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2210, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.780300290430683e-06, "epoch": 0.221, "percentage": 22.1, "elapsed_time": "0:48:44", "remaining_time": "2:51:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2220, "total_steps": 10000, "loss": 0.0014, "accuracy": 1.0, "learning_rate": 4.776709152015443e-06, "epoch": 0.222, "percentage": 22.2, "elapsed_time": "0:48:58", "remaining_time": "2:51:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2230, "total_steps": 10000, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.773090272617672e-06, "epoch": 0.223, "percentage": 22.3, "elapsed_time": "0:49:11", "remaining_time": "2:51:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2240, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.769443696332272e-06, "epoch": 0.224, "percentage": 22.4, "elapsed_time": "0:49:28", "remaining_time": "2:51:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2250, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.765769467591626e-06, "epoch": 0.225, "percentage": 22.5, "elapsed_time": "0:49:40", "remaining_time": "2:51:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2260, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.762067631165049e-06, "epoch": 0.226, "percentage": 22.6, "elapsed_time": "0:49:54", "remaining_time": "2:50:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2270, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.7583382321582525e-06, "epoch": 0.227, "percentage": 22.7, "elapsed_time": "0:50:10", "remaining_time": "2:50:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2280, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.754581316012785e-06, "epoch": 0.228, "percentage": 22.8, "elapsed_time": "0:50:28", "remaining_time": "2:50:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2290, "total_steps": 10000, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.750796928505484e-06, "epoch": 0.229, "percentage": 22.9, "elapsed_time": "0:50:49", "remaining_time": "2:51:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2300, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.746985115747918e-06, "epoch": 0.23, "percentage": 23.0, "elapsed_time": "0:51:04", "remaining_time": "2:50:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2310, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.743145924185821e-06, "epoch": 0.231, "percentage": 23.1, "elapsed_time": "0:51:17", "remaining_time": "2:50:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2320, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.7392794005985324e-06, "epoch": 0.232, "percentage": 23.2, "elapsed_time": "0:51:29", "remaining_time": "2:50:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2330, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.735385592098421e-06, "epoch": 0.233, "percentage": 23.3, "elapsed_time": "0:51:45", "remaining_time": "2:50:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2340, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.731464546130315e-06, "epoch": 0.234, "percentage": 23.4, "elapsed_time": "0:51:59", "remaining_time": "2:50:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2350, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.72751631047092e-06, "epoch": 0.235, "percentage": 23.5, "elapsed_time": "0:52:12", "remaining_time": "2:49:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2360, "total_steps": 10000, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 4.723540933228245e-06, "epoch": 0.236, "percentage": 23.6, "elapsed_time": "0:52:28", "remaining_time": "2:49:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2370, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.719538462841003e-06, "epoch": 0.237, "percentage": 23.7, "elapsed_time": "0:52:42", "remaining_time": "2:49:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2380, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.715508948078037e-06, "epoch": 0.238, "percentage": 23.8, "elapsed_time": "0:52:58", "remaining_time": "2:49:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2390, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.71145243803771e-06, "epoch": 0.239, "percentage": 23.9, "elapsed_time": "0:53:11", "remaining_time": "2:49:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2400, "total_steps": 10000, "loss": 0.0221, "accuracy": 1.0, "learning_rate": 4.707368982147318e-06, "epoch": 0.24, "percentage": 24.0, "elapsed_time": "0:53:22", "remaining_time": "2:49:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2410, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.703258630162481e-06, "epoch": 0.241, "percentage": 24.1, "elapsed_time": "0:53:39", "remaining_time": "2:49:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2420, "total_steps": 10000, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.699121432166541e-06, "epoch": 0.242, "percentage": 24.2, "elapsed_time": "0:54:37", "remaining_time": "2:51:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2430, "total_steps": 10000, "loss": 0.0057, "accuracy": 1.0, "learning_rate": 4.6949574385699514e-06, "epoch": 0.243, "percentage": 24.3, "elapsed_time": "0:54:49", "remaining_time": "2:50:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2440, "total_steps": 10000, "loss": 0.3753, "accuracy": 0.8999999761581421, "learning_rate": 4.690766700109659e-06, "epoch": 0.244, "percentage": 24.4, "elapsed_time": "0:55:00", "remaining_time": "2:50:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2450, "total_steps": 10000, "loss": 0.0374, "accuracy": 1.0, "learning_rate": 4.68654926784849e-06, "epoch": 0.245, "percentage": 24.5, "elapsed_time": "0:55:38", "remaining_time": "2:51:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2460, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.682305193174524e-06, "epoch": 0.246, "percentage": 24.6, "elapsed_time": "0:55:50", "remaining_time": "2:51:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2470, "total_steps": 10000, "loss": 0.1193, "accuracy": 0.8999999761581421, "learning_rate": 4.6780345278004744e-06, "epoch": 0.247, "percentage": 24.7, "elapsed_time": "0:56:06", "remaining_time": "2:51:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2480, "total_steps": 10000, "loss": 0.4578, "accuracy": 0.8999999761581421, "learning_rate": 4.673737323763048e-06, "epoch": 0.248, "percentage": 24.8, "elapsed_time": "0:56:21", "remaining_time": "2:50:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2490, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.669413633422322e-06, "epoch": 0.249, "percentage": 24.9, "elapsed_time": "0:56:34", "remaining_time": "2:50:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2500, "total_steps": 10000, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.665063509461098e-06, "epoch": 0.25, "percentage": 25.0, "elapsed_time": "0:56:47", "remaining_time": "2:50:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2510, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.6606870048842626e-06, "epoch": 0.251, "percentage": 25.1, "elapsed_time": "0:57:01", "remaining_time": "2:50:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2520, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.656284173018144e-06, "epoch": 0.252, "percentage": 25.2, "elapsed_time": "0:57:15", "remaining_time": "2:49:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2530, "total_steps": 10000, "loss": 0.3552, "accuracy": 0.8999999761581421, "learning_rate": 4.65185506750986e-06, "epoch": 0.253, "percentage": 25.3, "elapsed_time": "0:57:33", "remaining_time": "2:49:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2540, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.6473997423266615e-06, "epoch": 0.254, "percentage": 25.4, "elapsed_time": "0:57:47", "remaining_time": "2:49:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2550, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.642918251755281e-06, "epoch": 0.255, "percentage": 25.5, "elapsed_time": "0:58:00", "remaining_time": "2:49:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2560, "total_steps": 10000, "loss": 0.01, "accuracy": 1.0, "learning_rate": 4.638410650401267e-06, "epoch": 0.256, "percentage": 25.6, "elapsed_time": "0:58:12", "remaining_time": "2:49:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2570, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.633876993188319e-06, "epoch": 0.257, "percentage": 25.7, "elapsed_time": "0:58:26", "remaining_time": "2:48:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2580, "total_steps": 10000, "loss": 0.0014, "accuracy": 1.0, "learning_rate": 4.62931733535762e-06, "epoch": 0.258, "percentage": 25.8, "elapsed_time": "0:58:38", "remaining_time": "2:48:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2590, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.62473173246716e-06, "epoch": 0.259, "percentage": 25.9, "elapsed_time": "0:58:55", "remaining_time": "2:48:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2600, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.620120240391065e-06, "epoch": 0.26, "percentage": 26.0, "elapsed_time": "0:59:11", "remaining_time": "2:48:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2610, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.6154829153189105e-06, "epoch": 0.261, "percentage": 26.1, "elapsed_time": "0:59:26", "remaining_time": "2:48:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2620, "total_steps": 10000, "loss": 0.5346, "accuracy": 0.8999999761581421, "learning_rate": 4.610819813755038e-06, "epoch": 0.262, "percentage": 26.2, "elapsed_time": "0:59:42", "remaining_time": "2:48:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2630, "total_steps": 10000, "loss": 0.0028, "accuracy": 1.0, "learning_rate": 4.60613099251787e-06, "epoch": 0.263, "percentage": 26.3, "elapsed_time": "0:59:57", "remaining_time": "2:48:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2640, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.601416508739211e-06, "epoch": 0.264, "percentage": 26.4, "elapsed_time": "1:00:10", "remaining_time": "2:47:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2650, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.596676419863561e-06, "epoch": 0.265, "percentage": 26.5, "elapsed_time": "1:00:27", "remaining_time": "2:47:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2660, "total_steps": 10000, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 4.591910783647405e-06, "epoch": 0.266, "percentage": 26.6, "elapsed_time": "1:00:41", "remaining_time": "2:47:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2670, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.587119658158517e-06, "epoch": 0.267, "percentage": 26.7, "elapsed_time": "1:00:51", "remaining_time": "2:47:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2680, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.582303101775249e-06, "epoch": 0.268, "percentage": 26.8, "elapsed_time": "1:01:09", "remaining_time": "2:47:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2690, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.577461173185821e-06, "epoch": 0.269, "percentage": 26.9, "elapsed_time": "1:01:23", "remaining_time": "2:46:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2700, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.572593931387604e-06, "epoch": 0.27, "percentage": 27.0, "elapsed_time": "1:01:38", "remaining_time": "2:46:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2710, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.567701435686405e-06, "epoch": 0.271, "percentage": 27.1, "elapsed_time": "1:01:49", "remaining_time": "2:46:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2720, "total_steps": 10000, "loss": 1.5142, "accuracy": 0.8999999761581421, "learning_rate": 4.562783745695738e-06, "epoch": 0.272, "percentage": 27.2, "elapsed_time": "1:02:08", "remaining_time": "2:46:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2730, "total_steps": 10000, "loss": 1.4694, "accuracy": 0.8999999761581421, "learning_rate": 4.5578409213361055e-06, "epoch": 0.273, "percentage": 27.3, "elapsed_time": "1:02:23", "remaining_time": "2:46:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2740, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.55287302283426e-06, "epoch": 0.274, "percentage": 27.4, "elapsed_time": "1:02:36", "remaining_time": "2:45:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2750, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.54788011072248e-06, "epoch": 0.275, "percentage": 27.5, "elapsed_time": "1:02:54", "remaining_time": "2:45:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2760, "total_steps": 10000, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 4.542862245837821e-06, "epoch": 0.276, "percentage": 27.6, "elapsed_time": "1:03:08", "remaining_time": "2:45:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2770, "total_steps": 10000, "loss": 0.0937, "accuracy": 0.8999999761581421, "learning_rate": 4.537819489321385e-06, "epoch": 0.277, "percentage": 27.7, "elapsed_time": "1:03:21", "remaining_time": "2:45:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2780, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.5327519026175694e-06, "epoch": 0.278, "percentage": 27.8, "elapsed_time": "1:03:40", "remaining_time": "2:45:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2790, "total_steps": 10000, "loss": 0.0015, "accuracy": 1.0, "learning_rate": 4.527659547473317e-06, "epoch": 0.279, "percentage": 27.9, "elapsed_time": "1:03:53", "remaining_time": "2:45:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2800, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.522542485937369e-06, "epoch": 0.28, "percentage": 28.0, "elapsed_time": "1:04:34", "remaining_time": "2:46:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2810, "total_steps": 10000, "loss": 0.2074, "accuracy": 0.8999999761581421, "learning_rate": 4.517400780359505e-06, "epoch": 0.281, "percentage": 28.1, "elapsed_time": "1:04:52", "remaining_time": "2:45:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2820, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.512234493389785e-06, "epoch": 0.282, "percentage": 28.2, "elapsed_time": "1:05:09", "remaining_time": "2:45:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2830, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.507043687977787e-06, "epoch": 0.283, "percentage": 28.3, "elapsed_time": "1:05:23", "remaining_time": "2:45:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2840, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.501828427371834e-06, "epoch": 0.284, "percentage": 28.4, "elapsed_time": "1:05:39", "remaining_time": "2:45:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2850, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.496588775118232e-06, "epoch": 0.285, "percentage": 28.5, "elapsed_time": "1:05:53", "remaining_time": "2:45:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2860, "total_steps": 10000, "loss": 0.0071, "accuracy": 1.0, "learning_rate": 4.491324795060491e-06, "epoch": 0.286, "percentage": 28.6, "elapsed_time": "1:06:08", "remaining_time": "2:45:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2870, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.4860365513385456e-06, "epoch": 0.287, "percentage": 28.7, "elapsed_time": "1:06:24", "remaining_time": "2:44:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2880, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.4807241083879774e-06, "epoch": 0.288, "percentage": 28.8, "elapsed_time": "1:06:41", "remaining_time": "2:44:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2890, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.475387530939226e-06, "epoch": 0.289, "percentage": 28.9, "elapsed_time": "1:06:56", "remaining_time": "2:44:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2900, "total_steps": 10000, "loss": 0.0011, "accuracy": 1.0, "learning_rate": 4.470026884016805e-06, "epoch": 0.29, "percentage": 29.0, "elapsed_time": "1:07:07", "remaining_time": "2:44:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2910, "total_steps": 10000, "loss": 0.0013, "accuracy": 1.0, "learning_rate": 4.464642232938505e-06, "epoch": 0.291, "percentage": 29.1, "elapsed_time": "1:07:22", "remaining_time": "2:44:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2920, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.4592336433146e-06, "epoch": 0.292, "percentage": 29.2, "elapsed_time": "1:07:37", "remaining_time": "2:43:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2930, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.453801181047047e-06, "epoch": 0.293, "percentage": 29.3, "elapsed_time": "1:08:48", "remaining_time": "2:46:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2940, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.448344912328686e-06, "epoch": 0.294, "percentage": 29.4, "elapsed_time": "1:09:07", "remaining_time": "2:46:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2950, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.442864903642428e-06, "epoch": 0.295, "percentage": 29.5, "elapsed_time": "1:09:19", "remaining_time": "2:45:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2960, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.437361221760449e-06, "epoch": 0.296, "percentage": 29.6, "elapsed_time": "1:09:35", "remaining_time": "2:45:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2970, "total_steps": 10000, "loss": 0.0014, "accuracy": 1.0, "learning_rate": 4.431833933743378e-06, "epoch": 0.297, "percentage": 29.7, "elapsed_time": "1:09:52", "remaining_time": "2:45:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2980, "total_steps": 10000, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.426283106939474e-06, "epoch": 0.298, "percentage": 29.8, "elapsed_time": "1:10:06", "remaining_time": "2:45:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2990, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.420708808983809e-06, "epoch": 0.299, "percentage": 29.9, "elapsed_time": "1:10:24", "remaining_time": "2:45:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3000, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.415111107797445e-06, "epoch": 0.3, "percentage": 30.0, "elapsed_time": "1:10:41", "remaining_time": "2:44:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3010, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.409490071586606e-06, "epoch": 0.301, "percentage": 30.1, "elapsed_time": "1:11:00", "remaining_time": "2:44:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3020, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.403845768841842e-06, "epoch": 0.302, "percentage": 30.2, "elapsed_time": "1:11:13", "remaining_time": "2:44:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3030, "total_steps": 10000, "loss": 0.0216, "accuracy": 1.0, "learning_rate": 4.398178268337203e-06, "epoch": 0.303, "percentage": 30.3, "elapsed_time": "1:11:33", "remaining_time": "2:44:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3040, "total_steps": 10000, "loss": 0.646, "accuracy": 0.8999999761581421, "learning_rate": 4.3924876391293915e-06, "epoch": 0.304, "percentage": 30.4, "elapsed_time": "1:11:47", "remaining_time": "2:44:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3050, "total_steps": 10000, "loss": 0.0012, "accuracy": 1.0, "learning_rate": 4.386773950556931e-06, "epoch": 0.305, "percentage": 30.5, "elapsed_time": "1:12:04", "remaining_time": "2:44:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3060, "total_steps": 10000, "loss": 0.0011, "accuracy": 1.0, "learning_rate": 4.381037272239311e-06, "epoch": 0.306, "percentage": 30.6, "elapsed_time": "1:12:24", "remaining_time": "2:44:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3070, "total_steps": 10000, "loss": 0.0351, "accuracy": 1.0, "learning_rate": 4.3752776740761495e-06, "epoch": 0.307, "percentage": 30.7, "elapsed_time": "1:12:36", "remaining_time": "2:43:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3080, "total_steps": 10000, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.36949522624633e-06, "epoch": 0.308, "percentage": 30.8, "elapsed_time": "1:12:51", "remaining_time": "2:43:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3090, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.3636899992071555e-06, "epoch": 0.309, "percentage": 30.9, "elapsed_time": "1:13:05", "remaining_time": "2:43:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3100, "total_steps": 10000, "loss": 0.1594, "accuracy": 0.8999999761581421, "learning_rate": 4.357862063693486e-06, "epoch": 0.31, "percentage": 31.0, "elapsed_time": "1:13:25", "remaining_time": "2:43:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3110, "total_steps": 10000, "loss": 0.0017, "accuracy": 1.0, "learning_rate": 4.352011490716875e-06, "epoch": 0.311, "percentage": 31.1, "elapsed_time": "1:13:39", "remaining_time": "2:43:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3120, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.346138351564711e-06, "epoch": 0.312, "percentage": 31.2, "elapsed_time": "1:13:53", "remaining_time": "2:42:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3130, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.340242717799337e-06, "epoch": 0.313, "percentage": 31.3, "elapsed_time": "1:14:05", "remaining_time": "2:42:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3140, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.334324661257191e-06, "epoch": 0.314, "percentage": 31.4, "elapsed_time": "1:14:21", "remaining_time": "2:42:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3150, "total_steps": 10000, "loss": 1.1448, "accuracy": 0.800000011920929, "learning_rate": 4.328384254047927e-06, "epoch": 0.315, "percentage": 31.5, "elapsed_time": "1:14:36", "remaining_time": "2:42:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3160, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.322421568553529e-06, "epoch": 0.316, "percentage": 31.6, "elapsed_time": "1:14:53", "remaining_time": "2:42:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3170, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.316436677427441e-06, "epoch": 0.317, "percentage": 31.7, "elapsed_time": "1:15:48", "remaining_time": "2:43:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3180, "total_steps": 10000, "loss": 0.09, "accuracy": 0.8999999761581421, "learning_rate": 4.3104296535936695e-06, "epoch": 0.318, "percentage": 31.8, "elapsed_time": "1:16:01", "remaining_time": "2:43:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3190, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.3044005702459055e-06, "epoch": 0.319, "percentage": 31.9, "elapsed_time": "1:16:17", "remaining_time": "2:42:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3200, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.2983495008466285e-06, "epoch": 0.32, "percentage": 32.0, "elapsed_time": "1:16:30", "remaining_time": "2:42:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3210, "total_steps": 10000, "loss": 0.0095, "accuracy": 1.0, "learning_rate": 4.2922765191262075e-06, "epoch": 0.321, "percentage": 32.1, "elapsed_time": "1:16:43", "remaining_time": "2:42:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3220, "total_steps": 10000, "loss": 0.0006, "accuracy": 1.0, "learning_rate": 4.286181699082008e-06, "epoch": 0.322, "percentage": 32.2, "elapsed_time": "1:17:00", "remaining_time": "2:42:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3230, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.280065114977492e-06, "epoch": 0.323, "percentage": 32.3, "elapsed_time": "1:17:16", "remaining_time": "2:41:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3240, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.273926841341303e-06, "epoch": 0.324, "percentage": 32.4, "elapsed_time": "1:17:29", "remaining_time": "2:41:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3250, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.267766952966369e-06, "epoch": 0.325, "percentage": 32.5, "elapsed_time": "1:17:47", "remaining_time": "2:41:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3260, "total_steps": 10000, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.261585524908987e-06, "epoch": 0.326, "percentage": 32.6, "elapsed_time": "1:18:02", "remaining_time": "2:41:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3270, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.255382632487907e-06, "epoch": 0.327, "percentage": 32.7, "elapsed_time": "1:18:17", "remaining_time": "2:41:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3280, "total_steps": 10000, "loss": 0.0993, "accuracy": 0.8999999761581421, "learning_rate": 4.249158351283414e-06, "epoch": 0.328, "percentage": 32.8, "elapsed_time": "1:18:32", "remaining_time": "2:40:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3290, "total_steps": 10000, "loss": 1.0371, "accuracy": 0.8999999761581421, "learning_rate": 4.242912757136412e-06, "epoch": 0.329, "percentage": 32.9, "elapsed_time": "1:18:45", "remaining_time": "2:40:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3300, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.236645926147493e-06, "epoch": 0.33, "percentage": 33.0, "elapsed_time": "1:18:59", "remaining_time": "2:40:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3310, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.230357934676017e-06, "epoch": 0.331, "percentage": 33.1, "elapsed_time": "1:19:15", "remaining_time": "2:40:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3320, "total_steps": 10000, "loss": 0.0936, "accuracy": 0.8999999761581421, "learning_rate": 4.224048859339175e-06, "epoch": 0.332, "percentage": 33.2, "elapsed_time": "1:19:32", "remaining_time": "2:40:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3330, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.217718777011058e-06, "epoch": 0.333, "percentage": 33.3, "elapsed_time": "1:19:44", "remaining_time": "2:39:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3340, "total_steps": 10000, "loss": 0.8769, "accuracy": 0.8999999761581421, "learning_rate": 4.211367764821722e-06, "epoch": 0.334, "percentage": 33.4, "elapsed_time": "1:19:57", "remaining_time": "2:39:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3350, "total_steps": 10000, "loss": 0.031, "accuracy": 1.0, "learning_rate": 4.204995900156247e-06, "epoch": 0.335, "percentage": 33.5, "elapsed_time": "1:20:16", "remaining_time": "2:39:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3360, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.198603260653792e-06, "epoch": 0.336, "percentage": 33.6, "elapsed_time": "1:20:31", "remaining_time": "2:39:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3370, "total_steps": 10000, "loss": 0.0007, "accuracy": 1.0, "learning_rate": 4.192189924206652e-06, "epoch": 0.337, "percentage": 33.7, "elapsed_time": "1:20:48", "remaining_time": "2:38:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3380, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.185755968959308e-06, "epoch": 0.338, "percentage": 33.8, "elapsed_time": "1:21:13", "remaining_time": "2:39:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3390, "total_steps": 10000, "loss": 0.0581, "accuracy": 1.0, "learning_rate": 4.179301473307476e-06, "epoch": 0.339, "percentage": 33.9, "elapsed_time": "1:21:27", "remaining_time": "2:38:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3400, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.172826515897146e-06, "epoch": 0.34, "percentage": 34.0, "elapsed_time": "1:21:42", "remaining_time": "2:38:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3410, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.166331175623631e-06, "epoch": 0.341, "percentage": 34.1, "elapsed_time": "1:21:57", "remaining_time": "2:38:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3420, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.159815531630604e-06, "epoch": 0.342, "percentage": 34.2, "elapsed_time": "1:22:15", "remaining_time": "2:38:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3430, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.15327966330913e-06, "epoch": 0.343, "percentage": 34.3, "elapsed_time": "1:22:32", "remaining_time": "2:38:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3440, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.146723650296701e-06, "epoch": 0.344, "percentage": 34.4, "elapsed_time": "1:22:46", "remaining_time": "2:37:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3450, "total_steps": 10000, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 4.140147572476269e-06, "epoch": 0.345, "percentage": 34.5, "elapsed_time": "1:23:03", "remaining_time": "2:37:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3460, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.133551509975264e-06, "epoch": 0.346, "percentage": 34.6, "elapsed_time": "1:23:20", "remaining_time": "2:37:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3470, "total_steps": 10000, "loss": 1.2362, "accuracy": 0.800000011920929, "learning_rate": 4.126935543164628e-06, "epoch": 0.347, "percentage": 34.7, "elapsed_time": "1:23:40", "remaining_time": "2:37:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3480, "total_steps": 10000, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.120299752657828e-06, "epoch": 0.348, "percentage": 34.8, "elapsed_time": "1:23:58", "remaining_time": "2:37:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3490, "total_steps": 10000, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.113644219309877e-06, "epoch": 0.349, "percentage": 34.9, "elapsed_time": "1:24:13", "remaining_time": "2:37:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3500, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.106969024216348e-06, "epoch": 0.35, "percentage": 35.0, "elapsed_time": "1:24:29", "remaining_time": "2:36:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3510, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.1002742487123896e-06, "epoch": 0.351, "percentage": 35.1, "elapsed_time": "1:24:42", "remaining_time": "2:36:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3520, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.093559974371725e-06, "epoch": 0.352, "percentage": 35.2, "elapsed_time": "1:24:57", "remaining_time": "2:36:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3530, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.086826283005669e-06, "epoch": 0.353, "percentage": 35.3, "elapsed_time": "1:25:10", "remaining_time": "2:36:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3540, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.080073256662128e-06, "epoch": 0.354, "percentage": 35.4, "elapsed_time": "1:25:24", "remaining_time": "2:35:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3550, "total_steps": 10000, "loss": 0.0363, "accuracy": 1.0, "learning_rate": 4.073300977624594e-06, "epoch": 0.355, "percentage": 35.5, "elapsed_time": "1:25:40", "remaining_time": "2:35:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3560, "total_steps": 10000, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.066509528411151e-06, "epoch": 0.356, "percentage": 35.6, "elapsed_time": "1:25:52", "remaining_time": "2:35:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3570, "total_steps": 10000, "loss": 0.1134, "accuracy": 0.8999999761581421, "learning_rate": 4.059698991773466e-06, "epoch": 0.357, "percentage": 35.7, "elapsed_time": "1:26:08", "remaining_time": "2:35:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3580, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.052869450695776e-06, "epoch": 0.358, "percentage": 35.8, "elapsed_time": "1:26:22", "remaining_time": "2:34:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3590, "total_steps": 10000, "loss": 0.015, "accuracy": 1.0, "learning_rate": 4.046020988393886e-06, "epoch": 0.359, "percentage": 35.9, "elapsed_time": "1:26:37", "remaining_time": "2:34:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3600, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.039153688314146e-06, "epoch": 0.36, "percentage": 36.0, "elapsed_time": "1:26:51", "remaining_time": "2:34:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3610, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.032267634132442e-06, "epoch": 0.361, "percentage": 36.1, "elapsed_time": "1:27:05", "remaining_time": "2:34:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3620, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.02536290975317e-06, "epoch": 0.362, "percentage": 36.2, "elapsed_time": "1:27:20", "remaining_time": "2:33:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3630, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.018439599308217e-06, "epoch": 0.363, "percentage": 36.3, "elapsed_time": "1:27:33", "remaining_time": "2:33:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3640, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.011497787155938e-06, "epoch": 0.364, "percentage": 36.4, "elapsed_time": "1:27:46", "remaining_time": "2:33:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3650, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.0045375578801216e-06, "epoch": 0.365, "percentage": 36.5, "elapsed_time": "1:28:01", "remaining_time": "2:33:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3660, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.997558996288965e-06, "epoch": 0.366, "percentage": 36.6, "elapsed_time": "1:28:16", "remaining_time": "2:32:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3670, "total_steps": 10000, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 3.9905621874140396e-06, "epoch": 0.367, "percentage": 36.7, "elapsed_time": "1:28:32", "remaining_time": "2:32:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3680, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.983547216509254e-06, "epoch": 0.368, "percentage": 36.8, "elapsed_time": "1:28:47", "remaining_time": "2:32:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3690, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.976514169049814e-06, "epoch": 0.369, "percentage": 36.9, "elapsed_time": "1:29:01", "remaining_time": "2:32:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3700, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.969463130731183e-06, "epoch": 0.37, "percentage": 37.0, "elapsed_time": "1:29:20", "remaining_time": "2:32:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3710, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.962394187468039e-06, "epoch": 0.371, "percentage": 37.1, "elapsed_time": "1:29:31", "remaining_time": "2:31:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3720, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.955307425393224e-06, "epoch": 0.372, "percentage": 37.2, "elapsed_time": "1:29:48", "remaining_time": "2:31:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3730, "total_steps": 10000, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 3.948202930856697e-06, "epoch": 0.373, "percentage": 37.3, "elapsed_time": "1:30:04", "remaining_time": "2:31:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3740, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.941080790424483e-06, "epoch": 0.374, "percentage": 37.4, "elapsed_time": "1:30:17", "remaining_time": "2:31:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3750, "total_steps": 10000, "loss": 0.0014, "accuracy": 1.0, "learning_rate": 3.933941090877615e-06, "epoch": 0.375, "percentage": 37.5, "elapsed_time": "1:30:29", "remaining_time": "2:30:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3760, "total_steps": 10000, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 3.92678391921108e-06, "epoch": 0.376, "percentage": 37.6, "elapsed_time": "1:30:42", "remaining_time": "2:30:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3770, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.9196093626327535e-06, "epoch": 0.377, "percentage": 37.7, "elapsed_time": "1:30:58", "remaining_time": "2:30:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3780, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.912417508562345e-06, "epoch": 0.378, "percentage": 37.8, "elapsed_time": "1:31:17", "remaining_time": "2:30:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3790, "total_steps": 10000, "loss": 2.9491, "accuracy": 0.8999999761581421, "learning_rate": 3.905208444630326e-06, "epoch": 0.379, "percentage": 37.9, "elapsed_time": "1:31:36", "remaining_time": "2:30:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3800, "total_steps": 10000, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 3.897982258676867e-06, "epoch": 0.38, "percentage": 38.0, "elapsed_time": "1:31:51", "remaining_time": "2:29:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3810, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.890739038750763e-06, "epoch": 0.381, "percentage": 38.1, "elapsed_time": "1:32:06", "remaining_time": "2:29:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3820, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.88347887310836e-06, "epoch": 0.382, "percentage": 38.2, "elapsed_time": "1:32:17", "remaining_time": "2:29:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3830, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.876201850212489e-06, "epoch": 0.383, "percentage": 38.3, "elapsed_time": "1:32:30", "remaining_time": "2:29:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3840, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.868908058731376e-06, "epoch": 0.384, "percentage": 38.4, "elapsed_time": "1:32:45", "remaining_time": "2:28:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3850, "total_steps": 10000, "loss": 0.0007, "accuracy": 1.0, "learning_rate": 3.861597587537568e-06, "epoch": 0.385, "percentage": 38.5, "elapsed_time": "1:33:00", "remaining_time": "2:28:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3860, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.85427052570685e-06, "epoch": 0.386, "percentage": 38.6, "elapsed_time": "1:33:11", "remaining_time": "2:28:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3870, "total_steps": 10000, "loss": 0.0117, "accuracy": 1.0, "learning_rate": 3.846926962517158e-06, "epoch": 0.387, "percentage": 38.7, "elapsed_time": "1:33:30", "remaining_time": "2:28:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3880, "total_steps": 10000, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 3.839566987447492e-06, "epoch": 0.388, "percentage": 38.8, "elapsed_time": "1:33:44", "remaining_time": "2:27:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3890, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.832190690176825e-06, "epoch": 0.389, "percentage": 38.9, "elapsed_time": "1:33:56", "remaining_time": "2:27:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3900, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.824798160583012e-06, "epoch": 0.39, "percentage": 39.0, "elapsed_time": "1:34:15", "remaining_time": "2:27:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3910, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.817389488741694e-06, "epoch": 0.391, "percentage": 39.1, "elapsed_time": "1:34:34", "remaining_time": "2:27:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3920, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.8099647649251984e-06, "epoch": 0.392, "percentage": 39.2, "elapsed_time": "1:34:49", "remaining_time": "2:27:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3930, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.802524079601442e-06, "epoch": 0.393, "percentage": 39.3, "elapsed_time": "1:35:01", "remaining_time": "2:26:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3940, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.795067523432826e-06, "epoch": 0.394, "percentage": 39.4, "elapsed_time": "1:35:31", "remaining_time": "2:26:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3950, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.787595187275136e-06, "epoch": 0.395, "percentage": 39.5, "elapsed_time": "1:35:47", "remaining_time": "2:26:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3960, "total_steps": 10000, "loss": 0.053, "accuracy": 1.0, "learning_rate": 3.780107162176429e-06, "epoch": 0.396, "percentage": 39.6, "elapsed_time": "1:36:05", "remaining_time": "2:26:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3970, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.772603539375929e-06, "epoch": 0.397, "percentage": 39.7, "elapsed_time": "1:36:18", "remaining_time": "2:26:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3980, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.7650844103029093e-06, "epoch": 0.398, "percentage": 39.8, "elapsed_time": "1:36:34", "remaining_time": "2:26:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3990, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.7575498665755884e-06, "epoch": 0.399, "percentage": 39.9, "elapsed_time": "1:36:47", "remaining_time": "2:25:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4000, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.7500000000000005e-06, "epoch": 0.4, "percentage": 40.0, "elapsed_time": "1:37:05", "remaining_time": "2:25:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4010, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.742434902568889e-06, "epoch": 0.401, "percentage": 40.1, "elapsed_time": "1:37:28", "remaining_time": "2:25:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4020, "total_steps": 10000, "loss": 0.1245, "accuracy": 0.8999999761581421, "learning_rate": 3.7348546664605777e-06, "epoch": 0.402, "percentage": 40.2, "elapsed_time": "1:37:43", "remaining_time": "2:25:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4030, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.7272593840378526e-06, "epoch": 0.403, "percentage": 40.3, "elapsed_time": "1:37:56", "remaining_time": "2:25:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4040, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.7196491478468322e-06, "epoch": 0.404, "percentage": 40.4, "elapsed_time": "1:38:14", "remaining_time": "2:24:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4050, "total_steps": 10000, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 3.7120240506158433e-06, "epoch": 0.405, "percentage": 40.5, "elapsed_time": "1:38:27", "remaining_time": "2:24:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4060, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.7043841852542884e-06, "epoch": 0.406, "percentage": 40.6, "elapsed_time": "1:38:41", "remaining_time": "2:24:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4070, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.6967296448515176e-06, "epoch": 0.407, "percentage": 40.7, "elapsed_time": "1:38:59", "remaining_time": "2:24:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4080, "total_steps": 10000, "loss": 0.4617, "accuracy": 0.8999999761581421, "learning_rate": 3.689060522675689e-06, "epoch": 0.408, "percentage": 40.8, "elapsed_time": "1:39:13", "remaining_time": "2:23:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4090, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.6813769121726356e-06, "epoch": 0.409, "percentage": 40.9, "elapsed_time": "1:39:27", "remaining_time": "2:23:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4100, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.6736789069647273e-06, "epoch": 0.41, "percentage": 41.0, "elapsed_time": "1:39:46", "remaining_time": "2:23:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4110, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.6659666008497287e-06, "epoch": 0.411, "percentage": 41.1, "elapsed_time": "1:40:00", "remaining_time": "2:23:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4120, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.658240087799655e-06, "epoch": 0.412, "percentage": 41.2, "elapsed_time": "1:40:13", "remaining_time": "2:23:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4130, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.6504994619596295e-06, "epoch": 0.413, "percentage": 41.3, "elapsed_time": "1:40:31", "remaining_time": "2:22:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4140, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.642744817646736e-06, "epoch": 0.414, "percentage": 41.4, "elapsed_time": "1:41:07", "remaining_time": "2:23:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4150, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.634976249348867e-06, "epoch": 0.415, "percentage": 41.5, "elapsed_time": "1:41:19", "remaining_time": "2:22:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4160, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.627193851723577e-06, "epoch": 0.416, "percentage": 41.6, "elapsed_time": "1:41:30", "remaining_time": "2:22:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4170, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.6193977195969243e-06, "epoch": 0.417, "percentage": 41.7, "elapsed_time": "1:41:44", "remaining_time": "2:22:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4180, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.611587947962319e-06, "epoch": 0.418, "percentage": 41.8, "elapsed_time": "1:42:00", "remaining_time": "2:22:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4190, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.6037646319793635e-06, "epoch": 0.419, "percentage": 41.9, "elapsed_time": "1:42:13", "remaining_time": "2:21:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4200, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.595927866972694e-06, "epoch": 0.42, "percentage": 42.0, "elapsed_time": "1:42:30", "remaining_time": "2:21:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4210, "total_steps": 10000, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 3.5880777484308193e-06, "epoch": 0.421, "percentage": 42.1, "elapsed_time": "1:42:44", "remaining_time": "2:21:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4220, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.5802143720049565e-06, "epoch": 0.422, "percentage": 42.2, "elapsed_time": "1:42:58", "remaining_time": "2:21:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4230, "total_steps": 10000, "loss": 0.292, "accuracy": 0.8999999761581421, "learning_rate": 3.5723378335078653e-06, "epoch": 0.423, "percentage": 42.3, "elapsed_time": "1:43:12", "remaining_time": "2:20:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4240, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.564448228912682e-06, "epoch": 0.424, "percentage": 42.4, "elapsed_time": "1:43:26", "remaining_time": "2:20:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4250, "total_steps": 10000, "loss": 0.2262, "accuracy": 0.8999999761581421, "learning_rate": 3.556545654351749e-06, "epoch": 0.425, "percentage": 42.5, "elapsed_time": "1:43:42", "remaining_time": "2:20:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4260, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.5486302061154433e-06, "epoch": 0.426, "percentage": 42.6, "elapsed_time": "1:43:57", "remaining_time": "2:20:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4270, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.5407019806510035e-06, "epoch": 0.427, "percentage": 42.7, "elapsed_time": "1:44:12", "remaining_time": "2:19:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4280, "total_steps": 10000, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 3.532761074561355e-06, "epoch": 0.428, "percentage": 42.8, "elapsed_time": "1:44:23", "remaining_time": "2:19:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4290, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.524807584603932e-06, "epoch": 0.429, "percentage": 42.9, "elapsed_time": "1:44:35", "remaining_time": "2:19:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4300, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.516841607689501e-06, "epoch": 0.43, "percentage": 43.0, "elapsed_time": "1:44:52", "remaining_time": "2:19:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4310, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.5088632408809757e-06, "epoch": 0.431, "percentage": 43.1, "elapsed_time": "1:45:04", "remaining_time": "2:18:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4320, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.5008725813922383e-06, "epoch": 0.432, "percentage": 43.2, "elapsed_time": "1:45:20", "remaining_time": "2:18:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4330, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.4928697265869516e-06, "epoch": 0.433, "percentage": 43.3, "elapsed_time": "1:45:35", "remaining_time": "2:18:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4340, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.4848547739773782e-06, "epoch": 0.434, "percentage": 43.4, "elapsed_time": "1:45:49", "remaining_time": "2:18:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4350, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.476827821223184e-06, "epoch": 0.435, "percentage": 43.5, "elapsed_time": "1:46:09", "remaining_time": "2:17:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4360, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.4687889661302577e-06, "epoch": 0.436, "percentage": 43.6, "elapsed_time": "1:46:24", "remaining_time": "2:17:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4370, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.460738306649509e-06, "epoch": 0.437, "percentage": 43.7, "elapsed_time": "1:46:57", "remaining_time": "2:17:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4380, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.452675940875686e-06, "epoch": 0.438, "percentage": 43.8, "elapsed_time": "1:47:14", "remaining_time": "2:17:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4390, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.4446019670461684e-06, "epoch": 0.439, "percentage": 43.9, "elapsed_time": "1:47:31", "remaining_time": "2:17:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4400, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.436516483539781e-06, "epoch": 0.44, "percentage": 44.0, "elapsed_time": "1:47:45", "remaining_time": "2:17:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4410, "total_steps": 10000, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 3.4284195888755877e-06, "epoch": 0.441, "percentage": 44.1, "elapsed_time": "1:48:00", "remaining_time": "2:16:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4420, "total_steps": 10000, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 3.4203113817116955e-06, "epoch": 0.442, "percentage": 44.2, "elapsed_time": "1:48:21", "remaining_time": "2:16:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4430, "total_steps": 10000, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 3.412191960844049e-06, "epoch": 0.443, "percentage": 44.3, "elapsed_time": "1:48:33", "remaining_time": "2:16:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4440, "total_steps": 10000, "loss": 0.0023, "accuracy": 1.0, "learning_rate": 3.4040614252052305e-06, "epoch": 0.444, "percentage": 44.4, "elapsed_time": "1:48:49", "remaining_time": "2:16:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4450, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.39591987386325e-06, "epoch": 0.445, "percentage": 44.5, "elapsed_time": "1:49:02", "remaining_time": "2:15:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4460, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.387767406020343e-06, "epoch": 0.446, "percentage": 44.6, "elapsed_time": "1:49:19", "remaining_time": "2:15:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4470, "total_steps": 10000, "loss": 0.1911, "accuracy": 0.8999999761581421, "learning_rate": 3.3796041210117545e-06, "epoch": 0.447, "percentage": 44.7, "elapsed_time": "1:49:32", "remaining_time": "2:15:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4480, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.3714301183045382e-06, "epoch": 0.448, "percentage": 44.8, "elapsed_time": "1:49:44", "remaining_time": "2:15:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4490, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.3632454974963368e-06, "epoch": 0.449, "percentage": 44.9, "elapsed_time": "1:49:59", "remaining_time": "2:14:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4500, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.3550503583141726e-06, "epoch": 0.45, "percentage": 45.0, "elapsed_time": "1:50:10", "remaining_time": "2:14:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4510, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.346844800613229e-06, "epoch": 0.451, "percentage": 45.1, "elapsed_time": "1:50:28", "remaining_time": "2:14:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4520, "total_steps": 10000, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 3.338628924375638e-06, "epoch": 0.452, "percentage": 45.2, "elapsed_time": "1:50:43", "remaining_time": "2:14:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4530, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.3304028297092583e-06, "epoch": 0.453, "percentage": 45.3, "elapsed_time": "1:50:56", "remaining_time": "2:13:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4540, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.3221666168464584e-06, "epoch": 0.454, "percentage": 45.4, "elapsed_time": "1:51:20", "remaining_time": "2:13:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4550, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.313920386142892e-06, "epoch": 0.455, "percentage": 45.5, "elapsed_time": "1:51:34", "remaining_time": "2:13:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4560, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.3056642380762783e-06, "epoch": 0.456, "percentage": 45.6, "elapsed_time": "1:52:20", "remaining_time": "2:14:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4570, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.2973982732451753e-06, "epoch": 0.457, "percentage": 45.7, "elapsed_time": "1:52:35", "remaining_time": "2:13:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4580, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.2891225923677565e-06, "epoch": 0.458, "percentage": 45.8, "elapsed_time": "1:52:53", "remaining_time": "2:13:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4590, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.280837296280582e-06, "epoch": 0.459, "percentage": 45.9, "elapsed_time": "1:53:05", "remaining_time": "2:13:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4600, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.272542485937369e-06, "epoch": 0.46, "percentage": 46.0, "elapsed_time": "1:53:22", "remaining_time": "2:13:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4610, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.2642382624077647e-06, "epoch": 0.461, "percentage": 46.1, "elapsed_time": "1:53:40", "remaining_time": "2:12:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4620, "total_steps": 10000, "loss": 0.1734, "accuracy": 0.8999999761581421, "learning_rate": 3.2559247268761117e-06, "epoch": 0.462, "percentage": 46.2, "elapsed_time": "1:53:53", "remaining_time": "2:12:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4630, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.247601980640217e-06, "epoch": 0.463, "percentage": 46.3, "elapsed_time": "1:54:07", "remaining_time": "2:12:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4640, "total_steps": 10000, "loss": 0.0251, "accuracy": 1.0, "learning_rate": 3.2392701251101172e-06, "epoch": 0.464, "percentage": 46.4, "elapsed_time": "1:54:23", "remaining_time": "2:12:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4650, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.230929261806842e-06, "epoch": 0.465, "percentage": 46.5, "elapsed_time": "1:54:38", "remaining_time": "2:11:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4660, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.222579492361179e-06, "epoch": 0.466, "percentage": 46.6, "elapsed_time": "1:54:56", "remaining_time": "2:11:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4670, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.214220918512434e-06, "epoch": 0.467, "percentage": 46.7, "elapsed_time": "1:55:09", "remaining_time": "2:11:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4680, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.205853642107192e-06, "epoch": 0.468, "percentage": 46.8, "elapsed_time": "1:55:29", "remaining_time": "2:11:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4690, "total_steps": 10000, "loss": 0.0046, "accuracy": 1.0, "learning_rate": 3.1974777650980737e-06, "epoch": 0.469, "percentage": 46.9, "elapsed_time": "1:55:43", "remaining_time": "2:11:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4700, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.189093389542498e-06, "epoch": 0.47, "percentage": 47.0, "elapsed_time": "1:55:56", "remaining_time": "2:10:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4710, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.180700617601436e-06, "epoch": 0.471, "percentage": 47.1, "elapsed_time": "1:56:15", "remaining_time": "2:10:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4720, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.1722995515381644e-06, "epoch": 0.472, "percentage": 47.2, "elapsed_time": "1:56:29", "remaining_time": "2:10:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4730, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.1638902937170224e-06, "epoch": 0.473, "percentage": 47.3, "elapsed_time": "1:56:45", "remaining_time": "2:10:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4740, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.155472946602162e-06, "epoch": 0.474, "percentage": 47.4, "elapsed_time": "1:56:58", "remaining_time": "2:09:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4750, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.147047612756302e-06, "epoch": 0.475, "percentage": 47.5, "elapsed_time": "1:57:08", "remaining_time": "2:09:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4760, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.1386143948394764e-06, "epoch": 0.476, "percentage": 47.6, "elapsed_time": "1:57:23", "remaining_time": "2:09:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4770, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.130173395607785e-06, "epoch": 0.477, "percentage": 47.7, "elapsed_time": "1:57:38", "remaining_time": "2:08:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4780, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.121724717912138e-06, "epoch": 0.478, "percentage": 47.8, "elapsed_time": "1:57:52", "remaining_time": "2:08:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4790, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.1132684646970068e-06, "epoch": 0.479, "percentage": 47.9, "elapsed_time": "1:58:06", "remaining_time": "2:08:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4800, "total_steps": 10000, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 3.1048047389991693e-06, "epoch": 0.48, "percentage": 48.0, "elapsed_time": "1:58:20", "remaining_time": "2:08:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4810, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.0963336439464527e-06, "epoch": 0.481, "percentage": 48.1, "elapsed_time": "1:58:37", "remaining_time": "2:08:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4820, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.087855282756475e-06, "epoch": 0.482, "percentage": 48.2, "elapsed_time": "1:58:52", "remaining_time": "2:07:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4830, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.079369758735393e-06, "epoch": 0.483, "percentage": 48.3, "elapsed_time": "1:59:03", "remaining_time": "2:07:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4840, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.0708771752766397e-06, "epoch": 0.484, "percentage": 48.4, "elapsed_time": "1:59:15", "remaining_time": "2:07:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4850, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.062377635859663e-06, "epoch": 0.485, "percentage": 48.5, "elapsed_time": "1:59:37", "remaining_time": "2:07:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4860, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.053871244048669e-06, "epoch": 0.486, "percentage": 48.6, "elapsed_time": "2:00:02", "remaining_time": "2:06:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4870, "total_steps": 10000, "loss": 0.1168, "accuracy": 0.8999999761581421, "learning_rate": 3.045358103491357e-06, "epoch": 0.487, "percentage": 48.7, "elapsed_time": "2:00:11", "remaining_time": "2:06:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4880, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.0368383179176584e-06, "epoch": 0.488, "percentage": 48.8, "elapsed_time": "2:00:28", "remaining_time": "2:06:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4890, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.0283119911384724e-06, "epoch": 0.489, "percentage": 48.9, "elapsed_time": "2:00:41", "remaining_time": "2:06:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4900, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.019779227044398e-06, "epoch": 0.49, "percentage": 49.0, "elapsed_time": "2:00:53", "remaining_time": "2:05:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4910, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.0112401296044756e-06, "epoch": 0.491, "percentage": 49.1, "elapsed_time": "2:01:42", "remaining_time": "2:06:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4920, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.002694802864912e-06, "epoch": 0.492, "percentage": 49.2, "elapsed_time": "2:01:59", "remaining_time": "2:05:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4930, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.9941433509478157e-06, "epoch": 0.493, "percentage": 49.3, "elapsed_time": "2:02:12", "remaining_time": "2:05:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4940, "total_steps": 10000, "loss": 0.0095, "accuracy": 1.0, "learning_rate": 2.98558587804993e-06, "epoch": 0.494, "percentage": 49.4, "elapsed_time": "2:02:26", "remaining_time": "2:05:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4950, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.9770224884413625e-06, "epoch": 0.495, "percentage": 49.5, "elapsed_time": "2:02:46", "remaining_time": "2:05:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4960, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.9684532864643123e-06, "epoch": 0.496, "percentage": 49.6, "elapsed_time": "2:04:06", "remaining_time": "2:06:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4970, "total_steps": 10000, "loss": 0.0028, "accuracy": 1.0, "learning_rate": 2.9598783765318005e-06, "epoch": 0.497, "percentage": 49.7, "elapsed_time": "2:04:18", "remaining_time": "2:05:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4980, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.9512978631264006e-06, "epoch": 0.498, "percentage": 49.8, "elapsed_time": "2:04:32", "remaining_time": "2:05:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4990, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.942711850798959e-06, "epoch": 0.499, "percentage": 49.9, "elapsed_time": "2:04:43", "remaining_time": "2:05:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5000, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.9341204441673267e-06, "epoch": 0.5, "percentage": 50.0, "elapsed_time": "2:04:54", "remaining_time": "2:04:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5010, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.9255237479150815e-06, "epoch": 0.501, "percentage": 50.1, "elapsed_time": "2:05:11", "remaining_time": "2:04:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5020, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.9169218667902562e-06, "epoch": 0.502, "percentage": 50.2, "elapsed_time": "2:05:25", "remaining_time": "2:04:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5030, "total_steps": 10000, "loss": 0.031, "accuracy": 1.0, "learning_rate": 2.908314905604056e-06, "epoch": 0.503, "percentage": 50.3, "elapsed_time": "2:05:37", "remaining_time": "2:04:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5040, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.8997029692295875e-06, "epoch": 0.504, "percentage": 50.4, "elapsed_time": "2:05:47", "remaining_time": "2:03:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5050, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.8910861626005774e-06, "epoch": 0.505, "percentage": 50.5, "elapsed_time": "2:05:58", "remaining_time": "2:03:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5060, "total_steps": 10000, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 2.8824645907100957e-06, "epoch": 0.506, "percentage": 50.6, "elapsed_time": "2:06:10", "remaining_time": "2:03:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5070, "total_steps": 10000, "loss": 0.3021, "accuracy": 0.8999999761581421, "learning_rate": 2.8738383586092745e-06, "epoch": 0.507, "percentage": 50.7, "elapsed_time": "2:06:24", "remaining_time": "2:02:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5080, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.8652075714060296e-06, "epoch": 0.508, "percentage": 50.8, "elapsed_time": "2:06:36", "remaining_time": "2:02:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5090, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.8565723342637797e-06, "epoch": 0.509, "percentage": 50.9, "elapsed_time": "2:06:48", "remaining_time": "2:02:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5100, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.847932752400164e-06, "epoch": 0.51, "percentage": 51.0, "elapsed_time": "2:07:00", "remaining_time": "2:02:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5110, "total_steps": 10000, "loss": 0.0361, "accuracy": 1.0, "learning_rate": 2.8392889310857615e-06, "epoch": 0.511, "percentage": 51.1, "elapsed_time": "2:07:11", "remaining_time": "2:01:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5120, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.8306409756428067e-06, "epoch": 0.512, "percentage": 51.2, "elapsed_time": "2:07:24", "remaining_time": "2:01:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5130, "total_steps": 10000, "loss": 0.1724, "accuracy": 0.8999999761581421, "learning_rate": 2.8219889914439073e-06, "epoch": 0.513, "percentage": 51.3, "elapsed_time": "2:07:36", "remaining_time": "2:01:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5140, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.813333083910761e-06, "epoch": 0.514, "percentage": 51.4, "elapsed_time": "2:07:50", "remaining_time": "2:00:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5150, "total_steps": 10000, "loss": 0.0017, "accuracy": 1.0, "learning_rate": 2.804673358512869e-06, "epoch": 0.515, "percentage": 51.5, "elapsed_time": "2:08:04", "remaining_time": "2:00:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5160, "total_steps": 10000, "loss": 0.9996, "accuracy": 0.8999999761581421, "learning_rate": 2.7960099207662535e-06, "epoch": 0.516, "percentage": 51.6, "elapsed_time": "2:08:16", "remaining_time": "2:00:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5170, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.7873428762321667e-06, "epoch": 0.517, "percentage": 51.7, "elapsed_time": "2:08:28", "remaining_time": "2:00:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5180, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.778672330515814e-06, "epoch": 0.518, "percentage": 51.8, "elapsed_time": "2:08:40", "remaining_time": "1:59:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5190, "total_steps": 10000, "loss": 0.0039, "accuracy": 1.0, "learning_rate": 2.769998389265057e-06, "epoch": 0.519, "percentage": 51.9, "elapsed_time": "2:08:53", "remaining_time": "1:59:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5200, "total_steps": 10000, "loss": 0.0021, "accuracy": 1.0, "learning_rate": 2.761321158169134e-06, "epoch": 0.52, "percentage": 52.0, "elapsed_time": "2:09:05", "remaining_time": "1:59:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5210, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.752640742957366e-06, "epoch": 0.521, "percentage": 52.1, "elapsed_time": "2:09:19", "remaining_time": "1:58:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5220, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.743957249397874e-06, "epoch": 0.522, "percentage": 52.2, "elapsed_time": "2:09:30", "remaining_time": "1:58:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5230, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.7352707832962865e-06, "epoch": 0.523, "percentage": 52.3, "elapsed_time": "2:09:43", "remaining_time": "1:58:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5240, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.726581450494451e-06, "epoch": 0.524, "percentage": 52.4, "elapsed_time": "2:09:54", "remaining_time": "1:58:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5250, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.717889356869146e-06, "epoch": 0.525, "percentage": 52.5, "elapsed_time": "2:10:07", "remaining_time": "1:57:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5260, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.70919460833079e-06, "epoch": 0.526, "percentage": 52.6, "elapsed_time": "2:10:19", "remaining_time": "1:57:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5270, "total_steps": 10000, "loss": 0.0073, "accuracy": 1.0, "learning_rate": 2.700497310822147e-06, "epoch": 0.527, "percentage": 52.7, "elapsed_time": "2:10:31", "remaining_time": "1:57:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5280, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.6917975703170466e-06, "epoch": 0.528, "percentage": 52.8, "elapsed_time": "2:10:44", "remaining_time": "1:56:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5290, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.6830954928190795e-06, "epoch": 0.529, "percentage": 52.9, "elapsed_time": "2:10:59", "remaining_time": "1:56:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5300, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.6743911843603134e-06, "epoch": 0.53, "percentage": 53.0, "elapsed_time": "2:11:11", "remaining_time": "1:56:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5310, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.6656847510000013e-06, "epoch": 0.531, "percentage": 53.1, "elapsed_time": "2:11:21", "remaining_time": "1:56:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5320, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.6569762988232838e-06, "epoch": 0.532, "percentage": 53.2, "elapsed_time": "2:11:34", "remaining_time": "1:55:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5330, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.6482659339399047e-06, "epoch": 0.533, "percentage": 53.3, "elapsed_time": "2:11:47", "remaining_time": "1:55:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5340, "total_steps": 10000, "loss": 0.2173, "accuracy": 0.8999999761581421, "learning_rate": 2.63955376248291e-06, "epoch": 0.534, "percentage": 53.4, "elapsed_time": "2:11:58", "remaining_time": "1:55:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5350, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.6308398906073603e-06, "epoch": 0.535, "percentage": 53.5, "elapsed_time": "2:12:11", "remaining_time": "1:54:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5360, "total_steps": 10000, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 2.6221244244890336e-06, "epoch": 0.536, "percentage": 53.6, "elapsed_time": "2:12:22", "remaining_time": "1:54:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5370, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.613407470323134e-06, "epoch": 0.537, "percentage": 53.7, "elapsed_time": "2:12:34", "remaining_time": "1:54:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5380, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.604689134322999e-06, "epoch": 0.538, "percentage": 53.8, "elapsed_time": "2:12:51", "remaining_time": "1:54:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5390, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.5959695227188e-06, "epoch": 0.539, "percentage": 53.9, "elapsed_time": "2:13:04", "remaining_time": "1:53:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5400, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.587248741756253e-06, "epoch": 0.54, "percentage": 54.0, "elapsed_time": "2:13:16", "remaining_time": "1:53:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5410, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.578526897695321e-06, "epoch": 0.541, "percentage": 54.1, "elapsed_time": "2:13:27", "remaining_time": "1:53:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5420, "total_steps": 10000, "loss": 0.0091, "accuracy": 1.0, "learning_rate": 2.569804096808923e-06, "epoch": 0.542, "percentage": 54.2, "elapsed_time": "2:13:38", "remaining_time": "1:52:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5430, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.5610804453816333e-06, "epoch": 0.543, "percentage": 54.3, "elapsed_time": "2:13:52", "remaining_time": "1:52:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5440, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.5523560497083927e-06, "epoch": 0.544, "percentage": 54.4, "elapsed_time": "2:14:06", "remaining_time": "1:52:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5450, "total_steps": 10000, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 2.543631016093209e-06, "epoch": 0.545, "percentage": 54.5, "elapsed_time": "2:14:18", "remaining_time": "1:52:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5460, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.5349054508478636e-06, "epoch": 0.546, "percentage": 54.6, "elapsed_time": "2:14:30", "remaining_time": "1:51:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5470, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.526179460290615e-06, "epoch": 0.547, "percentage": 54.7, "elapsed_time": "2:14:40", "remaining_time": "1:51:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5480, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.517453150744904e-06, "epoch": 0.548, "percentage": 54.8, "elapsed_time": "2:14:53", "remaining_time": "1:51:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5490, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.5087266285380597e-06, "epoch": 0.549, "percentage": 54.9, "elapsed_time": "2:15:04", "remaining_time": "1:50:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5500, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.5e-06, "epoch": 0.55, "percentage": 55.0, "elapsed_time": "2:15:17", "remaining_time": "1:50:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5510, "total_steps": 10000, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 2.4912733714619415e-06, "epoch": 0.551, "percentage": 55.1, "elapsed_time": "2:15:30", "remaining_time": "1:50:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5520, "total_steps": 10000, "loss": 0.59, "accuracy": 0.8999999761581421, "learning_rate": 2.482546849255096e-06, "epoch": 0.552, "percentage": 55.2, "elapsed_time": "2:15:44", "remaining_time": "1:50:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5530, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.4738205397093863e-06, "epoch": 0.553, "percentage": 55.3, "elapsed_time": "2:15:55", "remaining_time": "1:49:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5540, "total_steps": 10000, "loss": 0.0025, "accuracy": 1.0, "learning_rate": 2.4650945491521372e-06, "epoch": 0.554, "percentage": 55.4, "elapsed_time": "2:16:09", "remaining_time": "1:49:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5550, "total_steps": 10000, "loss": 0.1537, "accuracy": 0.8999999761581421, "learning_rate": 2.4563689839067913e-06, "epoch": 0.555, "percentage": 55.5, "elapsed_time": "2:16:21", "remaining_time": "1:49:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5560, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.447643950291608e-06, "epoch": 0.556, "percentage": 55.6, "elapsed_time": "2:16:35", "remaining_time": "1:49:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5570, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.4389195546183676e-06, "epoch": 0.557, "percentage": 55.7, "elapsed_time": "2:16:48", "remaining_time": "1:48:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5580, "total_steps": 10000, "loss": 0.0618, "accuracy": 1.0, "learning_rate": 2.4301959031910785e-06, "epoch": 0.558, "percentage": 55.8, "elapsed_time": "2:17:00", "remaining_time": "1:48:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5590, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.4214731023046795e-06, "epoch": 0.559, "percentage": 55.9, "elapsed_time": "2:17:13", "remaining_time": "1:48:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5600, "total_steps": 10000, "loss": 0.0008, "accuracy": 1.0, "learning_rate": 2.4127512582437486e-06, "epoch": 0.56, "percentage": 56.0, "elapsed_time": "2:17:25", "remaining_time": "1:47:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5610, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.4040304772812002e-06, "epoch": 0.561, "percentage": 56.1, "elapsed_time": "2:17:36", "remaining_time": "1:47:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5620, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.3953108656770018e-06, "epoch": 0.562, "percentage": 56.2, "elapsed_time": "2:17:48", "remaining_time": "1:47:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5630, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.3865925296768658e-06, "epoch": 0.563, "percentage": 56.3, "elapsed_time": "2:18:00", "remaining_time": "1:47:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5640, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.377875575510967e-06, "epoch": 0.564, "percentage": 56.4, "elapsed_time": "2:18:12", "remaining_time": "1:46:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5650, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.3691601093926406e-06, "epoch": 0.565, "percentage": 56.5, "elapsed_time": "2:18:23", "remaining_time": "1:46:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5660, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.3604462375170905e-06, "epoch": 0.566, "percentage": 56.6, "elapsed_time": "2:18:36", "remaining_time": "1:46:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5670, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.3517340660600965e-06, "epoch": 0.567, "percentage": 56.7, "elapsed_time": "2:18:47", "remaining_time": "1:45:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5680, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.3430237011767166e-06, "epoch": 0.568, "percentage": 56.8, "elapsed_time": "2:18:59", "remaining_time": "1:45:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5690, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.3343152490000004e-06, "epoch": 0.569, "percentage": 56.9, "elapsed_time": "2:19:11", "remaining_time": "1:45:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5700, "total_steps": 10000, "loss": 0.0887, "accuracy": 0.8999999761581421, "learning_rate": 2.325608815639687e-06, "epoch": 0.57, "percentage": 57.0, "elapsed_time": "2:19:26", "remaining_time": "1:45:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5710, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.3169045071809217e-06, "epoch": 0.571, "percentage": 57.1, "elapsed_time": "2:19:38", "remaining_time": "1:44:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5720, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.3082024296829538e-06, "epoch": 0.572, "percentage": 57.2, "elapsed_time": "2:19:52", "remaining_time": "1:44:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5730, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.2995026891778533e-06, "epoch": 0.573, "percentage": 57.3, "elapsed_time": "2:20:05", "remaining_time": "1:44:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5740, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.290805391669212e-06, "epoch": 0.574, "percentage": 57.4, "elapsed_time": "2:20:17", "remaining_time": "1:44:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5750, "total_steps": 10000, "loss": 0.1444, "accuracy": 0.8999999761581421, "learning_rate": 2.2821106431308546e-06, "epoch": 0.575, "percentage": 57.5, "elapsed_time": "2:20:30", "remaining_time": "1:43:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5760, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.2734185495055503e-06, "epoch": 0.576, "percentage": 57.6, "elapsed_time": "2:20:42", "remaining_time": "1:43:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5770, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.2647292167037143e-06, "epoch": 0.577, "percentage": 57.7, "elapsed_time": "2:20:55", "remaining_time": "1:43:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5780, "total_steps": 10000, "loss": 0.0145, "accuracy": 1.0, "learning_rate": 2.256042750602127e-06, "epoch": 0.578, "percentage": 57.8, "elapsed_time": "2:21:05", "remaining_time": "1:43:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5790, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.2473592570426343e-06, "epoch": 0.579, "percentage": 57.9, "elapsed_time": "2:21:19", "remaining_time": "1:42:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5800, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.238678841830867e-06, "epoch": 0.58, "percentage": 58.0, "elapsed_time": "2:21:31", "remaining_time": "1:42:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5810, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.230001610734943e-06, "epoch": 0.581, "percentage": 58.1, "elapsed_time": "2:21:45", "remaining_time": "1:42:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5820, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.2213276694841866e-06, "epoch": 0.582, "percentage": 58.2, "elapsed_time": "2:21:57", "remaining_time": "1:41:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5830, "total_steps": 10000, "loss": 0.0012, "accuracy": 1.0, "learning_rate": 2.212657123767834e-06, "epoch": 0.583, "percentage": 58.3, "elapsed_time": "2:22:07", "remaining_time": "1:41:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5840, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.2039900792337477e-06, "epoch": 0.584, "percentage": 58.4, "elapsed_time": "2:22:24", "remaining_time": "1:41:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5850, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.195326641487132e-06, "epoch": 0.585, "percentage": 58.5, "elapsed_time": "2:22:37", "remaining_time": "1:41:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5860, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.186666916089239e-06, "epoch": 0.586, "percentage": 58.6, "elapsed_time": "2:22:49", "remaining_time": "1:40:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5870, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.1780110085560935e-06, "epoch": 0.587, "percentage": 58.7, "elapsed_time": "2:23:03", "remaining_time": "1:40:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5880, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.1693590243571937e-06, "epoch": 0.588, "percentage": 58.8, "elapsed_time": "2:23:15", "remaining_time": "1:40:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5890, "total_steps": 10000, "loss": 0.1048, "accuracy": 0.8999999761581421, "learning_rate": 2.1607110689142393e-06, "epoch": 0.589, "percentage": 58.9, "elapsed_time": "2:23:26", "remaining_time": "1:40:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5900, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.1520672475998374e-06, "epoch": 0.59, "percentage": 59.0, "elapsed_time": "2:23:38", "remaining_time": "1:39:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5910, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.143427665736221e-06, "epoch": 0.591, "percentage": 59.1, "elapsed_time": "2:23:50", "remaining_time": "1:39:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5920, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.134792428593971e-06, "epoch": 0.592, "percentage": 59.2, "elapsed_time": "2:24:05", "remaining_time": "1:39:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5930, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.1261616413907267e-06, "epoch": 0.593, "percentage": 59.3, "elapsed_time": "2:24:18", "remaining_time": "1:39:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5940, "total_steps": 10000, "loss": 0.1809, "accuracy": 0.8999999761581421, "learning_rate": 2.117535409289905e-06, "epoch": 0.594, "percentage": 59.4, "elapsed_time": "2:24:29", "remaining_time": "1:38:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5950, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.1089138373994226e-06, "epoch": 0.595, "percentage": 59.5, "elapsed_time": "2:24:43", "remaining_time": "1:38:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5960, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.1002970307704134e-06, "epoch": 0.596, "percentage": 59.6, "elapsed_time": "2:24:56", "remaining_time": "1:38:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5970, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.0916850943959453e-06, "epoch": 0.597, "percentage": 59.7, "elapsed_time": "2:25:08", "remaining_time": "1:37:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5980, "total_steps": 10000, "loss": 0.2396, "accuracy": 0.8999999761581421, "learning_rate": 2.0830781332097446e-06, "epoch": 0.598, "percentage": 59.8, "elapsed_time": "2:25:19", "remaining_time": "1:37:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5990, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.0744762520849193e-06, "epoch": 0.599, "percentage": 59.9, "elapsed_time": "2:25:29", "remaining_time": "1:37:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6000, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.0658795558326745e-06, "epoch": 0.6, "percentage": 60.0, "elapsed_time": "2:25:42", "remaining_time": "1:37:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6010, "total_steps": 10000, "loss": 0.0029, "accuracy": 1.0, "learning_rate": 2.0572881492010423e-06, "epoch": 0.601, "percentage": 60.1, "elapsed_time": "2:25:58", "remaining_time": "1:36:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6020, "total_steps": 10000, "loss": 1.1745, "accuracy": 0.8999999761581421, "learning_rate": 2.0487021368736002e-06, "epoch": 0.602, "percentage": 60.2, "elapsed_time": "2:26:12", "remaining_time": "1:36:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6030, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.0401216234682e-06, "epoch": 0.603, "percentage": 60.3, "elapsed_time": "2:26:26", "remaining_time": "1:36:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6040, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.031546713535688e-06, "epoch": 0.604, "percentage": 60.4, "elapsed_time": "2:26:35", "remaining_time": "1:36:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6050, "total_steps": 10000, "loss": 0.0528, "accuracy": 1.0, "learning_rate": 2.022977511558638e-06, "epoch": 0.605, "percentage": 60.5, "elapsed_time": "2:26:47", "remaining_time": "1:35:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6060, "total_steps": 10000, "loss": 0.0037, "accuracy": 1.0, "learning_rate": 2.0144141219500707e-06, "epoch": 0.606, "percentage": 60.6, "elapsed_time": "2:27:02", "remaining_time": "1:35:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6070, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.0058566490521848e-06, "epoch": 0.607, "percentage": 60.7, "elapsed_time": "2:27:14", "remaining_time": "1:35:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6080, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.997305197135089e-06, "epoch": 0.608, "percentage": 60.8, "elapsed_time": "2:27:25", "remaining_time": "1:35:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6090, "total_steps": 10000, "loss": 0.2139, "accuracy": 0.8999999761581421, "learning_rate": 1.9887598703955244e-06, "epoch": 0.609, "percentage": 60.9, "elapsed_time": "2:27:36", "remaining_time": "1:34:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6100, "total_steps": 10000, "loss": 0.0025, "accuracy": 1.0, "learning_rate": 1.9802207729556023e-06, "epoch": 0.61, "percentage": 61.0, "elapsed_time": "2:27:47", "remaining_time": "1:34:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6110, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.971688008861529e-06, "epoch": 0.611, "percentage": 61.1, "elapsed_time": "2:28:01", "remaining_time": "1:34:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6120, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.963161682082342e-06, "epoch": 0.612, "percentage": 61.2, "elapsed_time": "2:28:13", "remaining_time": "1:33:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6130, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.9546418965086444e-06, "epoch": 0.613, "percentage": 61.3, "elapsed_time": "2:28:26", "remaining_time": "1:33:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6140, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.946128755951332e-06, "epoch": 0.614, "percentage": 61.4, "elapsed_time": "2:28:38", "remaining_time": "1:33:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6150, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.937622364140338e-06, "epoch": 0.615, "percentage": 61.5, "elapsed_time": "2:28:52", "remaining_time": "1:33:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6160, "total_steps": 10000, "loss": 1.1588, "accuracy": 0.8999999761581421, "learning_rate": 1.9291228247233607e-06, "epoch": 0.616, "percentage": 61.6, "elapsed_time": "2:29:04", "remaining_time": "1:32:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6170, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.9206302412646074e-06, "epoch": 0.617, "percentage": 61.7, "elapsed_time": "2:29:16", "remaining_time": "1:32:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6180, "total_steps": 10000, "loss": 0.0007, "accuracy": 1.0, "learning_rate": 1.912144717243525e-06, "epoch": 0.618, "percentage": 61.8, "elapsed_time": "2:29:28", "remaining_time": "1:32:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6190, "total_steps": 10000, "loss": 1.2391, "accuracy": 0.8999999761581421, "learning_rate": 1.9036663560535484e-06, "epoch": 0.619, "percentage": 61.9, "elapsed_time": "2:29:38", "remaining_time": "1:32:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6200, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.895195261000831e-06, "epoch": 0.62, "percentage": 62.0, "elapsed_time": "2:29:50", "remaining_time": "1:31:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6210, "total_steps": 10000, "loss": 0.3969, "accuracy": 0.8999999761581421, "learning_rate": 1.8867315353029937e-06, "epoch": 0.621, "percentage": 62.1, "elapsed_time": "2:30:00", "remaining_time": "1:31:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6220, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.8782752820878636e-06, "epoch": 0.622, "percentage": 62.2, "elapsed_time": "2:30:14", "remaining_time": "1:31:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6230, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.8698266043922159e-06, "epoch": 0.623, "percentage": 62.3, "elapsed_time": "2:30:25", "remaining_time": "1:31:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6240, "total_steps": 10000, "loss": 0.037, "accuracy": 1.0, "learning_rate": 1.8613856051605242e-06, "epoch": 0.624, "percentage": 62.4, "elapsed_time": "2:30:36", "remaining_time": "1:30:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6250, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.852952387243698e-06, "epoch": 0.625, "percentage": 62.5, "elapsed_time": "2:30:48", "remaining_time": "1:30:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6260, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.8445270533978387e-06, "epoch": 0.626, "percentage": 62.6, "elapsed_time": "2:31:01", "remaining_time": "1:30:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6270, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.836109706282978e-06, "epoch": 0.627, "percentage": 62.7, "elapsed_time": "2:31:12", "remaining_time": "1:29:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6280, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.827700448461836e-06, "epoch": 0.628, "percentage": 62.8, "elapsed_time": "2:31:23", "remaining_time": "1:29:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6290, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.8192993823985643e-06, "epoch": 0.629, "percentage": 62.9, "elapsed_time": "2:31:34", "remaining_time": "1:29:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6300, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.8109066104575023e-06, "epoch": 0.63, "percentage": 63.0, "elapsed_time": "2:31:45", "remaining_time": "1:29:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6310, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.8025222349019273e-06, "epoch": 0.631, "percentage": 63.1, "elapsed_time": "2:31:58", "remaining_time": "1:28:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6320, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.7941463578928088e-06, "epoch": 0.632, "percentage": 63.2, "elapsed_time": "2:32:09", "remaining_time": "1:28:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6330, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.7857790814875665e-06, "epoch": 0.633, "percentage": 63.3, "elapsed_time": "2:32:21", "remaining_time": "1:28:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6340, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.7774205076388207e-06, "epoch": 0.634, "percentage": 63.4, "elapsed_time": "2:32:31", "remaining_time": "1:28:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6350, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.7690707381931585e-06, "epoch": 0.635, "percentage": 63.5, "elapsed_time": "2:32:42", "remaining_time": "1:27:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6360, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.7607298748898844e-06, "epoch": 0.636, "percentage": 63.6, "elapsed_time": "2:32:53", "remaining_time": "1:27:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6370, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.7523980193597837e-06, "epoch": 0.637, "percentage": 63.7, "elapsed_time": "2:33:05", "remaining_time": "1:27:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6380, "total_steps": 10000, "loss": 0.0009, "accuracy": 1.0, "learning_rate": 1.744075273123889e-06, "epoch": 0.638, "percentage": 63.8, "elapsed_time": "2:33:18", "remaining_time": "1:26:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6390, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.735761737592236e-06, "epoch": 0.639, "percentage": 63.9, "elapsed_time": "2:33:30", "remaining_time": "1:26:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6400, "total_steps": 10000, "loss": 0.0124, "accuracy": 1.0, "learning_rate": 1.7274575140626318e-06, "epoch": 0.64, "percentage": 64.0, "elapsed_time": "2:33:43", "remaining_time": "1:26:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6410, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.7191627037194187e-06, "epoch": 0.641, "percentage": 64.1, "elapsed_time": "2:33:55", "remaining_time": "1:26:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6420, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.7108774076322443e-06, "epoch": 0.642, "percentage": 64.2, "elapsed_time": "2:34:06", "remaining_time": "1:25:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6430, "total_steps": 10000, "loss": 1.7103, "accuracy": 0.8999999761581421, "learning_rate": 1.702601726754825e-06, "epoch": 0.643, "percentage": 64.3, "elapsed_time": "2:34:22", "remaining_time": "1:25:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6440, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.6943357619237227e-06, "epoch": 0.644, "percentage": 64.4, "elapsed_time": "2:34:33", "remaining_time": "1:25:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6450, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.686079613857109e-06, "epoch": 0.645, "percentage": 64.5, "elapsed_time": "2:34:44", "remaining_time": "1:25:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6460, "total_steps": 10000, "loss": 1.7072, "accuracy": 0.8999999761581421, "learning_rate": 1.677833383153542e-06, "epoch": 0.646, "percentage": 64.6, "elapsed_time": "2:34:56", "remaining_time": "1:24:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6470, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.6695971702907425e-06, "epoch": 0.647, "percentage": 64.7, "elapsed_time": "2:35:07", "remaining_time": "1:24:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6480, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.661371075624363e-06, "epoch": 0.648, "percentage": 64.8, "elapsed_time": "2:35:20", "remaining_time": "1:24:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6490, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.6531551993867717e-06, "epoch": 0.649, "percentage": 64.9, "elapsed_time": "2:35:31", "remaining_time": "1:24:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6500, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.6449496416858285e-06, "epoch": 0.65, "percentage": 65.0, "elapsed_time": "2:35:42", "remaining_time": "1:23:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6510, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.6367545025036634e-06, "epoch": 0.651, "percentage": 65.1, "elapsed_time": "2:35:54", "remaining_time": "1:23:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6520, "total_steps": 10000, "loss": 0.01, "accuracy": 1.0, "learning_rate": 1.6285698816954626e-06, "epoch": 0.652, "percentage": 65.2, "elapsed_time": "2:36:06", "remaining_time": "1:23:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6530, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.6203958789882457e-06, "epoch": 0.653, "percentage": 65.3, "elapsed_time": "2:36:17", "remaining_time": "1:23:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6540, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.612232593979658e-06, "epoch": 0.654, "percentage": 65.4, "elapsed_time": "2:36:29", "remaining_time": "1:22:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6550, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.6040801261367494e-06, "epoch": 0.655, "percentage": 65.5, "elapsed_time": "2:36:40", "remaining_time": "1:22:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6560, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.5959385747947697e-06, "epoch": 0.656, "percentage": 65.6, "elapsed_time": "2:36:51", "remaining_time": "1:22:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6570, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.5878080391559507e-06, "epoch": 0.657, "percentage": 65.7, "elapsed_time": "2:37:02", "remaining_time": "1:21:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6580, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.5796886182883053e-06, "epoch": 0.658, "percentage": 65.8, "elapsed_time": "2:37:14", "remaining_time": "1:21:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6590, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.5715804111244138e-06, "epoch": 0.659, "percentage": 65.9, "elapsed_time": "2:37:25", "remaining_time": "1:21:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6600, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.56348351646022e-06, "epoch": 0.66, "percentage": 66.0, "elapsed_time": "2:37:37", "remaining_time": "1:21:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6610, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.5553980329538326e-06, "epoch": 0.661, "percentage": 66.1, "elapsed_time": "2:37:49", "remaining_time": "1:20:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6620, "total_steps": 10000, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 1.547324059124315e-06, "epoch": 0.662, "percentage": 66.2, "elapsed_time": "2:38:01", "remaining_time": "1:20:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6630, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.539261693350491e-06, "epoch": 0.663, "percentage": 66.3, "elapsed_time": "2:38:12", "remaining_time": "1:20:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6640, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.5312110338697427e-06, "epoch": 0.664, "percentage": 66.4, "elapsed_time": "2:38:24", "remaining_time": "1:20:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6650, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.5231721787768162e-06, "epoch": 0.665, "percentage": 66.5, "elapsed_time": "2:38:37", "remaining_time": "1:19:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6660, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.5151452260226224e-06, "epoch": 0.666, "percentage": 66.6, "elapsed_time": "2:38:51", "remaining_time": "1:19:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6670, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.5071302734130488e-06, "epoch": 0.667, "percentage": 66.7, "elapsed_time": "2:39:03", "remaining_time": "1:19:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6680, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.4991274186077632e-06, "epoch": 0.668, "percentage": 66.8, "elapsed_time": "2:39:17", "remaining_time": "1:19:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6690, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.491136759119025e-06, "epoch": 0.669, "percentage": 66.9, "elapsed_time": "2:39:29", "remaining_time": "1:18:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6700, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.4831583923104997e-06, "epoch": 0.67, "percentage": 67.0, "elapsed_time": "2:39:41", "remaining_time": "1:18:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6710, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.4751924153960681e-06, "epoch": 0.671, "percentage": 67.1, "elapsed_time": "2:39:55", "remaining_time": "1:18:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6720, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.467238925438646e-06, "epoch": 0.672, "percentage": 67.2, "elapsed_time": "2:40:08", "remaining_time": "1:18:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6730, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.4592980193489975e-06, "epoch": 0.673, "percentage": 67.3, "elapsed_time": "2:40:20", "remaining_time": "1:17:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6740, "total_steps": 10000, "loss": 0.0217, "accuracy": 1.0, "learning_rate": 1.4513697938845571e-06, "epoch": 0.674, "percentage": 67.4, "elapsed_time": "2:40:33", "remaining_time": "1:17:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6750, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.443454345648252e-06, "epoch": 0.675, "percentage": 67.5, "elapsed_time": "2:40:45", "remaining_time": "1:17:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6760, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.4355517710873184e-06, "epoch": 0.676, "percentage": 67.6, "elapsed_time": "2:40:57", "remaining_time": "1:17:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6770, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.4276621664921358e-06, "epoch": 0.677, "percentage": 67.7, "elapsed_time": "2:41:09", "remaining_time": "1:16:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6780, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.419785627995044e-06, "epoch": 0.678, "percentage": 67.8, "elapsed_time": "2:41:22", "remaining_time": "1:16:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6790, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.4119222515691817e-06, "epoch": 0.679, "percentage": 67.9, "elapsed_time": "2:41:34", "remaining_time": "1:16:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6800, "total_steps": 10000, "loss": 0.1543, "accuracy": 0.8999999761581421, "learning_rate": 1.4040721330273063e-06, "epoch": 0.68, "percentage": 68.0, "elapsed_time": "2:41:46", "remaining_time": "1:16:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6810, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.3962353680206372e-06, "epoch": 0.681, "percentage": 68.1, "elapsed_time": "2:41:59", "remaining_time": "1:15:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6820, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.388412052037682e-06, "epoch": 0.682, "percentage": 68.2, "elapsed_time": "2:42:11", "remaining_time": "1:15:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6830, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.380602280403076e-06, "epoch": 0.683, "percentage": 68.3, "elapsed_time": "2:42:23", "remaining_time": "1:15:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6840, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.3728061482764238e-06, "epoch": 0.684, "percentage": 68.4, "elapsed_time": "2:42:35", "remaining_time": "1:15:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6850, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.3650237506511333e-06, "epoch": 0.685, "percentage": 68.5, "elapsed_time": "2:42:49", "remaining_time": "1:14:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6860, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.3572551823532654e-06, "epoch": 0.686, "percentage": 68.6, "elapsed_time": "2:43:02", "remaining_time": "1:14:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6870, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.349500538040371e-06, "epoch": 0.687, "percentage": 68.7, "elapsed_time": "2:43:15", "remaining_time": "1:14:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6880, "total_steps": 10000, "loss": 0.0015, "accuracy": 1.0, "learning_rate": 1.3417599122003464e-06, "epoch": 0.688, "percentage": 68.8, "elapsed_time": "2:43:26", "remaining_time": "1:14:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6890, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.3340333991502723e-06, "epoch": 0.689, "percentage": 68.9, "elapsed_time": "2:43:37", "remaining_time": "1:13:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6900, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.3263210930352737e-06, "epoch": 0.69, "percentage": 69.0, "elapsed_time": "2:43:49", "remaining_time": "1:13:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6910, "total_steps": 10000, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 1.3186230878273654e-06, "epoch": 0.691, "percentage": 69.1, "elapsed_time": "2:44:01", "remaining_time": "1:13:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6920, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.3109394773243117e-06, "epoch": 0.692, "percentage": 69.2, "elapsed_time": "2:44:14", "remaining_time": "1:13:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6930, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.3032703551484832e-06, "epoch": 0.693, "percentage": 69.3, "elapsed_time": "2:44:26", "remaining_time": "1:12:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6940, "total_steps": 10000, "loss": 0.1174, "accuracy": 0.8999999761581421, "learning_rate": 1.2956158147457116e-06, "epoch": 0.694, "percentage": 69.4, "elapsed_time": "2:44:37", "remaining_time": "1:12:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6950, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.2879759493841577e-06, "epoch": 0.695, "percentage": 69.5, "elapsed_time": "2:44:47", "remaining_time": "1:12:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6960, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.280350852153168e-06, "epoch": 0.696, "percentage": 69.6, "elapsed_time": "2:45:00", "remaining_time": "1:12:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6970, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.272740615962148e-06, "epoch": 0.697, "percentage": 69.7, "elapsed_time": "2:45:13", "remaining_time": "1:11:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6980, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.2651453335394232e-06, "epoch": 0.698, "percentage": 69.8, "elapsed_time": "2:45:27", "remaining_time": "1:11:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6990, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.2575650974311118e-06, "epoch": 0.699, "percentage": 69.9, "elapsed_time": "2:45:38", "remaining_time": "1:11:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7000, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.2500000000000007e-06, "epoch": 0.7, "percentage": 70.0, "elapsed_time": "2:45:49", "remaining_time": "1:11:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7010, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.2424501334244124e-06, "epoch": 0.701, "percentage": 70.1, "elapsed_time": "2:46:10", "remaining_time": "1:10:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7020, "total_steps": 10000, "loss": 0.018, "accuracy": 1.0, "learning_rate": 1.234915589697091e-06, "epoch": 0.702, "percentage": 70.2, "elapsed_time": "2:46:23", "remaining_time": "1:10:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7030, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.2273964606240718e-06, "epoch": 0.703, "percentage": 70.3, "elapsed_time": "2:46:34", "remaining_time": "1:10:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7040, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.2198928378235717e-06, "epoch": 0.704, "percentage": 70.4, "elapsed_time": "2:46:46", "remaining_time": "1:10:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7050, "total_steps": 10000, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 1.2124048127248644e-06, "epoch": 0.705, "percentage": 70.5, "elapsed_time": "2:46:57", "remaining_time": "1:09:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7060, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.204932476567175e-06, "epoch": 0.706, "percentage": 70.6, "elapsed_time": "2:47:09", "remaining_time": "1:09:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7070, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.19747592039856e-06, "epoch": 0.707, "percentage": 70.7, "elapsed_time": "2:47:23", "remaining_time": "1:09:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7080, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.1900352350748026e-06, "epoch": 0.708, "percentage": 70.8, "elapsed_time": "2:47:34", "remaining_time": "1:09:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7090, "total_steps": 10000, "loss": 0.0011, "accuracy": 1.0, "learning_rate": 1.1826105112583061e-06, "epoch": 0.709, "percentage": 70.9, "elapsed_time": "2:47:49", "remaining_time": "1:08:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7100, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.1752018394169882e-06, "epoch": 0.71, "percentage": 71.0, "elapsed_time": "2:48:02", "remaining_time": "1:08:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7110, "total_steps": 10000, "loss": 0.5563, "accuracy": 0.8999999761581421, "learning_rate": 1.1678093098231748e-06, "epoch": 0.711, "percentage": 71.1, "elapsed_time": "2:48:12", "remaining_time": "1:08:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7120, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.160433012552508e-06, "epoch": 0.712, "percentage": 71.2, "elapsed_time": "2:48:24", "remaining_time": "1:08:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7130, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.1530730374828424e-06, "epoch": 0.713, "percentage": 71.3, "elapsed_time": "2:48:37", "remaining_time": "1:07:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7140, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.1457294742931508e-06, "epoch": 0.714, "percentage": 71.4, "elapsed_time": "2:48:51", "remaining_time": "1:07:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7150, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.1384024124624324e-06, "epoch": 0.715, "percentage": 71.5, "elapsed_time": "2:49:02", "remaining_time": "1:07:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7160, "total_steps": 10000, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 1.1310919412686248e-06, "epoch": 0.716, "percentage": 71.6, "elapsed_time": "2:49:15", "remaining_time": "1:07:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7170, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.1237981497875112e-06, "epoch": 0.717, "percentage": 71.7, "elapsed_time": "2:49:26", "remaining_time": "1:06:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7180, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.11652112689164e-06, "epoch": 0.718, "percentage": 71.8, "elapsed_time": "2:49:38", "remaining_time": "1:06:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7190, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.109260961249238e-06, "epoch": 0.719, "percentage": 71.9, "elapsed_time": "2:49:50", "remaining_time": "1:06:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7200, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.1020177413231334e-06, "epoch": 0.72, "percentage": 72.0, "elapsed_time": "2:50:03", "remaining_time": "1:06:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7210, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.0947915553696742e-06, "epoch": 0.721, "percentage": 72.1, "elapsed_time": "2:50:14", "remaining_time": "1:05:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7220, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.0875824914376555e-06, "epoch": 0.722, "percentage": 72.2, "elapsed_time": "2:50:26", "remaining_time": "1:05:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7230, "total_steps": 10000, "loss": 0.4843, "accuracy": 0.8999999761581421, "learning_rate": 1.0803906373672477e-06, "epoch": 0.723, "percentage": 72.3, "elapsed_time": "2:50:39", "remaining_time": "1:05:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7240, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.073216080788921e-06, "epoch": 0.724, "percentage": 72.4, "elapsed_time": "2:50:51", "remaining_time": "1:05:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7250, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.0660589091223854e-06, "epoch": 0.725, "percentage": 72.5, "elapsed_time": "2:51:02", "remaining_time": "1:04:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7260, "total_steps": 10000, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 1.0589192095755172e-06, "epoch": 0.726, "percentage": 72.6, "elapsed_time": "2:51:13", "remaining_time": "1:04:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7270, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.0517970691433035e-06, "epoch": 0.727, "percentage": 72.7, "elapsed_time": "2:51:26", "remaining_time": "1:04:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7280, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.0446925746067768e-06, "epoch": 0.728, "percentage": 72.8, "elapsed_time": "2:51:38", "remaining_time": "1:04:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7290, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.0376058125319614e-06, "epoch": 0.729, "percentage": 72.9, "elapsed_time": "2:51:51", "remaining_time": "1:03:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7300, "total_steps": 10000, "loss": 0.0038, "accuracy": 1.0, "learning_rate": 1.0305368692688175e-06, "epoch": 0.73, "percentage": 73.0, "elapsed_time": "2:52:03", "remaining_time": "1:03:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7310, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.0234858309501864e-06, "epoch": 0.731, "percentage": 73.1, "elapsed_time": "2:52:16", "remaining_time": "1:03:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7320, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.0164527834907468e-06, "epoch": 0.732, "percentage": 73.2, "elapsed_time": "2:52:28", "remaining_time": "1:03:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7330, "total_steps": 10000, "loss": 0.0089, "accuracy": 1.0, "learning_rate": 1.0094378125859602e-06, "epoch": 0.733, "percentage": 73.3, "elapsed_time": "2:52:39", "remaining_time": "1:02:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7340, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.0024410037110356e-06, "epoch": 0.734, "percentage": 73.4, "elapsed_time": "2:52:51", "remaining_time": "1:02:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7350, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 9.95462442119879e-07, "epoch": 0.735, "percentage": 73.5, "elapsed_time": "2:53:02", "remaining_time": "1:02:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7360, "total_steps": 10000, "loss": 0.0176, "accuracy": 1.0, "learning_rate": 9.88502212844063e-07, "epoch": 0.736, "percentage": 73.6, "elapsed_time": "2:53:15", "remaining_time": "1:02:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7370, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 9.815604006917839e-07, "epoch": 0.737, "percentage": 73.7, "elapsed_time": "2:53:27", "remaining_time": "1:01:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7380, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 9.746370902468311e-07, "epoch": 0.738, "percentage": 73.8, "elapsed_time": "2:53:39", "remaining_time": "1:01:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7390, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 9.677323658675594e-07, "epoch": 0.739, "percentage": 73.9, "elapsed_time": "2:53:50", "remaining_time": "1:01:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7400, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 9.608463116858544e-07, "epoch": 0.74, "percentage": 74.0, "elapsed_time": "2:54:03", "remaining_time": "1:01:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7410, "total_steps": 10000, "loss": 0.0036, "accuracy": 1.0, "learning_rate": 9.53979011606115e-07, "epoch": 0.741, "percentage": 74.1, "elapsed_time": "2:54:15", "remaining_time": "1:00:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7420, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 9.471305493042243e-07, "epoch": 0.742, "percentage": 74.2, "elapsed_time": "2:54:28", "remaining_time": "1:00:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7430, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 9.403010082265351e-07, "epoch": 0.743, "percentage": 74.3, "elapsed_time": "2:54:40", "remaining_time": "1:00:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7440, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 9.334904715888496e-07, "epoch": 0.744, "percentage": 74.4, "elapsed_time": "2:54:52", "remaining_time": "1:00:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7450, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 9.266990223754069e-07, "epoch": 0.745, "percentage": 74.5, "elapsed_time": "2:55:04", "remaining_time": "0:59:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7460, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 9.199267433378728e-07, "epoch": 0.746, "percentage": 74.6, "elapsed_time": "2:55:15", "remaining_time": "0:59:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7470, "total_steps": 10000, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 9.131737169943314e-07, "epoch": 0.747, "percentage": 74.7, "elapsed_time": "2:55:27", "remaining_time": "0:59:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7480, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 9.064400256282757e-07, "epoch": 0.748, "percentage": 74.8, "elapsed_time": "2:55:38", "remaining_time": "0:59:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7490, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 8.99725751287611e-07, "epoch": 0.749, "percentage": 74.9, "elapsed_time": "2:55:49", "remaining_time": "0:58:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7500, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 8.930309757836517e-07, "epoch": 0.75, "percentage": 75.0, "elapsed_time": "2:56:01", "remaining_time": "0:58:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7510, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 8.863557806901233e-07, "epoch": 0.751, "percentage": 75.1, "elapsed_time": "2:56:15", "remaining_time": "0:58:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7520, "total_steps": 10000, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 8.797002473421729e-07, "epoch": 0.752, "percentage": 75.2, "elapsed_time": "2:56:25", "remaining_time": "0:58:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7530, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 8.73064456835373e-07, "epoch": 0.753, "percentage": 75.3, "elapsed_time": "2:56:39", "remaining_time": "0:57:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7540, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 8.664484900247363e-07, "epoch": 0.754, "percentage": 75.4, "elapsed_time": "2:56:52", "remaining_time": "0:57:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7550, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 8.598524275237321e-07, "epoch": 0.755, "percentage": 75.5, "elapsed_time": "2:57:03", "remaining_time": "0:57:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7560, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 8.532763497032987e-07, "epoch": 0.756, "percentage": 75.6, "elapsed_time": "2:57:15", "remaining_time": "0:57:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7570, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 8.467203366908708e-07, "epoch": 0.757, "percentage": 75.7, "elapsed_time": "2:57:27", "remaining_time": "0:56:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7580, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 8.40184468369396e-07, "epoch": 0.758, "percentage": 75.8, "elapsed_time": "2:57:39", "remaining_time": "0:56:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7590, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 8.336688243763691e-07, "epoch": 0.759, "percentage": 75.9, "elapsed_time": "2:57:53", "remaining_time": "0:56:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7600, "total_steps": 10000, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 8.271734841028553e-07, "epoch": 0.76, "percentage": 76.0, "elapsed_time": "2:58:04", "remaining_time": "0:56:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7610, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 8.206985266925249e-07, "epoch": 0.761, "percentage": 76.1, "elapsed_time": "2:58:16", "remaining_time": "0:55:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7620, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 8.142440310406923e-07, "epoch": 0.762, "percentage": 76.2, "elapsed_time": "2:58:27", "remaining_time": "0:55:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7630, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 8.078100757933486e-07, "epoch": 0.763, "percentage": 76.3, "elapsed_time": "2:58:39", "remaining_time": "0:55:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7640, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 8.013967393462094e-07, "epoch": 0.764, "percentage": 76.4, "elapsed_time": "2:58:50", "remaining_time": "0:55:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7650, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 7.950040998437541e-07, "epoch": 0.765, "percentage": 76.5, "elapsed_time": "2:59:01", "remaining_time": "0:54:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7660, "total_steps": 10000, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 7.886322351782782e-07, "epoch": 0.766, "percentage": 76.6, "elapsed_time": "2:59:13", "remaining_time": "0:54:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7670, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 7.822812229889429e-07, "epoch": 0.767, "percentage": 76.7, "elapsed_time": "2:59:27", "remaining_time": "0:54:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7680, "total_steps": 10000, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 7.759511406608255e-07, "epoch": 0.768, "percentage": 76.8, "elapsed_time": "2:59:38", "remaining_time": "0:54:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7690, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 7.696420653239834e-07, "epoch": 0.769, "percentage": 76.9, "elapsed_time": "2:59:50", "remaining_time": "0:54:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7700, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 7.633540738525066e-07, "epoch": 0.77, "percentage": 77.0, "elapsed_time": "3:00:04", "remaining_time": "0:53:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7710, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 7.57087242863589e-07, "epoch": 0.771, "percentage": 77.1, "elapsed_time": "3:00:15", "remaining_time": "0:53:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7720, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 7.508416487165864e-07, "epoch": 0.772, "percentage": 77.2, "elapsed_time": "3:00:30", "remaining_time": "0:53:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7730, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 7.446173675120943e-07, "epoch": 0.773, "percentage": 77.3, "elapsed_time": "3:00:43", "remaining_time": "0:53:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7740, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 7.384144750910133e-07, "epoch": 0.774, "percentage": 77.4, "elapsed_time": "3:00:55", "remaining_time": "0:52:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7750, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 7.322330470336314e-07, "epoch": 0.775, "percentage": 77.5, "elapsed_time": "3:01:10", "remaining_time": "0:52:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7760, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 7.260731586586983e-07, "epoch": 0.776, "percentage": 77.6, "elapsed_time": "3:01:21", "remaining_time": "0:52:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7770, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 7.199348850225091e-07, "epoch": 0.777, "percentage": 77.7, "elapsed_time": "3:01:31", "remaining_time": "0:52:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7780, "total_steps": 10000, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 7.138183009179922e-07, "epoch": 0.778, "percentage": 77.8, "elapsed_time": "3:01:42", "remaining_time": "0:51:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7790, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 7.077234808737932e-07, "epoch": 0.779, "percentage": 77.9, "elapsed_time": "3:01:54", "remaining_time": "0:51:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7800, "total_steps": 10000, "loss": 0.4145, "accuracy": 0.8999999761581421, "learning_rate": 7.016504991533727e-07, "epoch": 0.78, "percentage": 78.0, "elapsed_time": "3:02:07", "remaining_time": "0:51:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7810, "total_steps": 10000, "loss": 0.0058, "accuracy": 1.0, "learning_rate": 6.955994297540947e-07, "epoch": 0.781, "percentage": 78.1, "elapsed_time": "3:02:20", "remaining_time": "0:51:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7820, "total_steps": 10000, "loss": 0.0111, "accuracy": 1.0, "learning_rate": 6.895703464063319e-07, "epoch": 0.782, "percentage": 78.2, "elapsed_time": "3:02:31", "remaining_time": "0:50:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7830, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 6.835633225725604e-07, "epoch": 0.783, "percentage": 78.3, "elapsed_time": "3:02:44", "remaining_time": "0:50:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7840, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 6.775784314464717e-07, "epoch": 0.784, "percentage": 78.4, "elapsed_time": "3:02:55", "remaining_time": "0:50:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7850, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 6.716157459520739e-07, "epoch": 0.785, "percentage": 78.5, "elapsed_time": "3:03:07", "remaining_time": "0:50:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7860, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 6.656753387428089e-07, "epoch": 0.786, "percentage": 78.6, "elapsed_time": "3:03:17", "remaining_time": "0:49:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7870, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 6.597572822006643e-07, "epoch": 0.787, "percentage": 78.7, "elapsed_time": "3:03:30", "remaining_time": "0:49:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7880, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 6.538616484352902e-07, "epoch": 0.788, "percentage": 78.8, "elapsed_time": "3:03:44", "remaining_time": "0:49:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7890, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 6.479885092831248e-07, "epoch": 0.789, "percentage": 78.9, "elapsed_time": "3:03:56", "remaining_time": "0:49:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7900, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 6.421379363065142e-07, "epoch": 0.79, "percentage": 79.0, "elapsed_time": "3:04:08", "remaining_time": "0:48:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7910, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 6.363100007928447e-07, "epoch": 0.791, "percentage": 79.1, "elapsed_time": "3:04:20", "remaining_time": "0:48:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7920, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 6.305047737536707e-07, "epoch": 0.792, "percentage": 79.2, "elapsed_time": "3:04:32", "remaining_time": "0:48:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7930, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 6.247223259238513e-07, "epoch": 0.793, "percentage": 79.3, "elapsed_time": "3:04:43", "remaining_time": "0:48:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7940, "total_steps": 10000, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 6.189627277606894e-07, "epoch": 0.794, "percentage": 79.4, "elapsed_time": "3:04:54", "remaining_time": "0:47:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7950, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 6.1322604944307e-07, "epoch": 0.795, "percentage": 79.5, "elapsed_time": "3:05:08", "remaining_time": "0:47:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7960, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 6.075123608706093e-07, "epoch": 0.796, "percentage": 79.6, "elapsed_time": "3:05:20", "remaining_time": "0:47:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7970, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 6.01821731662798e-07, "epoch": 0.797, "percentage": 79.7, "elapsed_time": "3:05:33", "remaining_time": "0:47:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7980, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 5.961542311581586e-07, "epoch": 0.798, "percentage": 79.8, "elapsed_time": "3:05:45", "remaining_time": "0:47:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7990, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 5.905099284133953e-07, "epoch": 0.799, "percentage": 79.9, "elapsed_time": "3:05:56", "remaining_time": "0:46:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8000, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 5.848888922025553e-07, "epoch": 0.8, "percentage": 80.0, "elapsed_time": "3:06:07", "remaining_time": "0:46:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8010, "total_steps": 10000, "loss": 0.3056, "accuracy": 0.8999999761581421, "learning_rate": 5.792911910161922e-07, "epoch": 0.801, "percentage": 80.1, "elapsed_time": "3:06:27", "remaining_time": "0:46:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8020, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 5.737168930605272e-07, "epoch": 0.802, "percentage": 80.2, "elapsed_time": "3:06:39", "remaining_time": "0:46:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8030, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 5.681660662566225e-07, "epoch": 0.803, "percentage": 80.3, "elapsed_time": "3:06:51", "remaining_time": "0:45:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8040, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 5.626387782395515e-07, "epoch": 0.804, "percentage": 80.4, "elapsed_time": "3:07:02", "remaining_time": "0:45:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8050, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 5.571350963575728e-07, "epoch": 0.805, "percentage": 80.5, "elapsed_time": "3:07:14", "remaining_time": "0:45:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8060, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 5.516550876713142e-07, "epoch": 0.806, "percentage": 80.6, "elapsed_time": "3:07:27", "remaining_time": "0:45:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8070, "total_steps": 10000, "loss": 0.0045, "accuracy": 1.0, "learning_rate": 5.461988189529529e-07, "epoch": 0.807, "percentage": 80.7, "elapsed_time": "3:07:39", "remaining_time": "0:44:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8080, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 5.407663566854008e-07, "epoch": 0.808, "percentage": 80.8, "elapsed_time": "3:07:51", "remaining_time": "0:44:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8090, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 5.353577670614951e-07, "epoch": 0.809, "percentage": 80.9, "elapsed_time": "3:08:02", "remaining_time": "0:44:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8100, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 5.299731159831953e-07, "epoch": 0.81, "percentage": 81.0, "elapsed_time": "3:08:14", "remaining_time": "0:44:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8110, "total_steps": 10000, "loss": 0.6231, "accuracy": 0.8999999761581421, "learning_rate": 5.24612469060774e-07, "epoch": 0.811, "percentage": 81.1, "elapsed_time": "3:08:26", "remaining_time": "0:43:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8120, "total_steps": 10000, "loss": 0.0581, "accuracy": 1.0, "learning_rate": 5.192758916120236e-07, "epoch": 0.812, "percentage": 81.2, "elapsed_time": "3:08:39", "remaining_time": "0:43:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8130, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 5.139634486614544e-07, "epoch": 0.813, "percentage": 81.3, "elapsed_time": "3:08:53", "remaining_time": "0:43:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8140, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 5.086752049395097e-07, "epoch": 0.814, "percentage": 81.4, "elapsed_time": "3:09:04", "remaining_time": "0:43:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8150, "total_steps": 10000, "loss": 0.0012, "accuracy": 1.0, "learning_rate": 5.034112248817685e-07, "epoch": 0.815, "percentage": 81.5, "elapsed_time": "3:09:16", "remaining_time": "0:42:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8160, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.981715726281666e-07, "epoch": 0.816, "percentage": 81.6, "elapsed_time": "3:09:27", "remaining_time": "0:42:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8170, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.929563120222142e-07, "epoch": 0.817, "percentage": 81.7, "elapsed_time": "3:09:39", "remaining_time": "0:42:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8180, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.87765506610215e-07, "epoch": 0.818, "percentage": 81.8, "elapsed_time": "3:09:53", "remaining_time": "0:42:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8190, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.825992196404958e-07, "epoch": 0.819, "percentage": 81.9, "elapsed_time": "3:10:04", "remaining_time": "0:42:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8200, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.774575140626317e-07, "epoch": 0.82, "percentage": 82.0, "elapsed_time": "3:10:16", "remaining_time": "0:41:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8210, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.7234045252668393e-07, "epoch": 0.821, "percentage": 82.1, "elapsed_time": "3:10:30", "remaining_time": "0:41:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8220, "total_steps": 10000, "loss": 0.0048, "accuracy": 1.0, "learning_rate": 4.672480973824312e-07, "epoch": 0.822, "percentage": 82.2, "elapsed_time": "3:10:41", "remaining_time": "0:41:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8230, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.6218051067861423e-07, "epoch": 0.823, "percentage": 82.3, "elapsed_time": "3:10:53", "remaining_time": "0:41:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8240, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.5713775416217884e-07, "epoch": 0.824, "percentage": 82.4, "elapsed_time": "3:11:05", "remaining_time": "0:40:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8250, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.5211988927752026e-07, "epoch": 0.825, "percentage": 82.5, "elapsed_time": "3:11:20", "remaining_time": "0:40:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8260, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.4712697716573994e-07, "epoch": 0.826, "percentage": 82.6, "elapsed_time": "3:11:32", "remaining_time": "0:40:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8270, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.421590786638952e-07, "epoch": 0.827, "percentage": 82.7, "elapsed_time": "3:11:44", "remaining_time": "0:40:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8280, "total_steps": 10000, "loss": 0.0242, "accuracy": 1.0, "learning_rate": 4.372162543042624e-07, "epoch": 0.828, "percentage": 82.8, "elapsed_time": "3:11:57", "remaining_time": "0:39:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8290, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.3229856431359516e-07, "epoch": 0.829, "percentage": 82.9, "elapsed_time": "3:12:09", "remaining_time": "0:39:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8300, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.27406068612396e-07, "epoch": 0.83, "percentage": 83.0, "elapsed_time": "3:12:22", "remaining_time": "0:39:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8310, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.225388268141797e-07, "epoch": 0.831, "percentage": 83.1, "elapsed_time": "3:12:35", "remaining_time": "0:39:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8320, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.1769689822475147e-07, "epoch": 0.832, "percentage": 83.2, "elapsed_time": "3:12:47", "remaining_time": "0:38:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8330, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.12880341841484e-07, "epoch": 0.833, "percentage": 83.3, "elapsed_time": "3:13:00", "remaining_time": "0:38:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8340, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.0808921635259595e-07, "epoch": 0.834, "percentage": 83.4, "elapsed_time": "3:13:12", "remaining_time": "0:38:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8350, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.033235801364402e-07, "epoch": 0.835, "percentage": 83.5, "elapsed_time": "3:13:23", "remaining_time": "0:38:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8360, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.9858349126078945e-07, "epoch": 0.836, "percentage": 83.6, "elapsed_time": "3:13:35", "remaining_time": "0:37:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8370, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.938690074821314e-07, "epoch": 0.837, "percentage": 83.7, "elapsed_time": "3:13:46", "remaining_time": "0:37:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8380, "total_steps": 10000, "loss": 0.2999, "accuracy": 0.8999999761581421, "learning_rate": 3.891801862449629e-07, "epoch": 0.838, "percentage": 83.8, "elapsed_time": "3:13:58", "remaining_time": "0:37:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8390, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.8451708468109026e-07, "epoch": 0.839, "percentage": 83.9, "elapsed_time": "3:14:10", "remaining_time": "0:37:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8400, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.798797596089351e-07, "epoch": 0.84, "percentage": 84.0, "elapsed_time": "3:14:23", "remaining_time": "0:37:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8410, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.7526826753284065e-07, "epoch": 0.841, "percentage": 84.1, "elapsed_time": "3:14:34", "remaining_time": "0:36:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8420, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.7068266464238085e-07, "epoch": 0.842, "percentage": 84.2, "elapsed_time": "3:14:48", "remaining_time": "0:36:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8430, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.661230068116811e-07, "epoch": 0.843, "percentage": 84.3, "elapsed_time": "3:14:59", "remaining_time": "0:36:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8440, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.615893495987335e-07, "epoch": 0.844, "percentage": 84.4, "elapsed_time": "3:15:12", "remaining_time": "0:36:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8450, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.5708174824471947e-07, "epoch": 0.845, "percentage": 84.5, "elapsed_time": "3:15:23", "remaining_time": "0:35:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8460, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.5260025767333894e-07, "epoch": 0.846, "percentage": 84.6, "elapsed_time": "3:15:36", "remaining_time": "0:35:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8470, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.481449324901412e-07, "epoch": 0.847, "percentage": 84.7, "elapsed_time": "3:15:48", "remaining_time": "0:35:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8480, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.4371582698185636e-07, "epoch": 0.848, "percentage": 84.8, "elapsed_time": "3:16:00", "remaining_time": "0:35:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8490, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.393129951157384e-07, "epoch": 0.849, "percentage": 84.9, "elapsed_time": "3:16:13", "remaining_time": "0:34:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8500, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.3493649053890325e-07, "epoch": 0.85, "percentage": 85.0, "elapsed_time": "3:16:25", "remaining_time": "0:34:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8510, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.3058636657767927e-07, "epoch": 0.851, "percentage": 85.1, "elapsed_time": "3:16:36", "remaining_time": "0:34:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8520, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.262626762369525e-07, "epoch": 0.852, "percentage": 85.2, "elapsed_time": "3:16:49", "remaining_time": "0:34:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8530, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.219654721995266e-07, "epoch": 0.853, "percentage": 85.3, "elapsed_time": "3:17:00", "remaining_time": "0:33:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8540, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.176948068254762e-07, "epoch": 0.854, "percentage": 85.4, "elapsed_time": "3:17:13", "remaining_time": "0:33:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8550, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.134507321515107e-07, "epoch": 0.855, "percentage": 85.5, "elapsed_time": "3:17:26", "remaining_time": "0:33:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8560, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.0923329989034134e-07, "epoch": 0.856, "percentage": 85.6, "elapsed_time": "3:17:37", "remaining_time": "0:33:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8570, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.050425614300487e-07, "epoch": 0.857, "percentage": 85.7, "elapsed_time": "3:17:48", "remaining_time": "0:33:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8580, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.0087856783345916e-07, "epoch": 0.858, "percentage": 85.8, "elapsed_time": "3:18:03", "remaining_time": "0:32:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8590, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.967413698375196e-07, "epoch": 0.859, "percentage": 85.9, "elapsed_time": "3:18:16", "remaining_time": "0:32:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8600, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.9263101785268253e-07, "epoch": 0.86, "percentage": 86.0, "elapsed_time": "3:18:27", "remaining_time": "0:32:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8610, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.8854756196229017e-07, "epoch": 0.861, "percentage": 86.1, "elapsed_time": "3:18:40", "remaining_time": "0:32:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8620, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.844910519219632e-07, "epoch": 0.862, "percentage": 86.2, "elapsed_time": "3:18:52", "remaining_time": "0:31:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8630, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.8046153715899695e-07, "epoch": 0.863, "percentage": 86.3, "elapsed_time": "3:19:04", "remaining_time": "0:31:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8640, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.7645906677175594e-07, "epoch": 0.864, "percentage": 86.4, "elapsed_time": "3:19:16", "remaining_time": "0:31:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8650, "total_steps": 10000, "loss": 0.0006, "accuracy": 1.0, "learning_rate": 2.7248368952908055e-07, "epoch": 0.865, "percentage": 86.5, "elapsed_time": "3:19:28", "remaining_time": "0:31:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8660, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.6853545386968607e-07, "epoch": 0.866, "percentage": 86.6, "elapsed_time": "3:19:39", "remaining_time": "0:30:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8670, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.6461440790157974e-07, "epoch": 0.867, "percentage": 86.7, "elapsed_time": "3:19:51", "remaining_time": "0:30:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8680, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.6072059940146775e-07, "epoch": 0.868, "percentage": 86.8, "elapsed_time": "3:20:02", "remaining_time": "0:30:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8690, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.568540758141791e-07, "epoch": 0.869, "percentage": 86.9, "elapsed_time": "3:20:12", "remaining_time": "0:30:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8700, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.53014884252083e-07, "epoch": 0.87, "percentage": 87.0, "elapsed_time": "3:20:23", "remaining_time": "0:29:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8710, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.492030714945162e-07, "epoch": 0.871, "percentage": 87.1, "elapsed_time": "3:20:35", "remaining_time": "0:29:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8720, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.454186839872158e-07, "epoch": 0.872, "percentage": 87.2, "elapsed_time": "3:20:46", "remaining_time": "0:29:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8730, "total_steps": 10000, "loss": 0.4983, "accuracy": 0.8999999761581421, "learning_rate": 2.416617678417482e-07, "epoch": 0.873, "percentage": 87.3, "elapsed_time": "3:20:57", "remaining_time": "0:29:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8740, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.3793236883495164e-07, "epoch": 0.874, "percentage": 87.4, "elapsed_time": "3:21:08", "remaining_time": "0:28:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8750, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.3423053240837518e-07, "epoch": 0.875, "percentage": 87.5, "elapsed_time": "3:21:19", "remaining_time": "0:28:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8760, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.3055630366772857e-07, "epoch": 0.876, "percentage": 87.6, "elapsed_time": "3:21:31", "remaining_time": "0:28:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8770, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.269097273823287e-07, "epoch": 0.877, "percentage": 87.7, "elapsed_time": "3:21:43", "remaining_time": "0:28:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8780, "total_steps": 10000, "loss": 0.7611, "accuracy": 0.8999999761581421, "learning_rate": 2.2329084798455747e-07, "epoch": 0.878, "percentage": 87.8, "elapsed_time": "3:21:55", "remaining_time": "0:28:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8790, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.1969970956931762e-07, "epoch": 0.879, "percentage": 87.9, "elapsed_time": "3:22:07", "remaining_time": "0:27:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8800, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.1613635589349756e-07, "epoch": 0.88, "percentage": 88.0, "elapsed_time": "3:22:18", "remaining_time": "0:27:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8810, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.1260083037543817e-07, "epoch": 0.881, "percentage": 88.1, "elapsed_time": "3:22:28", "remaining_time": "0:27:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8820, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.0909317609440093e-07, "epoch": 0.882, "percentage": 88.2, "elapsed_time": "3:22:38", "remaining_time": "0:27:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8830, "total_steps": 10000, "loss": 0.0019, "accuracy": 1.0, "learning_rate": 2.0561343579004716e-07, "epoch": 0.883, "percentage": 88.3, "elapsed_time": "3:22:50", "remaining_time": "0:26:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8840, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.0216165186191406e-07, "epoch": 0.884, "percentage": 88.4, "elapsed_time": "3:23:02", "remaining_time": "0:26:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8850, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.9873786636889908e-07, "epoch": 0.885, "percentage": 88.5, "elapsed_time": "3:23:13", "remaining_time": "0:26:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8860, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.95342121028749e-07, "epoch": 0.886, "percentage": 88.6, "elapsed_time": "3:23:27", "remaining_time": "0:26:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8870, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.9197445721754777e-07, "epoch": 0.887, "percentage": 88.7, "elapsed_time": "3:23:40", "remaining_time": "0:25:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8880, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.8863491596921745e-07, "epoch": 0.888, "percentage": 88.8, "elapsed_time": "3:23:52", "remaining_time": "0:25:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8890, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.8532353797501318e-07, "epoch": 0.889, "percentage": 88.9, "elapsed_time": "3:24:05", "remaining_time": "0:25:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8900, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.8204036358303173e-07, "epoch": 0.89, "percentage": 89.0, "elapsed_time": "3:24:16", "remaining_time": "0:25:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8910, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.787854327977162e-07, "epoch": 0.891, "percentage": 89.1, "elapsed_time": "3:24:29", "remaining_time": "0:25:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8920, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.7555878527937164e-07, "epoch": 0.892, "percentage": 89.2, "elapsed_time": "3:24:41", "remaining_time": "0:24:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8930, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.7236046034367959e-07, "epoch": 0.893, "percentage": 89.3, "elapsed_time": "3:24:52", "remaining_time": "0:24:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8940, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.6919049696121957e-07, "epoch": 0.894, "percentage": 89.4, "elapsed_time": "3:25:05", "remaining_time": "0:24:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8950, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.6604893375699594e-07, "epoch": 0.895, "percentage": 89.5, "elapsed_time": "3:25:19", "remaining_time": "0:24:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8960, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.629358090099639e-07, "epoch": 0.896, "percentage": 89.6, "elapsed_time": "3:25:33", "remaining_time": "0:23:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8970, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.5985116065256683e-07, "epoch": 0.897, "percentage": 89.7, "elapsed_time": "3:25:45", "remaining_time": "0:23:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8980, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.567950262702714e-07, "epoch": 0.898, "percentage": 89.8, "elapsed_time": "3:25:55", "remaining_time": "0:23:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8990, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.5376744310111019e-07, "epoch": 0.899, "percentage": 89.9, "elapsed_time": "3:26:06", "remaining_time": "0:23:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9000, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.507684480352292e-07, "epoch": 0.9, "percentage": 90.0, "elapsed_time": "3:26:17", "remaining_time": "0:22:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9010, "total_steps": 10000, "loss": 0.6933, "accuracy": 0.8999999761581421, "learning_rate": 1.4779807761443638e-07, "epoch": 0.901, "percentage": 90.1, "elapsed_time": "3:26:35", "remaining_time": "0:22:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9020, "total_steps": 10000, "loss": 0.004, "accuracy": 1.0, "learning_rate": 1.4485636803175828e-07, "epoch": 0.902, "percentage": 90.2, "elapsed_time": "3:26:48", "remaining_time": "0:22:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9030, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.419433551309976e-07, "epoch": 0.903, "percentage": 90.3, "elapsed_time": "3:26:59", "remaining_time": "0:22:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9040, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.3905907440629752e-07, "epoch": 0.904, "percentage": 90.4, "elapsed_time": "3:27:10", "remaining_time": "0:22:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9050, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.362035610017079e-07, "epoch": 0.905, "percentage": 90.5, "elapsed_time": "3:27:24", "remaining_time": "0:21:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9060, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.3337684971075932e-07, "epoch": 0.906, "percentage": 90.6, "elapsed_time": "3:27:35", "remaining_time": "0:21:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9070, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.305789749760361e-07, "epoch": 0.907, "percentage": 90.7, "elapsed_time": "3:27:47", "remaining_time": "0:21:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9080, "total_steps": 10000, "loss": 0.1366, "accuracy": 0.8999999761581421, "learning_rate": 1.278099708887587e-07, "epoch": 0.908, "percentage": 90.8, "elapsed_time": "3:27:58", "remaining_time": "0:21:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9090, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.2506987118836912e-07, "epoch": 0.909, "percentage": 90.9, "elapsed_time": "3:28:10", "remaining_time": "0:20:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9100, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.223587092621162e-07, "epoch": 0.91, "percentage": 91.0, "elapsed_time": "3:28:22", "remaining_time": "0:20:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9110, "total_steps": 10000, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 1.1967651814465353e-07, "epoch": 0.911, "percentage": 91.1, "elapsed_time": "3:28:35", "remaining_time": "0:20:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9120, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.1702333051763271e-07, "epoch": 0.912, "percentage": 91.2, "elapsed_time": "3:28:48", "remaining_time": "0:20:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9130, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.1439917870930795e-07, "epoch": 0.913, "percentage": 91.3, "elapsed_time": "3:29:01", "remaining_time": "0:19:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9140, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.1180409469414094e-07, "epoch": 0.914, "percentage": 91.4, "elapsed_time": "3:29:14", "remaining_time": "0:19:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9150, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.0923811009241142e-07, "epoch": 0.915, "percentage": 91.5, "elapsed_time": "3:29:26", "remaining_time": "0:19:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9160, "total_steps": 10000, "loss": 0.0247, "accuracy": 1.0, "learning_rate": 1.067012561698319e-07, "epoch": 0.916, "percentage": 91.6, "elapsed_time": "3:29:39", "remaining_time": "0:19:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9170, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.041935638371669e-07, "epoch": 0.917, "percentage": 91.7, "elapsed_time": "3:29:50", "remaining_time": "0:18:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9180, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.0171506364985622e-07, "epoch": 0.918, "percentage": 91.8, "elapsed_time": "3:30:02", "remaining_time": "0:18:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9190, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 9.926578580764234e-08, "epoch": 0.919, "percentage": 91.9, "elapsed_time": "3:30:14", "remaining_time": "0:18:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9200, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 9.684576015420277e-08, "epoch": 0.92, "percentage": 92.0, "elapsed_time": "3:30:26", "remaining_time": "0:18:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9210, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 9.445501617678654e-08, "epoch": 0.921, "percentage": 92.1, "elapsed_time": "3:30:40", "remaining_time": "0:18:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9220, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 9.209358300585474e-08, "epoch": 0.922, "percentage": 92.2, "elapsed_time": "3:30:54", "remaining_time": "0:17:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9230, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 8.9761489414725e-08, "epoch": 0.923, "percentage": 92.3, "elapsed_time": "3:31:07", "remaining_time": "0:17:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9240, "total_steps": 10000, "loss": 0.8828, "accuracy": 0.8999999761581421, "learning_rate": 8.745876381922147e-08, "epoch": 0.924, "percentage": 92.4, "elapsed_time": "3:31:18", "remaining_time": "0:17:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9250, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 8.518543427732951e-08, "epoch": 0.925, "percentage": 92.5, "elapsed_time": "3:31:29", "remaining_time": "0:17:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9260, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 8.294152848885156e-08, "epoch": 0.926, "percentage": 92.6, "elapsed_time": "3:31:43", "remaining_time": "0:16:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9270, "total_steps": 10000, "loss": 0.0008, "accuracy": 1.0, "learning_rate": 8.072707379507217e-08, "epoch": 0.927, "percentage": 92.7, "elapsed_time": "3:31:55", "remaining_time": "0:16:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9280, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 7.854209717842231e-08, "epoch": 0.928, "percentage": 92.8, "elapsed_time": "3:32:08", "remaining_time": "0:16:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9290, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 7.638662526215284e-08, "epoch": 0.929, "percentage": 92.9, "elapsed_time": "3:32:21", "remaining_time": "0:16:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9300, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 7.426068431000883e-08, "epoch": 0.93, "percentage": 93.0, "elapsed_time": "3:32:34", "remaining_time": "0:16:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9310, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 7.216430022591009e-08, "epoch": 0.931, "percentage": 93.1, "elapsed_time": "3:32:48", "remaining_time": "0:15:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9320, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 7.009749855363457e-08, "epoch": 0.932, "percentage": 93.2, "elapsed_time": "3:33:00", "remaining_time": "0:15:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9330, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 6.806030447650879e-08, "epoch": 0.933, "percentage": 93.3, "elapsed_time": "3:33:11", "remaining_time": "0:15:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9340, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 6.605274281709929e-08, "epoch": 0.934, "percentage": 93.4, "elapsed_time": "3:33:22", "remaining_time": "0:15:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9350, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 6.407483803691216e-08, "epoch": 0.935, "percentage": 93.5, "elapsed_time": "3:33:33", "remaining_time": "0:14:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9360, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 6.212661423609184e-08, "epoch": 0.936, "percentage": 93.6, "elapsed_time": "3:33:46", "remaining_time": "0:14:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9370, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 6.020809515313141e-08, "epoch": 0.937, "percentage": 93.7, "elapsed_time": "3:37:40", "remaining_time": "0:14:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9380, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 5.83193041645802e-08, "epoch": 0.938, "percentage": 93.8, "elapsed_time": "3:38:33", "remaining_time": "0:14:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9390, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 5.6460264284760316e-08, "epoch": 0.939, "percentage": 93.9, "elapsed_time": "3:39:04", "remaining_time": "0:14:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9400, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 5.463099816548578e-08, "epoch": 0.94, "percentage": 94.0, "elapsed_time": "3:40:45", "remaining_time": "0:14:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9410, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 5.283152809578751e-08, "epoch": 0.941, "percentage": 94.1, "elapsed_time": "3:41:36", "remaining_time": "0:13:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9420, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 5.106187600163987e-08, "epoch": 0.942, "percentage": 94.2, "elapsed_time": "3:46:49", "remaining_time": "0:13:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9430, "total_steps": 10000, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 4.932206344569562e-08, "epoch": 0.943, "percentage": 94.3, "elapsed_time": "3:49:07", "remaining_time": "0:13:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9440, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.761211162702117e-08, "epoch": 0.944, "percentage": 94.4, "elapsed_time": "3:49:55", "remaining_time": "0:13:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9450, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.593204138084006e-08, "epoch": 0.945, "percentage": 94.5, "elapsed_time": "3:50:46", "remaining_time": "0:13:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9460, "total_steps": 10000, "loss": 0.0865, "accuracy": 0.8999999761581421, "learning_rate": 4.428187317827848e-08, "epoch": 0.946, "percentage": 94.6, "elapsed_time": "3:51:42", "remaining_time": "0:13:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9470, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.26616271261146e-08, "epoch": 0.947, "percentage": 94.7, "elapsed_time": "3:52:53", "remaining_time": "0:13:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9480, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.1071322966535487e-08, "epoch": 0.948, "percentage": 94.8, "elapsed_time": "3:53:34", "remaining_time": "0:12:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9490, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.95109800768953e-08, "epoch": 0.949, "percentage": 94.9, "elapsed_time": "3:54:10", "remaining_time": "0:12:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9500, "total_steps": 10000, "loss": 0.1833, "accuracy": 0.8999999761581421, "learning_rate": 3.798061746947995e-08, "epoch": 0.95, "percentage": 95.0, "elapsed_time": "3:55:08", "remaining_time": "0:12:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9510, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.648025379127479e-08, "epoch": 0.951, "percentage": 95.1, "elapsed_time": "3:57:02", "remaining_time": "0:12:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9520, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.5009907323737826e-08, "epoch": 0.952, "percentage": 95.2, "elapsed_time": "3:58:00", "remaining_time": "0:12:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9530, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.3569595982576584e-08, "epoch": 0.953, "percentage": 95.3, "elapsed_time": "3:59:13", "remaining_time": "0:11:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9540, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.2159337317530234e-08, "epoch": 0.954, "percentage": 95.4, "elapsed_time": "3:59:52", "remaining_time": "0:11:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9550, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.077914851215585e-08, "epoch": 0.955, "percentage": 95.5, "elapsed_time": "4:01:06", "remaining_time": "0:11:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9560, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.9429046383618042e-08, "epoch": 0.956, "percentage": 95.6, "elapsed_time": "4:02:05", "remaining_time": "0:11:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9570, "total_steps": 10000, "loss": 0.2902, "accuracy": 0.8999999761581421, "learning_rate": 2.810904738248549e-08, "epoch": 0.957, "percentage": 95.7, "elapsed_time": "4:02:45", "remaining_time": "0:10:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9580, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.681916759252917e-08, "epoch": 0.958, "percentage": 95.8, "elapsed_time": "4:03:38", "remaining_time": "0:10:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9590, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.555942273052753e-08, "epoch": 0.959, "percentage": 95.9, "elapsed_time": "4:04:32", "remaining_time": "0:10:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9600, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.4329828146074096e-08, "epoch": 0.96, "percentage": 96.0, "elapsed_time": "4:05:18", "remaining_time": "0:10:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9610, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.313039882139101e-08, "epoch": 0.961, "percentage": 96.1, "elapsed_time": "4:05:48", "remaining_time": "0:09:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9620, "total_steps": 10000, "loss": 0.0015, "accuracy": 1.0, "learning_rate": 2.1961149371145795e-08, "epoch": 0.962, "percentage": 96.2, "elapsed_time": "4:06:15", "remaining_time": "0:09:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9630, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.082209404227403e-08, "epoch": 0.963, "percentage": 96.3, "elapsed_time": "4:06:44", "remaining_time": "0:09:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9640, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.9713246713805588e-08, "epoch": 0.964, "percentage": 96.4, "elapsed_time": "4:08:50", "remaining_time": "0:09:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9650, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.8634620896695044e-08, "epoch": 0.965, "percentage": 96.5, "elapsed_time": "4:09:09", "remaining_time": "0:09:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9660, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.7586229733657646e-08, "epoch": 0.966, "percentage": 96.6, "elapsed_time": "4:09:52", "remaining_time": "0:08:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9670, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.6568085999008886e-08, "epoch": 0.967, "percentage": 96.7, "elapsed_time": "4:10:42", "remaining_time": "0:08:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9680, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.5580202098509078e-08, "epoch": 0.968, "percentage": 96.8, "elapsed_time": "4:11:03", "remaining_time": "0:08:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9690, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.4622590069211517e-08, "epoch": 0.969, "percentage": 96.9, "elapsed_time": "4:12:55", "remaining_time": "0:08:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9700, "total_steps": 10000, "loss": 0.0051, "accuracy": 1.0, "learning_rate": 1.3695261579316776e-08, "epoch": 0.97, "percentage": 97.0, "elapsed_time": "4:14:19", "remaining_time": "0:07:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9710, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.2798227928029483e-08, "epoch": 0.971, "percentage": 97.1, "elapsed_time": "4:15:36", "remaining_time": "0:07:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9720, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.193150004542204e-08, "epoch": 0.972, "percentage": 97.2, "elapsed_time": "4:16:00", "remaining_time": "0:07:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9730, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.109508849230001e-08, "epoch": 0.973, "percentage": 97.3, "elapsed_time": "4:16:34", "remaining_time": "0:07:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9740, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.0289003460074165e-08, "epoch": 0.974, "percentage": 97.4, "elapsed_time": "4:18:37", "remaining_time": "0:06:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9750, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 9.513254770636138e-09, "epoch": 0.975, "percentage": 97.5, "elapsed_time": "4:20:30", "remaining_time": "0:06:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9760, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 8.767851876239075e-09, "epoch": 0.976, "percentage": 97.6, "elapsed_time": "4:20:50", "remaining_time": "0:06:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9770, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 8.052803859382174e-09, "epoch": 0.977, "percentage": 97.7, "elapsed_time": "4:21:37", "remaining_time": "0:06:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9780, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 7.368119432699383e-09, "epoch": 0.978, "percentage": 97.8, "elapsed_time": "4:22:20", "remaining_time": "0:05:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9790, "total_steps": 10000, "loss": 0.0011, "accuracy": 1.0, "learning_rate": 6.7138069388547614e-09, "epoch": 0.979, "percentage": 97.9, "elapsed_time": "4:23:15", "remaining_time": "0:05:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9800, "total_steps": 10000, "loss": 0.0056, "accuracy": 1.0, "learning_rate": 6.089874350439507e-09, "epoch": 0.98, "percentage": 98.0, "elapsed_time": "4:24:39", "remaining_time": "0:05:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9810, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 5.4963292698750896e-09, "epoch": 0.981, "percentage": 98.1, "elapsed_time": "4:25:48", "remaining_time": "0:05:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9820, "total_steps": 10000, "loss": 0.0026, "accuracy": 1.0, "learning_rate": 4.933178929321103e-09, "epoch": 0.982, "percentage": 98.2, "elapsed_time": "4:26:23", "remaining_time": "0:04:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9830, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 4.400430190586724e-09, "epoch": 0.983, "percentage": 98.3, "elapsed_time": "4:28:39", "remaining_time": "0:04:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9840, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.8980895450474455e-09, "epoch": 0.984, "percentage": 98.4, "elapsed_time": "4:29:42", "remaining_time": "0:04:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9850, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.4261631135654174e-09, "epoch": 0.985, "percentage": 98.5, "elapsed_time": "4:31:07", "remaining_time": "0:04:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9860, "total_steps": 10000, "loss": 0.0235, "accuracy": 1.0, "learning_rate": 2.984656646415063e-09, "epoch": 0.986, "percentage": 98.6, "elapsed_time": "4:32:32", "remaining_time": "0:03:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9870, "total_steps": 10000, "loss": 0.0283, "accuracy": 1.0, "learning_rate": 2.573575523213412e-09, "epoch": 0.987, "percentage": 98.7, "elapsed_time": "4:33:16", "remaining_time": "0:03:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9880, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.192924752854042e-09, "epoch": 0.988, "percentage": 98.8, "elapsed_time": "4:34:30", "remaining_time": "0:03:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9890, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.842708973447127e-09, "epoch": 0.989, "percentage": 98.9, "elapsed_time": "4:35:05", "remaining_time": "0:03:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9900, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.5229324522605949e-09, "epoch": 0.99, "percentage": 99.0, "elapsed_time": "4:36:31", "remaining_time": "0:02:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9910, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.2335990856710001e-09, "epoch": 0.991, "percentage": 99.1, "elapsed_time": "4:37:07", "remaining_time": "0:02:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9920, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 9.747123991141193e-10, "epoch": 0.992, "percentage": 99.2, "elapsed_time": "4:38:58", "remaining_time": "0:02:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9930, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 7.462755470422078e-10, "epoch": 0.993, "percentage": 99.3, "elapsed_time": "4:39:37", "remaining_time": "0:01:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9940, "total_steps": 10000, "loss": 0.0088, "accuracy": 1.0, "learning_rate": 5.48291312886251e-10, "epoch": 0.994, "percentage": 99.4, "elapsed_time": "4:40:05", "remaining_time": "0:01:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9950, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 3.8076210902182607e-10, "epoch": 0.995, "percentage": 99.5, "elapsed_time": "4:40:46", "remaining_time": "0:01:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9960, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 2.43689976739403e-10, "epoch": 0.996, "percentage": 99.6, "elapsed_time": "4:42:09", "remaining_time": "0:01:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9970, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.3707658621964216e-10, "epoch": 0.997, "percentage": 99.7, "elapsed_time": "4:43:04", "remaining_time": "0:00:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9980, "total_steps": 10000, "loss": 1.2084, "accuracy": 0.8999999761581421, "learning_rate": 6.092323651313293e-11, "epoch": 0.998, "percentage": 99.8, "elapsed_time": "4:44:11", "remaining_time": "0:00:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9990, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 1.5230855524017708e-11, "epoch": 0.999, "percentage": 99.9, "elapsed_time": "4:44:46", "remaining_time": "0:00:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10000, "total_steps": 10000, "loss": 0.0, "accuracy": 1.0, "learning_rate": 0.0, "epoch": 1.0, "percentage": 100.0, "elapsed_time": "4:45:36", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10000, "total_steps": 10000, "epoch": 1.0, "percentage": 100.0, "elapsed_time": "4:45:43", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0}