|
{"current_steps": 10, "total_steps": 2001, "loss": 0.8065, "lr": 5e-06, "epoch": 0.014989694584972832, "percentage": 0.5, "elapsed_time": "0:05:17", "remaining_time": "17:34:40"} |
|
{"current_steps": 20, "total_steps": 2001, "loss": 0.651, "lr": 5e-06, "epoch": 0.029979389169945664, "percentage": 1.0, "elapsed_time": "0:10:32", "remaining_time": "17:23:59"} |
|
{"current_steps": 30, "total_steps": 2001, "loss": 0.6152, "lr": 5e-06, "epoch": 0.044969083754918496, "percentage": 1.5, "elapsed_time": "0:15:49", "remaining_time": "17:19:44"} |
|
{"current_steps": 40, "total_steps": 2001, "loss": 0.5859, "lr": 5e-06, "epoch": 0.05995877833989133, "percentage": 2.0, "elapsed_time": "0:21:03", "remaining_time": "17:12:23"} |
|
{"current_steps": 50, "total_steps": 2001, "loss": 0.5786, "lr": 5e-06, "epoch": 0.07494847292486416, "percentage": 2.5, "elapsed_time": "0:26:14", "remaining_time": "17:04:04"} |
|
{"current_steps": 60, "total_steps": 2001, "loss": 0.5685, "lr": 5e-06, "epoch": 0.08993816750983699, "percentage": 3.0, "elapsed_time": "0:31:25", "remaining_time": "16:56:51"} |
|
{"current_steps": 70, "total_steps": 2001, "loss": 0.5586, "lr": 5e-06, "epoch": 0.10492786209480982, "percentage": 3.5, "elapsed_time": "0:36:36", "remaining_time": "16:49:42"} |
|
{"current_steps": 80, "total_steps": 2001, "loss": 0.5529, "lr": 5e-06, "epoch": 0.11991755667978266, "percentage": 4.0, "elapsed_time": "0:41:47", "remaining_time": "16:43:22"} |
|
{"current_steps": 90, "total_steps": 2001, "loss": 0.5461, "lr": 5e-06, "epoch": 0.13490725126475547, "percentage": 4.5, "elapsed_time": "0:47:01", "remaining_time": "16:38:32"} |
|
{"current_steps": 100, "total_steps": 2001, "loss": 0.5381, "lr": 5e-06, "epoch": 0.14989694584972832, "percentage": 5.0, "elapsed_time": "0:52:16", "remaining_time": "16:33:46"} |
|
{"current_steps": 110, "total_steps": 2001, "loss": 0.5359, "lr": 5e-06, "epoch": 0.16488664043470114, "percentage": 5.5, "elapsed_time": "0:57:32", "remaining_time": "16:29:03"} |
|
{"current_steps": 120, "total_steps": 2001, "loss": 0.5318, "lr": 5e-06, "epoch": 0.17987633501967398, "percentage": 6.0, "elapsed_time": "1:02:44", "remaining_time": "16:23:28"} |
|
{"current_steps": 130, "total_steps": 2001, "loss": 0.5279, "lr": 5e-06, "epoch": 0.1948660296046468, "percentage": 6.5, "elapsed_time": "1:07:59", "remaining_time": "16:18:26"} |
|
{"current_steps": 140, "total_steps": 2001, "loss": 0.5309, "lr": 5e-06, "epoch": 0.20985572418961965, "percentage": 7.0, "elapsed_time": "1:13:14", "remaining_time": "16:13:33"} |
|
{"current_steps": 150, "total_steps": 2001, "loss": 0.5207, "lr": 5e-06, "epoch": 0.22484541877459246, "percentage": 7.5, "elapsed_time": "1:18:27", "remaining_time": "16:08:06"} |
|
{"current_steps": 160, "total_steps": 2001, "loss": 0.5203, "lr": 5e-06, "epoch": 0.2398351133595653, "percentage": 8.0, "elapsed_time": "1:23:41", "remaining_time": "16:02:54"} |
|
{"current_steps": 170, "total_steps": 2001, "loss": 0.5179, "lr": 5e-06, "epoch": 0.25482480794453816, "percentage": 8.5, "elapsed_time": "1:28:54", "remaining_time": "15:57:40"} |
|
{"current_steps": 180, "total_steps": 2001, "loss": 0.5134, "lr": 5e-06, "epoch": 0.26981450252951095, "percentage": 9.0, "elapsed_time": "1:34:09", "remaining_time": "15:52:31"} |
|
{"current_steps": 190, "total_steps": 2001, "loss": 0.5124, "lr": 5e-06, "epoch": 0.2848041971144838, "percentage": 9.5, "elapsed_time": "1:39:23", "remaining_time": "15:47:19"} |
|
{"current_steps": 200, "total_steps": 2001, "loss": 0.508, "lr": 5e-06, "epoch": 0.29979389169945664, "percentage": 10.0, "elapsed_time": "1:44:38", "remaining_time": "15:42:20"} |
|
{"current_steps": 210, "total_steps": 2001, "loss": 0.5032, "lr": 5e-06, "epoch": 0.31478358628442943, "percentage": 10.49, "elapsed_time": "1:49:51", "remaining_time": "15:36:55"} |
|
{"current_steps": 220, "total_steps": 2001, "loss": 0.5051, "lr": 5e-06, "epoch": 0.3297732808694023, "percentage": 10.99, "elapsed_time": "1:55:02", "remaining_time": "15:31:22"} |
|
{"current_steps": 230, "total_steps": 2001, "loss": 0.5036, "lr": 5e-06, "epoch": 0.3447629754543751, "percentage": 11.49, "elapsed_time": "2:00:17", "remaining_time": "15:26:16"} |
|
{"current_steps": 240, "total_steps": 2001, "loss": 0.5041, "lr": 5e-06, "epoch": 0.35975267003934797, "percentage": 11.99, "elapsed_time": "2:05:34", "remaining_time": "15:21:24"} |
|
{"current_steps": 250, "total_steps": 2001, "loss": 0.5001, "lr": 5e-06, "epoch": 0.37474236462432076, "percentage": 12.49, "elapsed_time": "2:10:50", "remaining_time": "15:16:28"} |
|
{"current_steps": 260, "total_steps": 2001, "loss": 0.5015, "lr": 5e-06, "epoch": 0.3897320592092936, "percentage": 12.99, "elapsed_time": "2:16:04", "remaining_time": "15:11:12"} |
|
{"current_steps": 270, "total_steps": 2001, "loss": 0.4958, "lr": 5e-06, "epoch": 0.40472175379426645, "percentage": 13.49, "elapsed_time": "2:21:20", "remaining_time": "15:06:08"} |
|
{"current_steps": 280, "total_steps": 2001, "loss": 0.4996, "lr": 5e-06, "epoch": 0.4197114483792393, "percentage": 13.99, "elapsed_time": "2:26:34", "remaining_time": "15:00:51"} |
|
{"current_steps": 290, "total_steps": 2001, "loss": 0.4929, "lr": 5e-06, "epoch": 0.4347011429642121, "percentage": 14.49, "elapsed_time": "2:31:50", "remaining_time": "14:55:52"} |
|
{"current_steps": 300, "total_steps": 2001, "loss": 0.4897, "lr": 5e-06, "epoch": 0.44969083754918493, "percentage": 14.99, "elapsed_time": "2:37:06", "remaining_time": "14:50:46"} |
|
{"current_steps": 310, "total_steps": 2001, "loss": 0.4927, "lr": 5e-06, "epoch": 0.4646805321341578, "percentage": 15.49, "elapsed_time": "2:42:22", "remaining_time": "14:45:45"} |
|
{"current_steps": 320, "total_steps": 2001, "loss": 0.4892, "lr": 5e-06, "epoch": 0.4796702267191306, "percentage": 15.99, "elapsed_time": "2:47:39", "remaining_time": "14:40:41"} |
|
{"current_steps": 330, "total_steps": 2001, "loss": 0.4889, "lr": 5e-06, "epoch": 0.4946599213041034, "percentage": 16.49, "elapsed_time": "2:52:53", "remaining_time": "14:35:26"} |
|
{"current_steps": 340, "total_steps": 2001, "loss": 0.4872, "lr": 5e-06, "epoch": 0.5096496158890763, "percentage": 16.99, "elapsed_time": "2:58:06", "remaining_time": "14:30:08"} |
|
{"current_steps": 350, "total_steps": 2001, "loss": 0.4839, "lr": 5e-06, "epoch": 0.5246393104740491, "percentage": 17.49, "elapsed_time": "3:03:21", "remaining_time": "14:24:57"} |
|
{"current_steps": 360, "total_steps": 2001, "loss": 0.4886, "lr": 5e-06, "epoch": 0.5396290050590219, "percentage": 17.99, "elapsed_time": "3:08:37", "remaining_time": "14:19:47"} |
|
{"current_steps": 370, "total_steps": 2001, "loss": 0.4837, "lr": 5e-06, "epoch": 0.5546186996439948, "percentage": 18.49, "elapsed_time": "3:13:52", "remaining_time": "14:14:38"} |
|
{"current_steps": 380, "total_steps": 2001, "loss": 0.4822, "lr": 5e-06, "epoch": 0.5696083942289676, "percentage": 18.99, "elapsed_time": "3:19:07", "remaining_time": "14:09:25"} |
|
{"current_steps": 390, "total_steps": 2001, "loss": 0.4798, "lr": 5e-06, "epoch": 0.5845980888139404, "percentage": 19.49, "elapsed_time": "3:24:20", "remaining_time": "14:04:04"} |
|
{"current_steps": 400, "total_steps": 2001, "loss": 0.4831, "lr": 5e-06, "epoch": 0.5995877833989133, "percentage": 19.99, "elapsed_time": "3:29:33", "remaining_time": "13:58:44"} |
|
{"current_steps": 410, "total_steps": 2001, "loss": 0.4803, "lr": 5e-06, "epoch": 0.6145774779838861, "percentage": 20.49, "elapsed_time": "3:34:48", "remaining_time": "13:53:35"} |
|
{"current_steps": 420, "total_steps": 2001, "loss": 0.4759, "lr": 5e-06, "epoch": 0.6295671725688589, "percentage": 20.99, "elapsed_time": "3:40:06", "remaining_time": "13:48:32"} |
|
{"current_steps": 430, "total_steps": 2001, "loss": 0.4759, "lr": 5e-06, "epoch": 0.6445568671538318, "percentage": 21.49, "elapsed_time": "3:45:22", "remaining_time": "13:43:25"} |
|
{"current_steps": 440, "total_steps": 2001, "loss": 0.4731, "lr": 5e-06, "epoch": 0.6595465617388045, "percentage": 21.99, "elapsed_time": "3:50:37", "remaining_time": "13:38:13"} |
|
{"current_steps": 450, "total_steps": 2001, "loss": 0.4748, "lr": 5e-06, "epoch": 0.6745362563237775, "percentage": 22.49, "elapsed_time": "3:55:53", "remaining_time": "13:33:03"} |
|
{"current_steps": 460, "total_steps": 2001, "loss": 0.4692, "lr": 5e-06, "epoch": 0.6895259509087502, "percentage": 22.99, "elapsed_time": "4:01:08", "remaining_time": "13:27:48"} |
|
{"current_steps": 470, "total_steps": 2001, "loss": 0.469, "lr": 5e-06, "epoch": 0.704515645493723, "percentage": 23.49, "elapsed_time": "4:06:21", "remaining_time": "13:22:28"} |
|
{"current_steps": 480, "total_steps": 2001, "loss": 0.4742, "lr": 5e-06, "epoch": 0.7195053400786959, "percentage": 23.99, "elapsed_time": "4:11:37", "remaining_time": "13:17:19"} |
|
{"current_steps": 490, "total_steps": 2001, "loss": 0.4734, "lr": 5e-06, "epoch": 0.7344950346636687, "percentage": 24.49, "elapsed_time": "4:16:51", "remaining_time": "13:12:03"} |
|
{"current_steps": 500, "total_steps": 2001, "loss": 0.4693, "lr": 5e-06, "epoch": 0.7494847292486415, "percentage": 24.99, "elapsed_time": "4:22:04", "remaining_time": "13:06:44"} |
|
{"current_steps": 510, "total_steps": 2001, "loss": 0.4734, "lr": 5e-06, "epoch": 0.7644744238336144, "percentage": 25.49, "elapsed_time": "4:27:18", "remaining_time": "13:01:28"} |
|
{"current_steps": 520, "total_steps": 2001, "loss": 0.4663, "lr": 5e-06, "epoch": 0.7794641184185872, "percentage": 25.99, "elapsed_time": "4:32:32", "remaining_time": "12:56:14"} |
|
{"current_steps": 530, "total_steps": 2001, "loss": 0.4645, "lr": 5e-06, "epoch": 0.7944538130035601, "percentage": 26.49, "elapsed_time": "4:37:48", "remaining_time": "12:51:02"} |
|
{"current_steps": 540, "total_steps": 2001, "loss": 0.4647, "lr": 5e-06, "epoch": 0.8094435075885329, "percentage": 26.99, "elapsed_time": "4:43:03", "remaining_time": "12:45:50"} |
|
{"current_steps": 550, "total_steps": 2001, "loss": 0.4707, "lr": 5e-06, "epoch": 0.8244332021735057, "percentage": 27.49, "elapsed_time": "4:48:19", "remaining_time": "12:40:39"} |
|
{"current_steps": 560, "total_steps": 2001, "loss": 0.4674, "lr": 5e-06, "epoch": 0.8394228967584786, "percentage": 27.99, "elapsed_time": "4:53:34", "remaining_time": "12:35:25"} |
|
{"current_steps": 570, "total_steps": 2001, "loss": 0.4678, "lr": 5e-06, "epoch": 0.8544125913434514, "percentage": 28.49, "elapsed_time": "4:58:49", "remaining_time": "12:30:12"} |
|
{"current_steps": 580, "total_steps": 2001, "loss": 0.4614, "lr": 5e-06, "epoch": 0.8694022859284242, "percentage": 28.99, "elapsed_time": "5:04:04", "remaining_time": "12:24:59"} |
|
{"current_steps": 590, "total_steps": 2001, "loss": 0.4634, "lr": 5e-06, "epoch": 0.8843919805133971, "percentage": 29.49, "elapsed_time": "5:09:20", "remaining_time": "12:19:48"} |
|
{"current_steps": 600, "total_steps": 2001, "loss": 0.4649, "lr": 5e-06, "epoch": 0.8993816750983699, "percentage": 29.99, "elapsed_time": "5:14:34", "remaining_time": "12:14:33"} |
|
{"current_steps": 610, "total_steps": 2001, "loss": 0.4638, "lr": 5e-06, "epoch": 0.9143713696833426, "percentage": 30.48, "elapsed_time": "5:19:50", "remaining_time": "12:09:21"} |
|
{"current_steps": 620, "total_steps": 2001, "loss": 0.4639, "lr": 5e-06, "epoch": 0.9293610642683156, "percentage": 30.98, "elapsed_time": "5:25:07", "remaining_time": "12:04:11"} |
|
{"current_steps": 630, "total_steps": 2001, "loss": 0.4656, "lr": 5e-06, "epoch": 0.9443507588532883, "percentage": 31.48, "elapsed_time": "5:30:22", "remaining_time": "11:58:57"} |
|
{"current_steps": 640, "total_steps": 2001, "loss": 0.4592, "lr": 5e-06, "epoch": 0.9593404534382612, "percentage": 31.98, "elapsed_time": "5:35:37", "remaining_time": "11:53:44"} |
|
{"current_steps": 650, "total_steps": 2001, "loss": 0.4632, "lr": 5e-06, "epoch": 0.974330148023234, "percentage": 32.48, "elapsed_time": "5:40:53", "remaining_time": "11:48:31"} |
|
{"current_steps": 660, "total_steps": 2001, "loss": 0.4596, "lr": 5e-06, "epoch": 0.9893198426082068, "percentage": 32.98, "elapsed_time": "5:46:07", "remaining_time": "11:43:16"} |
|
{"current_steps": 667, "total_steps": 2001, "eval_loss": 0.05758751183748245, "epoch": 0.9998126288176878, "percentage": 33.33, "elapsed_time": "5:57:26", "remaining_time": "11:54:53"} |
|
{"current_steps": 670, "total_steps": 2001, "loss": 0.4348, "lr": 5e-06, "epoch": 1.0043095371931796, "percentage": 33.48, "elapsed_time": "6:00:02", "remaining_time": "11:55:14"} |
|
{"current_steps": 680, "total_steps": 2001, "loss": 0.364, "lr": 5e-06, "epoch": 1.0192992317781526, "percentage": 33.98, "elapsed_time": "6:05:16", "remaining_time": "11:49:35"} |
|
{"current_steps": 690, "total_steps": 2001, "loss": 0.3558, "lr": 5e-06, "epoch": 1.0342889263631254, "percentage": 34.48, "elapsed_time": "6:10:30", "remaining_time": "11:43:58"} |
|
{"current_steps": 700, "total_steps": 2001, "loss": 0.355, "lr": 5e-06, "epoch": 1.0492786209480982, "percentage": 34.98, "elapsed_time": "6:15:47", "remaining_time": "11:38:25"} |
|
{"current_steps": 710, "total_steps": 2001, "loss": 0.3519, "lr": 5e-06, "epoch": 1.064268315533071, "percentage": 35.48, "elapsed_time": "6:21:01", "remaining_time": "11:32:49"} |
|
{"current_steps": 720, "total_steps": 2001, "loss": 0.3545, "lr": 5e-06, "epoch": 1.0792580101180438, "percentage": 35.98, "elapsed_time": "6:26:17", "remaining_time": "11:27:17"} |
|
{"current_steps": 730, "total_steps": 2001, "loss": 0.3583, "lr": 5e-06, "epoch": 1.0942477047030166, "percentage": 36.48, "elapsed_time": "6:31:33", "remaining_time": "11:21:43"} |
|
{"current_steps": 740, "total_steps": 2001, "loss": 0.3558, "lr": 5e-06, "epoch": 1.1092373992879896, "percentage": 36.98, "elapsed_time": "6:36:49", "remaining_time": "11:16:12"} |
|
{"current_steps": 750, "total_steps": 2001, "loss": 0.3563, "lr": 5e-06, "epoch": 1.1242270938729624, "percentage": 37.48, "elapsed_time": "6:42:04", "remaining_time": "11:10:40"} |
|
{"current_steps": 760, "total_steps": 2001, "loss": 0.358, "lr": 5e-06, "epoch": 1.1392167884579352, "percentage": 37.98, "elapsed_time": "6:47:18", "remaining_time": "11:05:05"} |
|
{"current_steps": 770, "total_steps": 2001, "loss": 0.3574, "lr": 5e-06, "epoch": 1.154206483042908, "percentage": 38.48, "elapsed_time": "6:52:31", "remaining_time": "10:59:30"} |
|
{"current_steps": 780, "total_steps": 2001, "loss": 0.3584, "lr": 5e-06, "epoch": 1.1691961776278808, "percentage": 38.98, "elapsed_time": "6:57:47", "remaining_time": "10:53:59"} |
|
{"current_steps": 790, "total_steps": 2001, "loss": 0.3564, "lr": 5e-06, "epoch": 1.1841858722128538, "percentage": 39.48, "elapsed_time": "7:03:01", "remaining_time": "10:48:27"} |
|
{"current_steps": 800, "total_steps": 2001, "loss": 0.3527, "lr": 5e-06, "epoch": 1.1991755667978266, "percentage": 39.98, "elapsed_time": "7:08:16", "remaining_time": "10:42:56"} |
|
{"current_steps": 810, "total_steps": 2001, "loss": 0.3566, "lr": 5e-06, "epoch": 1.2141652613827993, "percentage": 40.48, "elapsed_time": "7:13:31", "remaining_time": "10:37:26"} |
|
{"current_steps": 820, "total_steps": 2001, "loss": 0.3601, "lr": 5e-06, "epoch": 1.2291549559677721, "percentage": 40.98, "elapsed_time": "7:18:44", "remaining_time": "10:31:53"} |
|
{"current_steps": 830, "total_steps": 2001, "loss": 0.3583, "lr": 5e-06, "epoch": 1.244144650552745, "percentage": 41.48, "elapsed_time": "7:23:57", "remaining_time": "10:26:20"} |
|
{"current_steps": 840, "total_steps": 2001, "loss": 0.3542, "lr": 5e-06, "epoch": 1.259134345137718, "percentage": 41.98, "elapsed_time": "7:29:11", "remaining_time": "10:20:51"} |
|
{"current_steps": 850, "total_steps": 2001, "loss": 0.3575, "lr": 5e-06, "epoch": 1.2741240397226907, "percentage": 42.48, "elapsed_time": "7:34:27", "remaining_time": "10:15:23"} |
|
{"current_steps": 860, "total_steps": 2001, "loss": 0.3586, "lr": 5e-06, "epoch": 1.2891137343076635, "percentage": 42.98, "elapsed_time": "7:39:44", "remaining_time": "10:09:57"} |
|
{"current_steps": 870, "total_steps": 2001, "loss": 0.3622, "lr": 5e-06, "epoch": 1.3041034288926363, "percentage": 43.48, "elapsed_time": "7:45:00", "remaining_time": "10:04:30"} |
|
{"current_steps": 880, "total_steps": 2001, "loss": 0.3588, "lr": 5e-06, "epoch": 1.319093123477609, "percentage": 43.98, "elapsed_time": "7:50:17", "remaining_time": "9:59:04"} |
|
{"current_steps": 890, "total_steps": 2001, "loss": 0.3634, "lr": 5e-06, "epoch": 1.334082818062582, "percentage": 44.48, "elapsed_time": "7:55:32", "remaining_time": "9:53:37"} |
|
{"current_steps": 900, "total_steps": 2001, "loss": 0.3539, "lr": 5e-06, "epoch": 1.3490725126475547, "percentage": 44.98, "elapsed_time": "8:00:44", "remaining_time": "9:48:06"} |
|
{"current_steps": 910, "total_steps": 2001, "loss": 0.3632, "lr": 5e-06, "epoch": 1.3640622072325277, "percentage": 45.48, "elapsed_time": "8:06:00", "remaining_time": "9:42:40"} |
|
{"current_steps": 920, "total_steps": 2001, "loss": 0.3625, "lr": 5e-06, "epoch": 1.3790519018175005, "percentage": 45.98, "elapsed_time": "8:11:16", "remaining_time": "9:37:15"} |
|
{"current_steps": 930, "total_steps": 2001, "loss": 0.3595, "lr": 5e-06, "epoch": 1.3940415964024733, "percentage": 46.48, "elapsed_time": "8:16:32", "remaining_time": "9:31:49"} |
|
{"current_steps": 940, "total_steps": 2001, "loss": 0.3597, "lr": 5e-06, "epoch": 1.409031290987446, "percentage": 46.98, "elapsed_time": "8:21:50", "remaining_time": "9:26:26"} |
|
{"current_steps": 950, "total_steps": 2001, "loss": 0.3611, "lr": 5e-06, "epoch": 1.4240209855724189, "percentage": 47.48, "elapsed_time": "8:27:07", "remaining_time": "9:21:02"} |
|
{"current_steps": 960, "total_steps": 2001, "loss": 0.3603, "lr": 5e-06, "epoch": 1.4390106801573919, "percentage": 47.98, "elapsed_time": "8:32:25", "remaining_time": "9:15:39"} |
|
{"current_steps": 970, "total_steps": 2001, "loss": 0.3631, "lr": 5e-06, "epoch": 1.4540003747423647, "percentage": 48.48, "elapsed_time": "8:37:42", "remaining_time": "9:10:15"} |
|
{"current_steps": 980, "total_steps": 2001, "loss": 0.3609, "lr": 5e-06, "epoch": 1.4689900693273374, "percentage": 48.98, "elapsed_time": "8:42:59", "remaining_time": "9:04:51"} |
|
{"current_steps": 990, "total_steps": 2001, "loss": 0.3625, "lr": 5e-06, "epoch": 1.4839797639123102, "percentage": 49.48, "elapsed_time": "8:48:15", "remaining_time": "8:59:27"} |
|
{"current_steps": 1000, "total_steps": 2001, "loss": 0.3618, "lr": 5e-06, "epoch": 1.498969458497283, "percentage": 49.98, "elapsed_time": "8:53:32", "remaining_time": "8:54:04"} |
|
{"current_steps": 1010, "total_steps": 2001, "loss": 0.3612, "lr": 5e-06, "epoch": 1.513959153082256, "percentage": 50.47, "elapsed_time": "8:58:48", "remaining_time": "8:48:40"} |
|
{"current_steps": 1020, "total_steps": 2001, "loss": 0.3628, "lr": 5e-06, "epoch": 1.5289488476672288, "percentage": 50.97, "elapsed_time": "9:04:05", "remaining_time": "8:43:17"} |
|
{"current_steps": 1030, "total_steps": 2001, "loss": 0.3626, "lr": 5e-06, "epoch": 1.5439385422522016, "percentage": 51.47, "elapsed_time": "9:09:21", "remaining_time": "8:37:53"} |
|
{"current_steps": 1040, "total_steps": 2001, "loss": 0.3618, "lr": 5e-06, "epoch": 1.5589282368371744, "percentage": 51.97, "elapsed_time": "9:14:37", "remaining_time": "8:32:29"} |
|
{"current_steps": 1050, "total_steps": 2001, "loss": 0.3615, "lr": 5e-06, "epoch": 1.5739179314221472, "percentage": 52.47, "elapsed_time": "9:19:52", "remaining_time": "8:27:05"} |
|
{"current_steps": 1060, "total_steps": 2001, "loss": 0.3618, "lr": 5e-06, "epoch": 1.5889076260071202, "percentage": 52.97, "elapsed_time": "9:25:08", "remaining_time": "8:21:41"} |
|
{"current_steps": 1070, "total_steps": 2001, "loss": 0.365, "lr": 5e-06, "epoch": 1.6038973205920928, "percentage": 53.47, "elapsed_time": "9:30:26", "remaining_time": "8:16:19"} |
|
{"current_steps": 1080, "total_steps": 2001, "loss": 0.3632, "lr": 5e-06, "epoch": 1.6188870151770658, "percentage": 53.97, "elapsed_time": "9:35:43", "remaining_time": "8:10:57"} |
|
{"current_steps": 1090, "total_steps": 2001, "loss": 0.3643, "lr": 5e-06, "epoch": 1.6338767097620386, "percentage": 54.47, "elapsed_time": "9:40:59", "remaining_time": "8:05:35"} |
|
{"current_steps": 1100, "total_steps": 2001, "loss": 0.3649, "lr": 5e-06, "epoch": 1.6488664043470114, "percentage": 54.97, "elapsed_time": "9:46:16", "remaining_time": "8:00:12"} |
|
{"current_steps": 1110, "total_steps": 2001, "loss": 0.3612, "lr": 5e-06, "epoch": 1.6638560989319844, "percentage": 55.47, "elapsed_time": "9:51:31", "remaining_time": "7:54:49"} |
|
{"current_steps": 1120, "total_steps": 2001, "loss": 0.3614, "lr": 5e-06, "epoch": 1.678845793516957, "percentage": 55.97, "elapsed_time": "9:56:48", "remaining_time": "7:49:27"} |
|
{"current_steps": 1130, "total_steps": 2001, "loss": 0.3601, "lr": 5e-06, "epoch": 1.69383548810193, "percentage": 56.47, "elapsed_time": "10:02:04", "remaining_time": "7:44:04"} |
|
{"current_steps": 1140, "total_steps": 2001, "loss": 0.3627, "lr": 5e-06, "epoch": 1.7088251826869028, "percentage": 56.97, "elapsed_time": "10:07:21", "remaining_time": "7:38:42"} |
|
{"current_steps": 1150, "total_steps": 2001, "loss": 0.3609, "lr": 5e-06, "epoch": 1.7238148772718755, "percentage": 57.47, "elapsed_time": "10:12:38", "remaining_time": "7:33:20"} |
|
{"current_steps": 1160, "total_steps": 2001, "loss": 0.3601, "lr": 5e-06, "epoch": 1.7388045718568486, "percentage": 57.97, "elapsed_time": "10:17:54", "remaining_time": "7:27:58"} |
|
{"current_steps": 1170, "total_steps": 2001, "loss": 0.3596, "lr": 5e-06, "epoch": 1.7537942664418211, "percentage": 58.47, "elapsed_time": "10:23:10", "remaining_time": "7:22:36"} |
|
{"current_steps": 1180, "total_steps": 2001, "loss": 0.3614, "lr": 5e-06, "epoch": 1.7687839610267941, "percentage": 58.97, "elapsed_time": "10:28:27", "remaining_time": "7:17:15"} |
|
{"current_steps": 1190, "total_steps": 2001, "loss": 0.3629, "lr": 5e-06, "epoch": 1.783773655611767, "percentage": 59.47, "elapsed_time": "10:33:42", "remaining_time": "7:11:52"} |
|
{"current_steps": 1200, "total_steps": 2001, "loss": 0.364, "lr": 5e-06, "epoch": 1.7987633501967397, "percentage": 59.97, "elapsed_time": "10:38:58", "remaining_time": "7:06:30"} |
|
{"current_steps": 1210, "total_steps": 2001, "loss": 0.3623, "lr": 5e-06, "epoch": 1.8137530447817127, "percentage": 60.47, "elapsed_time": "10:44:15", "remaining_time": "7:01:09"} |
|
{"current_steps": 1220, "total_steps": 2001, "loss": 0.3629, "lr": 5e-06, "epoch": 1.8287427393666853, "percentage": 60.97, "elapsed_time": "10:49:30", "remaining_time": "6:55:47"} |
|
{"current_steps": 1230, "total_steps": 2001, "loss": 0.3639, "lr": 5e-06, "epoch": 1.8437324339516583, "percentage": 61.47, "elapsed_time": "10:54:46", "remaining_time": "6:50:26"} |
|
{"current_steps": 1240, "total_steps": 2001, "loss": 0.3614, "lr": 5e-06, "epoch": 1.858722128536631, "percentage": 61.97, "elapsed_time": "11:00:03", "remaining_time": "6:45:05"} |
|
{"current_steps": 1250, "total_steps": 2001, "loss": 0.3628, "lr": 5e-06, "epoch": 1.873711823121604, "percentage": 62.47, "elapsed_time": "11:05:19", "remaining_time": "6:39:43"} |
|
{"current_steps": 1260, "total_steps": 2001, "loss": 0.3624, "lr": 5e-06, "epoch": 1.8887015177065767, "percentage": 62.97, "elapsed_time": "11:10:34", "remaining_time": "6:34:21"} |
|
{"current_steps": 1270, "total_steps": 2001, "loss": 0.362, "lr": 5e-06, "epoch": 1.9036912122915495, "percentage": 63.47, "elapsed_time": "11:15:50", "remaining_time": "6:29:00"} |
|
{"current_steps": 1280, "total_steps": 2001, "loss": 0.363, "lr": 5e-06, "epoch": 1.9186809068765225, "percentage": 63.97, "elapsed_time": "11:21:06", "remaining_time": "6:23:39"} |
|
{"current_steps": 1290, "total_steps": 2001, "loss": 0.3587, "lr": 5e-06, "epoch": 1.9336706014614953, "percentage": 64.47, "elapsed_time": "11:26:21", "remaining_time": "6:18:17"} |
|
{"current_steps": 1300, "total_steps": 2001, "loss": 0.3608, "lr": 5e-06, "epoch": 1.948660296046468, "percentage": 64.97, "elapsed_time": "11:31:37", "remaining_time": "6:12:56"} |
|
{"current_steps": 1310, "total_steps": 2001, "loss": 0.3621, "lr": 5e-06, "epoch": 1.9636499906314409, "percentage": 65.47, "elapsed_time": "11:36:52", "remaining_time": "6:07:35"} |
|
{"current_steps": 1320, "total_steps": 2001, "loss": 0.3632, "lr": 5e-06, "epoch": 1.9786396852164136, "percentage": 65.97, "elapsed_time": "11:42:08", "remaining_time": "6:02:14"} |
|
{"current_steps": 1330, "total_steps": 2001, "loss": 0.3617, "lr": 5e-06, "epoch": 1.9936293798013867, "percentage": 66.47, "elapsed_time": "11:47:24", "remaining_time": "5:56:53"} |
|
{"current_steps": 1334, "total_steps": 2001, "eval_loss": 0.056735917925834656, "epoch": 1.9996252576353757, "percentage": 66.67, "elapsed_time": "11:57:08", "remaining_time": "5:58:34"} |
|
{"current_steps": 1340, "total_steps": 2001, "loss": 0.3009, "lr": 5e-06, "epoch": 2.0086190743863592, "percentage": 66.97, "elapsed_time": "12:01:19", "remaining_time": "5:55:49"} |
|
{"current_steps": 1350, "total_steps": 2001, "loss": 0.2445, "lr": 5e-06, "epoch": 2.0236087689713322, "percentage": 67.47, "elapsed_time": "12:06:34", "remaining_time": "5:50:22"} |
|
{"current_steps": 1360, "total_steps": 2001, "loss": 0.2404, "lr": 5e-06, "epoch": 2.0385984635563053, "percentage": 67.97, "elapsed_time": "12:11:49", "remaining_time": "5:44:55"} |
|
{"current_steps": 1370, "total_steps": 2001, "loss": 0.2396, "lr": 5e-06, "epoch": 2.053588158141278, "percentage": 68.47, "elapsed_time": "12:17:05", "remaining_time": "5:39:29"} |
|
{"current_steps": 1380, "total_steps": 2001, "loss": 0.2399, "lr": 5e-06, "epoch": 2.068577852726251, "percentage": 68.97, "elapsed_time": "12:22:19", "remaining_time": "5:34:02"} |
|
{"current_steps": 1390, "total_steps": 2001, "loss": 0.2398, "lr": 5e-06, "epoch": 2.0835675473112234, "percentage": 69.47, "elapsed_time": "12:27:34", "remaining_time": "5:28:36"} |
|
{"current_steps": 1400, "total_steps": 2001, "loss": 0.2404, "lr": 5e-06, "epoch": 2.0985572418961964, "percentage": 69.97, "elapsed_time": "12:32:47", "remaining_time": "5:23:09"} |
|
{"current_steps": 1410, "total_steps": 2001, "loss": 0.2406, "lr": 5e-06, "epoch": 2.1135469364811694, "percentage": 70.46, "elapsed_time": "12:38:01", "remaining_time": "5:17:43"} |
|
{"current_steps": 1420, "total_steps": 2001, "loss": 0.2445, "lr": 5e-06, "epoch": 2.128536631066142, "percentage": 70.96, "elapsed_time": "12:43:16", "remaining_time": "5:12:17"} |
|
{"current_steps": 1430, "total_steps": 2001, "loss": 0.2428, "lr": 5e-06, "epoch": 2.143526325651115, "percentage": 71.46, "elapsed_time": "12:48:32", "remaining_time": "5:06:52"} |
|
{"current_steps": 1440, "total_steps": 2001, "loss": 0.2443, "lr": 5e-06, "epoch": 2.1585160202360876, "percentage": 71.96, "elapsed_time": "12:53:48", "remaining_time": "5:01:27"} |
|
{"current_steps": 1450, "total_steps": 2001, "loss": 0.2431, "lr": 5e-06, "epoch": 2.1735057148210606, "percentage": 72.46, "elapsed_time": "12:59:05", "remaining_time": "4:56:03"} |
|
{"current_steps": 1460, "total_steps": 2001, "loss": 0.2448, "lr": 5e-06, "epoch": 2.188495409406033, "percentage": 72.96, "elapsed_time": "13:04:18", "remaining_time": "4:50:37"} |
|
{"current_steps": 1470, "total_steps": 2001, "loss": 0.247, "lr": 5e-06, "epoch": 2.203485103991006, "percentage": 73.46, "elapsed_time": "13:09:32", "remaining_time": "4:45:12"} |
|
{"current_steps": 1480, "total_steps": 2001, "loss": 0.2491, "lr": 5e-06, "epoch": 2.218474798575979, "percentage": 73.96, "elapsed_time": "13:14:46", "remaining_time": "4:39:46"} |
|
{"current_steps": 1490, "total_steps": 2001, "loss": 0.2485, "lr": 5e-06, "epoch": 2.2334644931609517, "percentage": 74.46, "elapsed_time": "13:20:02", "remaining_time": "4:34:22"} |
|
{"current_steps": 1500, "total_steps": 2001, "loss": 0.2463, "lr": 5e-06, "epoch": 2.2484541877459248, "percentage": 74.96, "elapsed_time": "13:25:16", "remaining_time": "4:28:57"} |
|
{"current_steps": 1510, "total_steps": 2001, "loss": 0.2486, "lr": 5e-06, "epoch": 2.2634438823308973, "percentage": 75.46, "elapsed_time": "13:30:31", "remaining_time": "4:23:33"} |
|
{"current_steps": 1520, "total_steps": 2001, "loss": 0.2497, "lr": 5e-06, "epoch": 2.2784335769158703, "percentage": 75.96, "elapsed_time": "13:35:45", "remaining_time": "4:18:08"} |
|
{"current_steps": 1530, "total_steps": 2001, "loss": 0.2492, "lr": 5e-06, "epoch": 2.2934232715008434, "percentage": 76.46, "elapsed_time": "13:41:00", "remaining_time": "4:12:44"} |
|
{"current_steps": 1540, "total_steps": 2001, "loss": 0.2503, "lr": 5e-06, "epoch": 2.308412966085816, "percentage": 76.96, "elapsed_time": "13:46:18", "remaining_time": "4:07:21"} |
|
{"current_steps": 1550, "total_steps": 2001, "loss": 0.2505, "lr": 5e-06, "epoch": 2.323402660670789, "percentage": 77.46, "elapsed_time": "13:51:34", "remaining_time": "4:01:57"} |
|
{"current_steps": 1560, "total_steps": 2001, "loss": 0.2518, "lr": 5e-06, "epoch": 2.3383923552557615, "percentage": 77.96, "elapsed_time": "13:56:51", "remaining_time": "3:56:34"} |
|
{"current_steps": 1570, "total_steps": 2001, "loss": 0.2504, "lr": 5e-06, "epoch": 2.3533820498407345, "percentage": 78.46, "elapsed_time": "14:02:06", "remaining_time": "3:51:10"} |
|
{"current_steps": 1580, "total_steps": 2001, "loss": 0.2511, "lr": 5e-06, "epoch": 2.3683717444257075, "percentage": 78.96, "elapsed_time": "14:07:23", "remaining_time": "3:45:47"} |
|
{"current_steps": 1590, "total_steps": 2001, "loss": 0.2517, "lr": 5e-06, "epoch": 2.38336143901068, "percentage": 79.46, "elapsed_time": "14:12:38", "remaining_time": "3:40:24"} |
|
{"current_steps": 1600, "total_steps": 2001, "loss": 0.2519, "lr": 5e-06, "epoch": 2.398351133595653, "percentage": 79.96, "elapsed_time": "14:17:53", "remaining_time": "3:35:00"} |
|
{"current_steps": 1610, "total_steps": 2001, "loss": 0.2537, "lr": 5e-06, "epoch": 2.4133408281806257, "percentage": 80.46, "elapsed_time": "14:23:10", "remaining_time": "3:29:37"} |
|
{"current_steps": 1620, "total_steps": 2001, "loss": 0.2525, "lr": 5e-06, "epoch": 2.4283305227655987, "percentage": 80.96, "elapsed_time": "14:28:23", "remaining_time": "3:24:13"} |
|
{"current_steps": 1630, "total_steps": 2001, "loss": 0.2519, "lr": 5e-06, "epoch": 2.4433202173505713, "percentage": 81.46, "elapsed_time": "14:33:39", "remaining_time": "3:18:51"} |
|
{"current_steps": 1640, "total_steps": 2001, "loss": 0.2542, "lr": 5e-06, "epoch": 2.4583099119355443, "percentage": 81.96, "elapsed_time": "14:38:55", "remaining_time": "3:13:28"} |
|
{"current_steps": 1650, "total_steps": 2001, "loss": 0.2523, "lr": 5e-06, "epoch": 2.4732996065205173, "percentage": 82.46, "elapsed_time": "14:44:11", "remaining_time": "3:08:05"} |
|
{"current_steps": 1660, "total_steps": 2001, "loss": 0.2525, "lr": 5e-06, "epoch": 2.48828930110549, "percentage": 82.96, "elapsed_time": "14:49:27", "remaining_time": "3:02:42"} |
|
{"current_steps": 1670, "total_steps": 2001, "loss": 0.2512, "lr": 5e-06, "epoch": 2.503278995690463, "percentage": 83.46, "elapsed_time": "14:54:43", "remaining_time": "2:57:20"} |
|
{"current_steps": 1680, "total_steps": 2001, "loss": 0.2543, "lr": 5e-06, "epoch": 2.518268690275436, "percentage": 83.96, "elapsed_time": "14:59:59", "remaining_time": "2:51:57"} |
|
{"current_steps": 1690, "total_steps": 2001, "loss": 0.2542, "lr": 5e-06, "epoch": 2.5332583848604084, "percentage": 84.46, "elapsed_time": "15:05:15", "remaining_time": "2:46:35"} |
|
{"current_steps": 1700, "total_steps": 2001, "loss": 0.2543, "lr": 5e-06, "epoch": 2.5482480794453815, "percentage": 84.96, "elapsed_time": "15:10:30", "remaining_time": "2:41:12"} |
|
{"current_steps": 1710, "total_steps": 2001, "loss": 0.2547, "lr": 5e-06, "epoch": 2.563237774030354, "percentage": 85.46, "elapsed_time": "15:15:45", "remaining_time": "2:35:50"} |
|
{"current_steps": 1720, "total_steps": 2001, "loss": 0.2577, "lr": 5e-06, "epoch": 2.578227468615327, "percentage": 85.96, "elapsed_time": "15:21:01", "remaining_time": "2:30:28"} |
|
{"current_steps": 1730, "total_steps": 2001, "loss": 0.2585, "lr": 5e-06, "epoch": 2.5932171632002996, "percentage": 86.46, "elapsed_time": "15:26:15", "remaining_time": "2:25:05"} |
|
{"current_steps": 1740, "total_steps": 2001, "loss": 0.2566, "lr": 5e-06, "epoch": 2.6082068577852726, "percentage": 86.96, "elapsed_time": "15:31:32", "remaining_time": "2:19:43"} |
|
{"current_steps": 1750, "total_steps": 2001, "loss": 0.2577, "lr": 5e-06, "epoch": 2.6231965523702456, "percentage": 87.46, "elapsed_time": "15:36:48", "remaining_time": "2:14:21"} |
|
{"current_steps": 1760, "total_steps": 2001, "loss": 0.2584, "lr": 5e-06, "epoch": 2.638186246955218, "percentage": 87.96, "elapsed_time": "15:42:02", "remaining_time": "2:08:59"} |
|
{"current_steps": 1770, "total_steps": 2001, "loss": 0.258, "lr": 5e-06, "epoch": 2.653175941540191, "percentage": 88.46, "elapsed_time": "15:47:17", "remaining_time": "2:03:37"} |
|
{"current_steps": 1780, "total_steps": 2001, "loss": 0.2596, "lr": 5e-06, "epoch": 2.668165636125164, "percentage": 88.96, "elapsed_time": "15:52:31", "remaining_time": "1:58:15"} |
|
{"current_steps": 1790, "total_steps": 2001, "loss": 0.259, "lr": 5e-06, "epoch": 2.683155330710137, "percentage": 89.46, "elapsed_time": "15:57:46", "remaining_time": "1:52:53"} |
|
{"current_steps": 1800, "total_steps": 2001, "loss": 0.2613, "lr": 5e-06, "epoch": 2.6981450252951094, "percentage": 89.96, "elapsed_time": "16:03:02", "remaining_time": "1:47:32"} |
|
{"current_steps": 1810, "total_steps": 2001, "loss": 0.2585, "lr": 5e-06, "epoch": 2.7131347198800824, "percentage": 90.45, "elapsed_time": "16:08:17", "remaining_time": "1:42:10"} |
|
{"current_steps": 1820, "total_steps": 2001, "loss": 0.2597, "lr": 5e-06, "epoch": 2.7281244144650554, "percentage": 90.95, "elapsed_time": "16:13:29", "remaining_time": "1:36:48"} |
|
{"current_steps": 1830, "total_steps": 2001, "loss": 0.2571, "lr": 5e-06, "epoch": 2.743114109050028, "percentage": 91.45, "elapsed_time": "16:18:44", "remaining_time": "1:31:27"} |
|
{"current_steps": 1840, "total_steps": 2001, "loss": 0.263, "lr": 5e-06, "epoch": 2.758103803635001, "percentage": 91.95, "elapsed_time": "16:23:56", "remaining_time": "1:26:05"} |
|
{"current_steps": 1850, "total_steps": 2001, "loss": 0.2608, "lr": 5e-06, "epoch": 2.773093498219974, "percentage": 92.45, "elapsed_time": "16:29:11", "remaining_time": "1:20:44"} |
|
{"current_steps": 1860, "total_steps": 2001, "loss": 0.2613, "lr": 5e-06, "epoch": 2.7880831928049465, "percentage": 92.95, "elapsed_time": "16:34:24", "remaining_time": "1:15:22"} |
|
{"current_steps": 1870, "total_steps": 2001, "loss": 0.2611, "lr": 5e-06, "epoch": 2.8030728873899196, "percentage": 93.45, "elapsed_time": "16:39:39", "remaining_time": "1:10:01"} |
|
{"current_steps": 1880, "total_steps": 2001, "loss": 0.2622, "lr": 5e-06, "epoch": 2.818062581974892, "percentage": 93.95, "elapsed_time": "16:44:52", "remaining_time": "1:04:40"} |
|
{"current_steps": 1890, "total_steps": 2001, "loss": 0.2615, "lr": 5e-06, "epoch": 2.833052276559865, "percentage": 94.45, "elapsed_time": "16:50:04", "remaining_time": "0:59:19"} |
|
{"current_steps": 1900, "total_steps": 2001, "loss": 0.263, "lr": 5e-06, "epoch": 2.8480419711448377, "percentage": 94.95, "elapsed_time": "16:55:17", "remaining_time": "0:53:58"} |
|
{"current_steps": 1910, "total_steps": 2001, "loss": 0.2649, "lr": 5e-06, "epoch": 2.8630316657298107, "percentage": 95.45, "elapsed_time": "17:00:29", "remaining_time": "0:48:37"} |
|
{"current_steps": 1920, "total_steps": 2001, "loss": 0.2611, "lr": 5e-06, "epoch": 2.8780213603147837, "percentage": 95.95, "elapsed_time": "17:05:41", "remaining_time": "0:43:16"} |
|
{"current_steps": 1930, "total_steps": 2001, "loss": 0.2626, "lr": 5e-06, "epoch": 2.8930110548997563, "percentage": 96.45, "elapsed_time": "17:10:55", "remaining_time": "0:37:55"} |
|
{"current_steps": 1940, "total_steps": 2001, "loss": 0.2627, "lr": 5e-06, "epoch": 2.9080007494847293, "percentage": 96.95, "elapsed_time": "17:16:12", "remaining_time": "0:32:34"} |
|
{"current_steps": 1950, "total_steps": 2001, "loss": 0.2628, "lr": 5e-06, "epoch": 2.9229904440697023, "percentage": 97.45, "elapsed_time": "17:21:27", "remaining_time": "0:27:14"} |
|
{"current_steps": 1960, "total_steps": 2001, "loss": 0.2627, "lr": 5e-06, "epoch": 2.937980138654675, "percentage": 97.95, "elapsed_time": "17:26:43", "remaining_time": "0:21:53"} |
|
{"current_steps": 1970, "total_steps": 2001, "loss": 0.2646, "lr": 5e-06, "epoch": 2.952969833239648, "percentage": 98.45, "elapsed_time": "17:31:57", "remaining_time": "0:16:33"} |
|
{"current_steps": 1980, "total_steps": 2001, "loss": 0.2637, "lr": 5e-06, "epoch": 2.9679595278246205, "percentage": 98.95, "elapsed_time": "17:37:10", "remaining_time": "0:11:12"} |
|
{"current_steps": 1990, "total_steps": 2001, "loss": 0.2637, "lr": 5e-06, "epoch": 2.9829492224095935, "percentage": 99.45, "elapsed_time": "17:42:22", "remaining_time": "0:05:52"} |
|
{"current_steps": 2000, "total_steps": 2001, "loss": 0.2629, "lr": 5e-06, "epoch": 2.997938916994566, "percentage": 99.95, "elapsed_time": "17:47:34", "remaining_time": "0:00:32"} |
|
{"current_steps": 2001, "total_steps": 2001, "eval_loss": 0.061618607491254807, "epoch": 2.9994378864530633, "percentage": 100.0, "elapsed_time": "17:56:47", "remaining_time": "0:00:00"} |
|
{"current_steps": 2001, "total_steps": 2001, "epoch": 2.9994378864530633, "percentage": 100.0, "elapsed_time": "17:58:13", "remaining_time": "0:00:00"} |
|
|