{"current_steps": 10, "total_steps": 3402, "loss": 0.4452, "learning_rate": 3.883495145631068e-06, "epoch": 0.008818342151675485, "percentage": 0.29, "elapsed_time": "0:01:36", "remaining_time": "9:06:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20, "total_steps": 3402, "loss": 0.3563, "learning_rate": 7.766990291262136e-06, "epoch": 0.01763668430335097, "percentage": 0.59, "elapsed_time": "0:02:56", "remaining_time": "8:17:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 30, "total_steps": 3402, "loss": 0.2954, "learning_rate": 1.1650485436893204e-05, "epoch": 0.026455026455026454, "percentage": 0.88, "elapsed_time": "0:04:16", "remaining_time": "7:59:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 40, "total_steps": 3402, "loss": 0.264, "learning_rate": 1.5533980582524273e-05, "epoch": 0.03527336860670194, "percentage": 1.18, "elapsed_time": "0:05:35", "remaining_time": "7:50:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 50, "total_steps": 3402, "loss": 0.2515, "learning_rate": 1.9417475728155343e-05, "epoch": 0.04409171075837742, "percentage": 1.47, "elapsed_time": "0:06:55", "remaining_time": "7:44:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 60, "total_steps": 3402, "loss": 0.2384, "learning_rate": 2.330097087378641e-05, "epoch": 0.05291005291005291, "percentage": 1.76, "elapsed_time": "0:08:15", "remaining_time": "7:40:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 70, "total_steps": 3402, "loss": 0.2371, "learning_rate": 2.718446601941748e-05, "epoch": 0.06172839506172839, "percentage": 2.06, "elapsed_time": "0:09:35", "remaining_time": "7:36:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 80, "total_steps": 3402, "loss": 0.2316, "learning_rate": 3.1067961165048545e-05, "epoch": 0.07054673721340388, "percentage": 2.35, "elapsed_time": "0:10:55", "remaining_time": "7:33:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 90, "total_steps": 3402, "loss": 0.2243, "learning_rate": 3.4951456310679615e-05, "epoch": 0.07936507936507936, "percentage": 2.65, "elapsed_time": "0:12:14", "remaining_time": "7:30:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 100, "total_steps": 3402, "loss": 0.2216, "learning_rate": 3.8834951456310685e-05, "epoch": 0.08818342151675485, "percentage": 2.94, "elapsed_time": "0:13:34", "remaining_time": "7:28:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 110, "total_steps": 3402, "loss": 0.2181, "learning_rate": 3.9999555645496425e-05, "epoch": 0.09700176366843033, "percentage": 3.23, "elapsed_time": "0:14:54", "remaining_time": "7:26:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 120, "total_steps": 3402, "loss": 0.2123, "learning_rate": 3.999737926280763e-05, "epoch": 0.10582010582010581, "percentage": 3.53, "elapsed_time": "0:16:14", "remaining_time": "7:24:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 130, "total_steps": 3402, "loss": 0.2072, "learning_rate": 3.999338943291723e-05, "epoch": 0.1146384479717813, "percentage": 3.82, "elapsed_time": "0:17:33", "remaining_time": "7:22:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 140, "total_steps": 3402, "loss": 0.2046, "learning_rate": 3.998758651763991e-05, "epoch": 0.12345679012345678, "percentage": 4.12, "elapsed_time": "0:18:53", "remaining_time": "7:20:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 150, "total_steps": 3402, "loss": 0.2017, "learning_rate": 3.9979971043208656e-05, "epoch": 0.13227513227513227, "percentage": 4.41, "elapsed_time": "0:20:13", "remaining_time": "7:18:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 160, "total_steps": 3402, "loss": 0.2026, "learning_rate": 3.997054370022701e-05, "epoch": 0.14109347442680775, "percentage": 4.7, "elapsed_time": "0:21:33", "remaining_time": "7:16:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 170, "total_steps": 3402, "loss": 0.1972, "learning_rate": 3.995930534360642e-05, "epoch": 0.14991181657848324, "percentage": 5.0, "elapsed_time": "0:22:53", "remaining_time": "7:15:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 180, "total_steps": 3402, "loss": 0.1947, "learning_rate": 3.994625699248876e-05, "epoch": 0.15873015873015872, "percentage": 5.29, "elapsed_time": "0:24:12", "remaining_time": "7:13:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 190, "total_steps": 3402, "loss": 0.1971, "learning_rate": 3.993139983015388e-05, "epoch": 0.1675485008818342, "percentage": 5.58, "elapsed_time": "0:25:32", "remaining_time": "7:11:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 200, "total_steps": 3402, "loss": 0.1925, "learning_rate": 3.9914735203912274e-05, "epoch": 0.1763668430335097, "percentage": 5.88, "elapsed_time": "0:26:52", "remaining_time": "7:10:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 210, "total_steps": 3402, "loss": 0.192, "learning_rate": 3.989626462498299e-05, "epoch": 0.18518518518518517, "percentage": 6.17, "elapsed_time": "0:28:12", "remaining_time": "7:08:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 220, "total_steps": 3402, "loss": 0.1868, "learning_rate": 3.9875989768356474e-05, "epoch": 0.19400352733686066, "percentage": 6.47, "elapsed_time": "0:29:31", "remaining_time": "7:07:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 230, "total_steps": 3402, "loss": 0.1893, "learning_rate": 3.9853912472642766e-05, "epoch": 0.20282186948853614, "percentage": 6.76, "elapsed_time": "0:30:51", "remaining_time": "7:05:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 240, "total_steps": 3402, "loss": 0.1863, "learning_rate": 3.9830034739904716e-05, "epoch": 0.21164021164021163, "percentage": 7.05, "elapsed_time": "0:32:11", "remaining_time": "7:04:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 250, "total_steps": 3402, "loss": 0.1862, "learning_rate": 3.980435873547643e-05, "epoch": 0.2204585537918871, "percentage": 7.35, "elapsed_time": "0:33:33", "remaining_time": "7:03:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 260, "total_steps": 3402, "loss": 0.1851, "learning_rate": 3.977688678776695e-05, "epoch": 0.2292768959435626, "percentage": 7.64, "elapsed_time": "0:34:56", "remaining_time": "7:02:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 270, "total_steps": 3402, "loss": 0.1865, "learning_rate": 3.974762138804906e-05, "epoch": 0.23809523809523808, "percentage": 7.94, "elapsed_time": "0:36:17", "remaining_time": "7:00:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 280, "total_steps": 3402, "loss": 0.1817, "learning_rate": 3.971656519023337e-05, "epoch": 0.24691358024691357, "percentage": 8.23, "elapsed_time": "0:37:37", "remaining_time": "6:59:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 290, "total_steps": 3402, "loss": 0.1818, "learning_rate": 3.9683721010627666e-05, "epoch": 0.25573192239858905, "percentage": 8.52, "elapsed_time": "0:38:57", "remaining_time": "6:58:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 300, "total_steps": 3402, "loss": 0.18, "learning_rate": 3.964909182768153e-05, "epoch": 0.26455026455026454, "percentage": 8.82, "elapsed_time": "0:40:17", "remaining_time": "6:56:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 310, "total_steps": 3402, "loss": 0.1803, "learning_rate": 3.9612680781716203e-05, "epoch": 0.27336860670194, "percentage": 9.11, "elapsed_time": "0:41:37", "remaining_time": "6:55:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 320, "total_steps": 3402, "loss": 0.1789, "learning_rate": 3.9574491174639824e-05, "epoch": 0.2821869488536155, "percentage": 9.41, "elapsed_time": "0:42:56", "remaining_time": "6:53:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 330, "total_steps": 3402, "loss": 0.178, "learning_rate": 3.9534526469648e-05, "epoch": 0.291005291005291, "percentage": 9.7, "elapsed_time": "0:44:16", "remaining_time": "6:52:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 340, "total_steps": 3402, "loss": 0.179, "learning_rate": 3.949279029090976e-05, "epoch": 0.2998236331569665, "percentage": 9.99, "elapsed_time": "0:45:36", "remaining_time": "6:50:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 350, "total_steps": 3402, "loss": 0.1786, "learning_rate": 3.944928642323887e-05, "epoch": 0.30864197530864196, "percentage": 10.29, "elapsed_time": "0:46:56", "remaining_time": "6:49:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 360, "total_steps": 3402, "loss": 0.18, "learning_rate": 3.940401881175065e-05, "epoch": 0.31746031746031744, "percentage": 10.58, "elapsed_time": "0:48:16", "remaining_time": "6:47:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 370, "total_steps": 3402, "loss": 0.1776, "learning_rate": 3.9356991561504177e-05, "epoch": 0.3262786596119929, "percentage": 10.88, "elapsed_time": "0:49:35", "remaining_time": "6:46:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 380, "total_steps": 3402, "loss": 0.1763, "learning_rate": 3.9308208937130046e-05, "epoch": 0.3350970017636684, "percentage": 11.17, "elapsed_time": "0:50:55", "remaining_time": "6:45:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 390, "total_steps": 3402, "loss": 0.1751, "learning_rate": 3.925767536244362e-05, "epoch": 0.3439153439153439, "percentage": 11.46, "elapsed_time": "0:52:15", "remaining_time": "6:43:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 400, "total_steps": 3402, "loss": 0.1745, "learning_rate": 3.920539542004387e-05, "epoch": 0.3527336860670194, "percentage": 11.76, "elapsed_time": "0:53:35", "remaining_time": "6:42:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 410, "total_steps": 3402, "loss": 0.1749, "learning_rate": 3.915137385089781e-05, "epoch": 0.36155202821869487, "percentage": 12.05, "elapsed_time": "0:54:54", "remaining_time": "6:40:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 420, "total_steps": 3402, "loss": 0.174, "learning_rate": 3.909561555391053e-05, "epoch": 0.37037037037037035, "percentage": 12.35, "elapsed_time": "0:56:14", "remaining_time": "6:39:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 430, "total_steps": 3402, "loss": 0.1734, "learning_rate": 3.903812558548099e-05, "epoch": 0.37918871252204583, "percentage": 12.64, "elapsed_time": "0:57:34", "remaining_time": "6:37:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 440, "total_steps": 3402, "loss": 0.174, "learning_rate": 3.8978909159043465e-05, "epoch": 0.3880070546737213, "percentage": 12.93, "elapsed_time": "0:58:54", "remaining_time": "6:36:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 450, "total_steps": 3402, "loss": 0.1715, "learning_rate": 3.891797164459477e-05, "epoch": 0.3968253968253968, "percentage": 13.23, "elapsed_time": "1:00:14", "remaining_time": "6:35:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 460, "total_steps": 3402, "loss": 0.1707, "learning_rate": 3.885531856820726e-05, "epoch": 0.4056437389770723, "percentage": 13.52, "elapsed_time": "1:01:33", "remaining_time": "6:33:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 470, "total_steps": 3402, "loss": 0.1702, "learning_rate": 3.8790955611527754e-05, "epoch": 0.4144620811287478, "percentage": 13.82, "elapsed_time": "1:02:53", "remaining_time": "6:32:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 480, "total_steps": 3402, "loss": 0.1688, "learning_rate": 3.872488861126226e-05, "epoch": 0.42328042328042326, "percentage": 14.11, "elapsed_time": "1:04:13", "remaining_time": "6:30:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 490, "total_steps": 3402, "loss": 0.169, "learning_rate": 3.865712355864668e-05, "epoch": 0.43209876543209874, "percentage": 14.4, "elapsed_time": "1:05:33", "remaining_time": "6:29:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 500, "total_steps": 3402, "loss": 0.1672, "learning_rate": 3.8587666598903526e-05, "epoch": 0.4409171075837742, "percentage": 14.7, "elapsed_time": "1:06:52", "remaining_time": "6:28:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 510, "total_steps": 3402, "loss": 0.1726, "learning_rate": 3.851652403068461e-05, "epoch": 0.4497354497354497, "percentage": 14.99, "elapsed_time": "1:08:12", "remaining_time": "6:26:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 520, "total_steps": 3402, "loss": 0.1704, "learning_rate": 3.8443702305499886e-05, "epoch": 0.4585537918871252, "percentage": 15.29, "elapsed_time": "1:09:32", "remaining_time": "6:25:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 530, "total_steps": 3402, "loss": 0.1671, "learning_rate": 3.836920802713238e-05, "epoch": 0.4673721340388007, "percentage": 15.58, "elapsed_time": "1:10:52", "remaining_time": "6:24:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 540, "total_steps": 3402, "loss": 0.1672, "learning_rate": 3.829304795103933e-05, "epoch": 0.47619047619047616, "percentage": 15.87, "elapsed_time": "1:12:12", "remaining_time": "6:22:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 550, "total_steps": 3402, "loss": 0.1666, "learning_rate": 3.82152289837396e-05, "epoch": 0.48500881834215165, "percentage": 16.17, "elapsed_time": "1:13:31", "remaining_time": "6:21:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 560, "total_steps": 3402, "loss": 0.1686, "learning_rate": 3.813575818218732e-05, "epoch": 0.49382716049382713, "percentage": 16.46, "elapsed_time": "1:14:51", "remaining_time": "6:19:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 570, "total_steps": 3402, "loss": 0.1669, "learning_rate": 3.8054642753132e-05, "epoch": 0.5026455026455027, "percentage": 16.75, "elapsed_time": "1:16:11", "remaining_time": "6:18:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 580, "total_steps": 3402, "loss": 0.1622, "learning_rate": 3.797189005246489e-05, "epoch": 0.5114638447971781, "percentage": 17.05, "elapsed_time": "1:17:31", "remaining_time": "6:17:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 590, "total_steps": 3402, "loss": 0.1629, "learning_rate": 3.788750758455204e-05, "epoch": 0.5202821869488536, "percentage": 17.34, "elapsed_time": "1:18:50", "remaining_time": "6:15:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 600, "total_steps": 3402, "loss": 0.1682, "learning_rate": 3.7801503001553664e-05, "epoch": 0.5291005291005291, "percentage": 17.64, "elapsed_time": "1:20:10", "remaining_time": "6:14:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 610, "total_steps": 3402, "loss": 0.1672, "learning_rate": 3.771388410273027e-05, "epoch": 0.5379188712522046, "percentage": 17.93, "elapsed_time": "1:21:30", "remaining_time": "6:13:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 620, "total_steps": 3402, "loss": 0.1618, "learning_rate": 3.762465883373539e-05, "epoch": 0.54673721340388, "percentage": 18.22, "elapsed_time": "1:22:50", "remaining_time": "6:11:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 630, "total_steps": 3402, "loss": 0.1639, "learning_rate": 3.753383528589499e-05, "epoch": 0.5555555555555556, "percentage": 18.52, "elapsed_time": "1:24:10", "remaining_time": "6:10:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 640, "total_steps": 3402, "loss": 0.1603, "learning_rate": 3.744142169547376e-05, "epoch": 0.564373897707231, "percentage": 18.81, "elapsed_time": "1:25:29", "remaining_time": "6:08:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 650, "total_steps": 3402, "loss": 0.1627, "learning_rate": 3.734742644292821e-05, "epoch": 0.5731922398589065, "percentage": 19.11, "elapsed_time": "1:26:50", "remaining_time": "6:07:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 660, "total_steps": 3402, "loss": 0.1639, "learning_rate": 3.725185805214665e-05, "epoch": 0.582010582010582, "percentage": 19.4, "elapsed_time": "1:28:09", "remaining_time": "6:06:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 670, "total_steps": 3402, "loss": 0.1619, "learning_rate": 3.7154725189676264e-05, "epoch": 0.5908289241622575, "percentage": 19.69, "elapsed_time": "1:29:30", "remaining_time": "6:04:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 680, "total_steps": 3402, "loss": 0.165, "learning_rate": 3.7056036663937164e-05, "epoch": 0.599647266313933, "percentage": 19.99, "elapsed_time": "1:30:53", "remaining_time": "6:03:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 690, "total_steps": 3402, "loss": 0.1614, "learning_rate": 3.695580142442361e-05, "epoch": 0.6084656084656085, "percentage": 20.28, "elapsed_time": "1:32:15", "remaining_time": "6:02:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 700, "total_steps": 3402, "loss": 0.1618, "learning_rate": 3.685402856089242e-05, "epoch": 0.6172839506172839, "percentage": 20.58, "elapsed_time": "1:33:35", "remaining_time": "6:01:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 710, "total_steps": 3402, "loss": 0.1655, "learning_rate": 3.675072730253868e-05, "epoch": 0.6261022927689595, "percentage": 20.87, "elapsed_time": "1:34:55", "remaining_time": "5:59:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 720, "total_steps": 3402, "loss": 0.1608, "learning_rate": 3.6645907017158814e-05, "epoch": 0.6349206349206349, "percentage": 21.16, "elapsed_time": "1:36:15", "remaining_time": "5:58:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 730, "total_steps": 3402, "loss": 0.1606, "learning_rate": 3.653957721030107e-05, "epoch": 0.6437389770723104, "percentage": 21.46, "elapsed_time": "1:37:35", "remaining_time": "5:57:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 740, "total_steps": 3402, "loss": 0.1624, "learning_rate": 3.64317475244035e-05, "epoch": 0.6525573192239859, "percentage": 21.75, "elapsed_time": "1:38:55", "remaining_time": "5:55:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 750, "total_steps": 3402, "loss": 0.1605, "learning_rate": 3.632242773791952e-05, "epoch": 0.6613756613756614, "percentage": 22.05, "elapsed_time": "1:40:15", "remaining_time": "5:54:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 760, "total_steps": 3402, "loss": 0.1597, "learning_rate": 3.621162776443125e-05, "epoch": 0.6701940035273368, "percentage": 22.34, "elapsed_time": "1:41:35", "remaining_time": "5:53:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 770, "total_steps": 3402, "loss": 0.1609, "learning_rate": 3.60993576517504e-05, "epoch": 0.6790123456790124, "percentage": 22.63, "elapsed_time": "1:42:54", "remaining_time": "5:51:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 780, "total_steps": 3402, "loss": 0.1607, "learning_rate": 3.598562758100716e-05, "epoch": 0.6878306878306878, "percentage": 22.93, "elapsed_time": "1:44:14", "remaining_time": "5:50:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 790, "total_steps": 3402, "loss": 0.1606, "learning_rate": 3.5870447865726913e-05, "epoch": 0.6966490299823633, "percentage": 23.22, "elapsed_time": "1:45:34", "remaining_time": "5:49:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 800, "total_steps": 3402, "loss": 0.161, "learning_rate": 3.575382895089495e-05, "epoch": 0.7054673721340388, "percentage": 23.52, "elapsed_time": "1:46:54", "remaining_time": "5:47:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 810, "total_steps": 3402, "loss": 0.1592, "learning_rate": 3.563578141200929e-05, "epoch": 0.7142857142857143, "percentage": 23.81, "elapsed_time": "1:48:14", "remaining_time": "5:46:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 820, "total_steps": 3402, "loss": 0.1596, "learning_rate": 3.551631595412164e-05, "epoch": 0.7231040564373897, "percentage": 24.1, "elapsed_time": "1:49:33", "remaining_time": "5:44:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 830, "total_steps": 3402, "loss": 0.1565, "learning_rate": 3.539544341086663e-05, "epoch": 0.7319223985890653, "percentage": 24.4, "elapsed_time": "1:50:53", "remaining_time": "5:43:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 840, "total_steps": 3402, "loss": 0.1581, "learning_rate": 3.5273174743479336e-05, "epoch": 0.7407407407407407, "percentage": 24.69, "elapsed_time": "1:52:13", "remaining_time": "5:42:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 850, "total_steps": 3402, "loss": 0.1598, "learning_rate": 3.514952103980132e-05, "epoch": 0.7495590828924162, "percentage": 24.99, "elapsed_time": "1:53:33", "remaining_time": "5:40:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 860, "total_steps": 3402, "loss": 0.1586, "learning_rate": 3.50244935132751e-05, "epoch": 0.7583774250440917, "percentage": 25.28, "elapsed_time": "1:54:53", "remaining_time": "5:39:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 870, "total_steps": 3402, "loss": 0.1559, "learning_rate": 3.489810350192729e-05, "epoch": 0.7671957671957672, "percentage": 25.57, "elapsed_time": "1:56:12", "remaining_time": "5:38:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 880, "total_steps": 3402, "loss": 0.1563, "learning_rate": 3.477036246734038e-05, "epoch": 0.7760141093474426, "percentage": 25.87, "elapsed_time": "1:57:32", "remaining_time": "5:36:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 890, "total_steps": 3402, "loss": 0.1596, "learning_rate": 3.4641281993613406e-05, "epoch": 0.7848324514991182, "percentage": 26.16, "elapsed_time": "1:58:52", "remaining_time": "5:35:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 900, "total_steps": 3402, "loss": 0.1579, "learning_rate": 3.451087378631143e-05, "epoch": 0.7936507936507936, "percentage": 26.46, "elapsed_time": "2:00:12", "remaining_time": "5:34:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 910, "total_steps": 3402, "loss": 0.1571, "learning_rate": 3.437914967140401e-05, "epoch": 0.8024691358024691, "percentage": 26.75, "elapsed_time": "2:01:32", "remaining_time": "5:32:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 920, "total_steps": 3402, "loss": 0.157, "learning_rate": 3.4246121594192814e-05, "epoch": 0.8112874779541446, "percentage": 27.04, "elapsed_time": "2:02:51", "remaining_time": "5:31:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 930, "total_steps": 3402, "loss": 0.1554, "learning_rate": 3.411180161822831e-05, "epoch": 0.8201058201058201, "percentage": 27.34, "elapsed_time": "2:04:11", "remaining_time": "5:30:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 940, "total_steps": 3402, "loss": 0.1557, "learning_rate": 3.3976201924215854e-05, "epoch": 0.8289241622574955, "percentage": 27.63, "elapsed_time": "2:05:31", "remaining_time": "5:28:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 950, "total_steps": 3402, "loss": 0.155, "learning_rate": 3.3839334808911057e-05, "epoch": 0.8377425044091711, "percentage": 27.92, "elapsed_time": "2:06:51", "remaining_time": "5:27:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 960, "total_steps": 3402, "loss": 0.1554, "learning_rate": 3.370121268400467e-05, "epoch": 0.8465608465608465, "percentage": 28.22, "elapsed_time": "2:08:10", "remaining_time": "5:26:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 970, "total_steps": 3402, "loss": 0.1543, "learning_rate": 3.356184807499705e-05, "epoch": 0.855379188712522, "percentage": 28.51, "elapsed_time": "2:09:30", "remaining_time": "5:24:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 980, "total_steps": 3402, "loss": 0.1552, "learning_rate": 3.342125362006226e-05, "epoch": 0.8641975308641975, "percentage": 28.81, "elapsed_time": "2:10:50", "remaining_time": "5:23:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 990, "total_steps": 3402, "loss": 0.155, "learning_rate": 3.3279442068902024e-05, "epoch": 0.873015873015873, "percentage": 29.1, "elapsed_time": "2:12:10", "remaining_time": "5:22:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1000, "total_steps": 3402, "loss": 0.1559, "learning_rate": 3.3136426281589525e-05, "epoch": 0.8818342151675485, "percentage": 29.39, "elapsed_time": "2:13:30", "remaining_time": "5:20:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1010, "total_steps": 3402, "loss": 0.1555, "learning_rate": 3.299221922740318e-05, "epoch": 0.890652557319224, "percentage": 29.69, "elapsed_time": "2:14:49", "remaining_time": "5:19:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1020, "total_steps": 3402, "loss": 0.1544, "learning_rate": 3.284683398365053e-05, "epoch": 0.8994708994708994, "percentage": 29.98, "elapsed_time": "2:16:09", "remaining_time": "5:17:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1030, "total_steps": 3402, "loss": 0.156, "learning_rate": 3.270028373448237e-05, "epoch": 0.908289241622575, "percentage": 30.28, "elapsed_time": "2:17:29", "remaining_time": "5:16:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1040, "total_steps": 3402, "loss": 0.1525, "learning_rate": 3.255258176969711e-05, "epoch": 0.9171075837742504, "percentage": 30.57, "elapsed_time": "2:18:49", "remaining_time": "5:15:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1050, "total_steps": 3402, "loss": 0.1579, "learning_rate": 3.2403741483535624e-05, "epoch": 0.9259259259259259, "percentage": 30.86, "elapsed_time": "2:20:09", "remaining_time": "5:13:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1060, "total_steps": 3402, "loss": 0.1545, "learning_rate": 3.22537763734666e-05, "epoch": 0.9347442680776014, "percentage": 31.16, "elapsed_time": "2:21:28", "remaining_time": "5:12:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1070, "total_steps": 3402, "loss": 0.1523, "learning_rate": 3.210270003896254e-05, "epoch": 0.9435626102292769, "percentage": 31.45, "elapsed_time": "2:22:49", "remaining_time": "5:11:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1080, "total_steps": 3402, "loss": 0.1498, "learning_rate": 3.195052618026646e-05, "epoch": 0.9523809523809523, "percentage": 31.75, "elapsed_time": "2:24:08", "remaining_time": "5:09:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1090, "total_steps": 3402, "loss": 0.1533, "learning_rate": 3.1797268597149575e-05, "epoch": 0.9611992945326279, "percentage": 32.04, "elapsed_time": "2:25:29", "remaining_time": "5:08:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1100, "total_steps": 3402, "loss": 0.1505, "learning_rate": 3.1642941187659784e-05, "epoch": 0.9700176366843033, "percentage": 32.33, "elapsed_time": "2:26:50", "remaining_time": "5:07:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1110, "total_steps": 3402, "loss": 0.154, "learning_rate": 3.1487557946861413e-05, "epoch": 0.9788359788359788, "percentage": 32.63, "elapsed_time": "2:28:11", "remaining_time": "5:06:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1120, "total_steps": 3402, "loss": 0.1495, "learning_rate": 3.133113296556603e-05, "epoch": 0.9876543209876543, "percentage": 32.92, "elapsed_time": "2:29:32", "remaining_time": "5:04:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1130, "total_steps": 3402, "loss": 0.1517, "learning_rate": 3.117368042905466e-05, "epoch": 0.9964726631393298, "percentage": 33.22, "elapsed_time": "2:30:53", "remaining_time": "5:03:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1140, "total_steps": 3402, "loss": 0.1409, "learning_rate": 3.101521461579139e-05, "epoch": 1.0052910052910053, "percentage": 33.51, "elapsed_time": "2:32:50", "remaining_time": "5:03:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1150, "total_steps": 3402, "loss": 0.1321, "learning_rate": 3.085574989612856e-05, "epoch": 1.0141093474426808, "percentage": 33.8, "elapsed_time": "2:34:10", "remaining_time": "5:01:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1160, "total_steps": 3402, "loss": 0.1313, "learning_rate": 3.069530073100356e-05, "epoch": 1.0229276895943562, "percentage": 34.1, "elapsed_time": "2:35:30", "remaining_time": "5:00:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1170, "total_steps": 3402, "loss": 0.1321, "learning_rate": 3.053388167062747e-05, "epoch": 1.0317460317460316, "percentage": 34.39, "elapsed_time": "2:36:49", "remaining_time": "4:59:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1180, "total_steps": 3402, "loss": 0.1332, "learning_rate": 3.037150735316561e-05, "epoch": 1.0405643738977073, "percentage": 34.69, "elapsed_time": "2:38:09", "remaining_time": "4:57:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1190, "total_steps": 3402, "loss": 0.131, "learning_rate": 3.0208192503410046e-05, "epoch": 1.0493827160493827, "percentage": 34.98, "elapsed_time": "2:39:29", "remaining_time": "4:56:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1200, "total_steps": 3402, "loss": 0.1327, "learning_rate": 3.0043951931444302e-05, "epoch": 1.0582010582010581, "percentage": 35.27, "elapsed_time": "2:40:49", "remaining_time": "4:55:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1210, "total_steps": 3402, "loss": 0.1337, "learning_rate": 2.9878800531300335e-05, "epoch": 1.0670194003527338, "percentage": 35.57, "elapsed_time": "2:42:09", "remaining_time": "4:53:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1220, "total_steps": 3402, "loss": 0.1364, "learning_rate": 2.9712753279607852e-05, "epoch": 1.0758377425044092, "percentage": 35.86, "elapsed_time": "2:43:29", "remaining_time": "4:52:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1230, "total_steps": 3402, "loss": 0.1306, "learning_rate": 2.9545825234236187e-05, "epoch": 1.0846560846560847, "percentage": 36.16, "elapsed_time": "2:44:48", "remaining_time": "4:51:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1240, "total_steps": 3402, "loss": 0.1342, "learning_rate": 2.937803153292878e-05, "epoch": 1.09347442680776, "percentage": 36.45, "elapsed_time": "2:46:08", "remaining_time": "4:49:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1250, "total_steps": 3402, "loss": 0.1341, "learning_rate": 2.9209387391930425e-05, "epoch": 1.1022927689594355, "percentage": 36.74, "elapsed_time": "2:47:28", "remaining_time": "4:48:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1260, "total_steps": 3402, "loss": 0.1333, "learning_rate": 2.9039908104607395e-05, "epoch": 1.1111111111111112, "percentage": 37.04, "elapsed_time": "2:48:48", "remaining_time": "4:46:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1270, "total_steps": 3402, "loss": 0.1336, "learning_rate": 2.8869609040060572e-05, "epoch": 1.1199294532627866, "percentage": 37.33, "elapsed_time": "2:50:08", "remaining_time": "4:45:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1280, "total_steps": 3402, "loss": 0.1323, "learning_rate": 2.869850564173172e-05, "epoch": 1.128747795414462, "percentage": 37.62, "elapsed_time": "2:51:27", "remaining_time": "4:44:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1290, "total_steps": 3402, "loss": 0.1319, "learning_rate": 2.8526613426002998e-05, "epoch": 1.1375661375661377, "percentage": 37.92, "elapsed_time": "2:52:47", "remaining_time": "4:42:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1300, "total_steps": 3402, "loss": 0.1321, "learning_rate": 2.835394798078988e-05, "epoch": 1.146384479717813, "percentage": 38.21, "elapsed_time": "2:54:07", "remaining_time": "4:41:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1310, "total_steps": 3402, "loss": 0.1317, "learning_rate": 2.8180524964127573e-05, "epoch": 1.1552028218694885, "percentage": 38.51, "elapsed_time": "2:55:27", "remaining_time": "4:40:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1320, "total_steps": 3402, "loss": 0.1322, "learning_rate": 2.8006360102751064e-05, "epoch": 1.164021164021164, "percentage": 38.8, "elapsed_time": "2:56:47", "remaining_time": "4:38:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1330, "total_steps": 3402, "loss": 0.133, "learning_rate": 2.7831469190668974e-05, "epoch": 1.1728395061728394, "percentage": 39.09, "elapsed_time": "2:58:06", "remaining_time": "4:37:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1340, "total_steps": 3402, "loss": 0.1317, "learning_rate": 2.7655868087731295e-05, "epoch": 1.181657848324515, "percentage": 39.39, "elapsed_time": "2:59:26", "remaining_time": "4:36:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1350, "total_steps": 3402, "loss": 0.1333, "learning_rate": 2.7479572718191108e-05, "epoch": 1.1904761904761905, "percentage": 39.68, "elapsed_time": "3:00:46", "remaining_time": "4:34:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1360, "total_steps": 3402, "loss": 0.1309, "learning_rate": 2.7302599069260572e-05, "epoch": 1.199294532627866, "percentage": 39.98, "elapsed_time": "3:02:06", "remaining_time": "4:33:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1370, "total_steps": 3402, "loss": 0.1314, "learning_rate": 2.712496318966108e-05, "epoch": 1.2081128747795415, "percentage": 40.27, "elapsed_time": "3:03:26", "remaining_time": "4:32:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1380, "total_steps": 3402, "loss": 0.1334, "learning_rate": 2.69466811881679e-05, "epoch": 1.216931216931217, "percentage": 40.56, "elapsed_time": "3:04:45", "remaining_time": "4:30:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1390, "total_steps": 3402, "loss": 0.1331, "learning_rate": 2.67677692321494e-05, "epoch": 1.2257495590828924, "percentage": 40.86, "elapsed_time": "3:06:05", "remaining_time": "4:29:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1400, "total_steps": 3402, "loss": 0.1313, "learning_rate": 2.6588243546100882e-05, "epoch": 1.2345679012345678, "percentage": 41.15, "elapsed_time": "3:07:25", "remaining_time": "4:28:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1410, "total_steps": 3402, "loss": 0.1287, "learning_rate": 2.6408120410173296e-05, "epoch": 1.2433862433862433, "percentage": 41.45, "elapsed_time": "3:08:45", "remaining_time": "4:26:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1420, "total_steps": 3402, "loss": 0.1297, "learning_rate": 2.6227416158696884e-05, "epoch": 1.252204585537919, "percentage": 41.74, "elapsed_time": "3:10:05", "remaining_time": "4:25:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1430, "total_steps": 3402, "loss": 0.1309, "learning_rate": 2.60461471786999e-05, "epoch": 1.2610229276895943, "percentage": 42.03, "elapsed_time": "3:11:25", "remaining_time": "4:23:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1440, "total_steps": 3402, "loss": 0.1292, "learning_rate": 2.5864329908422597e-05, "epoch": 1.2698412698412698, "percentage": 42.33, "elapsed_time": "3:12:45", "remaining_time": "4:22:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1450, "total_steps": 3402, "loss": 0.1295, "learning_rate": 2.5681980835826503e-05, "epoch": 1.2786596119929454, "percentage": 42.62, "elapsed_time": "3:14:05", "remaining_time": "4:21:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1460, "total_steps": 3402, "loss": 0.1314, "learning_rate": 2.5499116497099224e-05, "epoch": 1.2874779541446209, "percentage": 42.92, "elapsed_time": "3:15:25", "remaining_time": "4:19:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1470, "total_steps": 3402, "loss": 0.1318, "learning_rate": 2.531575347515492e-05, "epoch": 1.2962962962962963, "percentage": 43.21, "elapsed_time": "3:16:47", "remaining_time": "4:18:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1480, "total_steps": 3402, "loss": 0.1291, "learning_rate": 2.5131908398130426e-05, "epoch": 1.3051146384479717, "percentage": 43.5, "elapsed_time": "3:18:09", "remaining_time": "4:17:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1490, "total_steps": 3402, "loss": 0.1299, "learning_rate": 2.49475979378774e-05, "epoch": 1.3139329805996471, "percentage": 43.8, "elapsed_time": "3:19:31", "remaining_time": "4:16:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1500, "total_steps": 3402, "loss": 0.1333, "learning_rate": 2.476283880845042e-05, "epoch": 1.3227513227513228, "percentage": 44.09, "elapsed_time": "3:20:52", "remaining_time": "4:14:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1510, "total_steps": 3402, "loss": 0.1311, "learning_rate": 2.4577647764591276e-05, "epoch": 1.3315696649029982, "percentage": 44.39, "elapsed_time": "3:22:14", "remaining_time": "4:13:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1520, "total_steps": 3402, "loss": 0.1298, "learning_rate": 2.4392041600209608e-05, "epoch": 1.3403880070546736, "percentage": 44.68, "elapsed_time": "3:23:35", "remaining_time": "4:12:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1530, "total_steps": 3402, "loss": 0.1266, "learning_rate": 2.4206037146859944e-05, "epoch": 1.3492063492063493, "percentage": 44.97, "elapsed_time": "3:24:55", "remaining_time": "4:10:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1540, "total_steps": 3402, "loss": 0.131, "learning_rate": 2.4019651272215338e-05, "epoch": 1.3580246913580247, "percentage": 45.27, "elapsed_time": "3:26:15", "remaining_time": "4:09:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1550, "total_steps": 3402, "loss": 0.1327, "learning_rate": 2.383290087853775e-05, "epoch": 1.3668430335097002, "percentage": 45.56, "elapsed_time": "3:27:35", "remaining_time": "4:08:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1560, "total_steps": 3402, "loss": 0.1328, "learning_rate": 2.364580290114527e-05, "epoch": 1.3756613756613756, "percentage": 45.86, "elapsed_time": "3:28:55", "remaining_time": "4:06:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1570, "total_steps": 3402, "loss": 0.1337, "learning_rate": 2.3458374306876355e-05, "epoch": 1.384479717813051, "percentage": 46.15, "elapsed_time": "3:30:15", "remaining_time": "4:05:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1580, "total_steps": 3402, "loss": 0.128, "learning_rate": 2.327063209255121e-05, "epoch": 1.3932980599647267, "percentage": 46.44, "elapsed_time": "3:31:35", "remaining_time": "4:03:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1590, "total_steps": 3402, "loss": 0.1294, "learning_rate": 2.308259328343042e-05, "epoch": 1.402116402116402, "percentage": 46.74, "elapsed_time": "3:32:55", "remaining_time": "4:02:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1600, "total_steps": 3402, "loss": 0.1291, "learning_rate": 2.289427493167107e-05, "epoch": 1.4109347442680775, "percentage": 47.03, "elapsed_time": "3:34:14", "remaining_time": "4:01:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1610, "total_steps": 3402, "loss": 0.1274, "learning_rate": 2.270569411478033e-05, "epoch": 1.4197530864197532, "percentage": 47.33, "elapsed_time": "3:35:34", "remaining_time": "3:59:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1620, "total_steps": 3402, "loss": 0.1297, "learning_rate": 2.251686793406684e-05, "epoch": 1.4285714285714286, "percentage": 47.62, "elapsed_time": "3:36:54", "remaining_time": "3:58:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1630, "total_steps": 3402, "loss": 0.1302, "learning_rate": 2.2327813513089875e-05, "epoch": 1.437389770723104, "percentage": 47.91, "elapsed_time": "3:38:14", "remaining_time": "3:57:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1640, "total_steps": 3402, "loss": 0.1285, "learning_rate": 2.213854799610649e-05, "epoch": 1.4462081128747795, "percentage": 48.21, "elapsed_time": "3:39:34", "remaining_time": "3:55:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1650, "total_steps": 3402, "loss": 0.1289, "learning_rate": 2.194908854651683e-05, "epoch": 1.455026455026455, "percentage": 48.5, "elapsed_time": "3:40:54", "remaining_time": "3:54:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1660, "total_steps": 3402, "loss": 0.1275, "learning_rate": 2.1759452345307675e-05, "epoch": 1.4638447971781305, "percentage": 48.79, "elapsed_time": "3:42:14", "remaining_time": "3:53:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1670, "total_steps": 3402, "loss": 0.1266, "learning_rate": 2.1569656589494386e-05, "epoch": 1.472663139329806, "percentage": 49.09, "elapsed_time": "3:43:33", "remaining_time": "3:51:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1680, "total_steps": 3402, "loss": 0.1271, "learning_rate": 2.137971849056142e-05, "epoch": 1.4814814814814814, "percentage": 49.38, "elapsed_time": "3:44:53", "remaining_time": "3:50:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1690, "total_steps": 3402, "loss": 0.1288, "learning_rate": 2.1189655272901498e-05, "epoch": 1.490299823633157, "percentage": 49.68, "elapsed_time": "3:46:13", "remaining_time": "3:49:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1700, "total_steps": 3402, "loss": 0.1274, "learning_rate": 2.0999484172253654e-05, "epoch": 1.4991181657848325, "percentage": 49.97, "elapsed_time": "3:47:33", "remaining_time": "3:47:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1710, "total_steps": 3402, "loss": 0.1268, "learning_rate": 2.08092224341402e-05, "epoch": 1.507936507936508, "percentage": 50.26, "elapsed_time": "3:48:53", "remaining_time": "3:46:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1720, "total_steps": 3402, "loss": 0.1269, "learning_rate": 2.0618887312302838e-05, "epoch": 1.5167548500881836, "percentage": 50.56, "elapsed_time": "3:50:13", "remaining_time": "3:45:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1730, "total_steps": 3402, "loss": 0.1327, "learning_rate": 2.042849606713802e-05, "epoch": 1.5255731922398588, "percentage": 50.85, "elapsed_time": "3:51:32", "remaining_time": "3:43:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1740, "total_steps": 3402, "loss": 0.1289, "learning_rate": 2.02380659641317e-05, "epoch": 1.5343915343915344, "percentage": 51.15, "elapsed_time": "3:52:52", "remaining_time": "3:42:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1750, "total_steps": 3402, "loss": 0.1241, "learning_rate": 2.004761427229363e-05, "epoch": 1.5432098765432098, "percentage": 51.44, "elapsed_time": "3:54:12", "remaining_time": "3:41:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1760, "total_steps": 3402, "loss": 0.1283, "learning_rate": 1.985715826259131e-05, "epoch": 1.5520282186948853, "percentage": 51.73, "elapsed_time": "3:55:32", "remaining_time": "3:39:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1770, "total_steps": 3402, "loss": 0.1268, "learning_rate": 1.966671520638383e-05, "epoch": 1.560846560846561, "percentage": 52.03, "elapsed_time": "3:56:52", "remaining_time": "3:38:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1780, "total_steps": 3402, "loss": 0.1281, "learning_rate": 1.947630237385558e-05, "epoch": 1.5696649029982364, "percentage": 52.32, "elapsed_time": "3:58:11", "remaining_time": "3:37:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1790, "total_steps": 3402, "loss": 0.128, "learning_rate": 1.9285937032450146e-05, "epoch": 1.5784832451499118, "percentage": 52.62, "elapsed_time": "3:59:31", "remaining_time": "3:35:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1800, "total_steps": 3402, "loss": 0.1264, "learning_rate": 1.909563644530443e-05, "epoch": 1.5873015873015874, "percentage": 52.91, "elapsed_time": "4:00:51", "remaining_time": "3:34:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1810, "total_steps": 3402, "loss": 0.1268, "learning_rate": 1.8905417869683113e-05, "epoch": 1.5961199294532626, "percentage": 53.2, "elapsed_time": "4:02:11", "remaining_time": "3:33:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1820, "total_steps": 3402, "loss": 0.1249, "learning_rate": 1.871529855541375e-05, "epoch": 1.6049382716049383, "percentage": 53.5, "elapsed_time": "4:03:31", "remaining_time": "3:31:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1830, "total_steps": 3402, "loss": 0.1269, "learning_rate": 1.8525295743322453e-05, "epoch": 1.6137566137566137, "percentage": 53.79, "elapsed_time": "4:04:51", "remaining_time": "3:30:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1840, "total_steps": 3402, "loss": 0.1273, "learning_rate": 1.8335426663670397e-05, "epoch": 1.6225749559082892, "percentage": 54.09, "elapsed_time": "4:06:11", "remaining_time": "3:28:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1850, "total_steps": 3402, "loss": 0.1255, "learning_rate": 1.8145708534591377e-05, "epoch": 1.6313932980599648, "percentage": 54.38, "elapsed_time": "4:07:31", "remaining_time": "3:27:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1860, "total_steps": 3402, "loss": 0.1283, "learning_rate": 1.79561585605303e-05, "epoch": 1.6402116402116402, "percentage": 54.67, "elapsed_time": "4:08:51", "remaining_time": "3:26:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1870, "total_steps": 3402, "loss": 0.1254, "learning_rate": 1.7766793930683094e-05, "epoch": 1.6490299823633157, "percentage": 54.97, "elapsed_time": "4:10:11", "remaining_time": "3:24:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1880, "total_steps": 3402, "loss": 0.1244, "learning_rate": 1.7577631817437888e-05, "epoch": 1.6578483245149913, "percentage": 55.26, "elapsed_time": "4:11:32", "remaining_time": "3:23:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1890, "total_steps": 3402, "loss": 0.1232, "learning_rate": 1.7388689374817722e-05, "epoch": 1.6666666666666665, "percentage": 55.56, "elapsed_time": "4:12:52", "remaining_time": "3:22:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1900, "total_steps": 3402, "loss": 0.1259, "learning_rate": 1.719998373692499e-05, "epoch": 1.6754850088183422, "percentage": 55.85, "elapsed_time": "4:14:15", "remaining_time": "3:20:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1910, "total_steps": 3402, "loss": 0.1241, "learning_rate": 1.7011532016387637e-05, "epoch": 1.6843033509700176, "percentage": 56.14, "elapsed_time": "4:15:36", "remaining_time": "3:19:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1920, "total_steps": 3402, "loss": 0.1248, "learning_rate": 1.682335130280728e-05, "epoch": 1.693121693121693, "percentage": 56.44, "elapsed_time": "4:16:57", "remaining_time": "3:18:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1930, "total_steps": 3402, "loss": 0.1209, "learning_rate": 1.663545866120949e-05, "epoch": 1.7019400352733687, "percentage": 56.73, "elapsed_time": "4:18:18", "remaining_time": "3:17:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1940, "total_steps": 3402, "loss": 0.1239, "learning_rate": 1.6447871130496257e-05, "epoch": 1.710758377425044, "percentage": 57.03, "elapsed_time": "4:19:39", "remaining_time": "3:15:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1950, "total_steps": 3402, "loss": 0.1261, "learning_rate": 1.62606057219008e-05, "epoch": 1.7195767195767195, "percentage": 57.32, "elapsed_time": "4:20:59", "remaining_time": "3:14:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1960, "total_steps": 3402, "loss": 0.1266, "learning_rate": 1.6073679417444946e-05, "epoch": 1.7283950617283952, "percentage": 57.61, "elapsed_time": "4:22:19", "remaining_time": "3:12:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1970, "total_steps": 3402, "loss": 0.1225, "learning_rate": 1.588710916839914e-05, "epoch": 1.7372134038800704, "percentage": 57.91, "elapsed_time": "4:23:39", "remaining_time": "3:11:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1980, "total_steps": 3402, "loss": 0.1249, "learning_rate": 1.570091189374518e-05, "epoch": 1.746031746031746, "percentage": 58.2, "elapsed_time": "4:24:59", "remaining_time": "3:10:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1990, "total_steps": 3402, "loss": 0.1254, "learning_rate": 1.5515104478641975e-05, "epoch": 1.7548500881834215, "percentage": 58.5, "elapsed_time": "4:26:19", "remaining_time": "3:08:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2000, "total_steps": 3402, "loss": 0.1236, "learning_rate": 1.5329703772894327e-05, "epoch": 1.763668430335097, "percentage": 58.79, "elapsed_time": "4:27:39", "remaining_time": "3:07:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2010, "total_steps": 3402, "loss": 0.1242, "learning_rate": 1.51447265894249e-05, "epoch": 1.7724867724867726, "percentage": 59.08, "elapsed_time": "4:28:59", "remaining_time": "3:06:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2020, "total_steps": 3402, "loss": 0.1245, "learning_rate": 1.4960189702749551e-05, "epoch": 1.781305114638448, "percentage": 59.38, "elapsed_time": "4:30:18", "remaining_time": "3:04:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2030, "total_steps": 3402, "loss": 0.1226, "learning_rate": 1.4776109847456173e-05, "epoch": 1.7901234567901234, "percentage": 59.67, "elapsed_time": "4:31:38", "remaining_time": "3:03:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2040, "total_steps": 3402, "loss": 0.1243, "learning_rate": 1.4592503716687107e-05, "epoch": 1.798941798941799, "percentage": 59.96, "elapsed_time": "4:32:58", "remaining_time": "3:02:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2050, "total_steps": 3402, "loss": 0.1216, "learning_rate": 1.4409387960625331e-05, "epoch": 1.8077601410934743, "percentage": 60.26, "elapsed_time": "4:34:18", "remaining_time": "3:00:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2060, "total_steps": 3402, "loss": 0.1249, "learning_rate": 1.422677918498459e-05, "epoch": 1.81657848324515, "percentage": 60.55, "elapsed_time": "4:35:38", "remaining_time": "2:59:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2070, "total_steps": 3402, "loss": 0.1251, "learning_rate": 1.4044693949503465e-05, "epoch": 1.8253968253968254, "percentage": 60.85, "elapsed_time": "4:36:58", "remaining_time": "2:58:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2080, "total_steps": 3402, "loss": 0.1228, "learning_rate": 1.3863148766443723e-05, "epoch": 1.8342151675485008, "percentage": 61.14, "elapsed_time": "4:38:18", "remaining_time": "2:56:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2090, "total_steps": 3402, "loss": 0.1221, "learning_rate": 1.368216009909286e-05, "epoch": 1.8430335097001764, "percentage": 61.43, "elapsed_time": "4:39:37", "remaining_time": "2:55:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2100, "total_steps": 3402, "loss": 0.123, "learning_rate": 1.3501744360271177e-05, "epoch": 1.8518518518518519, "percentage": 61.73, "elapsed_time": "4:40:57", "remaining_time": "2:54:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2110, "total_steps": 3402, "loss": 0.1187, "learning_rate": 1.3321917910843394e-05, "epoch": 1.8606701940035273, "percentage": 62.02, "elapsed_time": "4:42:17", "remaining_time": "2:52:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2120, "total_steps": 3402, "loss": 0.1222, "learning_rate": 1.3142697058234952e-05, "epoch": 1.869488536155203, "percentage": 62.32, "elapsed_time": "4:43:37", "remaining_time": "2:51:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2130, "total_steps": 3402, "loss": 0.1205, "learning_rate": 1.2964098054953209e-05, "epoch": 1.8783068783068781, "percentage": 62.61, "elapsed_time": "4:44:57", "remaining_time": "2:50:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2140, "total_steps": 3402, "loss": 0.1194, "learning_rate": 1.2786137097113594e-05, "epoch": 1.8871252204585538, "percentage": 62.9, "elapsed_time": "4:46:17", "remaining_time": "2:48:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2150, "total_steps": 3402, "loss": 0.1234, "learning_rate": 1.2608830322970865e-05, "epoch": 1.8959435626102292, "percentage": 63.2, "elapsed_time": "4:47:36", "remaining_time": "2:47:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2160, "total_steps": 3402, "loss": 0.1237, "learning_rate": 1.2432193811455609e-05, "epoch": 1.9047619047619047, "percentage": 63.49, "elapsed_time": "4:48:56", "remaining_time": "2:46:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2170, "total_steps": 3402, "loss": 0.1216, "learning_rate": 1.2256243580716187e-05, "epoch": 1.9135802469135803, "percentage": 63.79, "elapsed_time": "4:50:16", "remaining_time": "2:44:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2180, "total_steps": 3402, "loss": 0.122, "learning_rate": 1.2080995586666085e-05, "epoch": 1.9223985890652557, "percentage": 64.08, "elapsed_time": "4:51:36", "remaining_time": "2:43:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2190, "total_steps": 3402, "loss": 0.1236, "learning_rate": 1.1906465721536984e-05, "epoch": 1.9312169312169312, "percentage": 64.37, "elapsed_time": "4:52:56", "remaining_time": "2:42:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2200, "total_steps": 3402, "loss": 0.1214, "learning_rate": 1.17326698124376e-05, "epoch": 1.9400352733686068, "percentage": 64.67, "elapsed_time": "4:54:15", "remaining_time": "2:40:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2210, "total_steps": 3402, "loss": 0.1212, "learning_rate": 1.1559623619918396e-05, "epoch": 1.948853615520282, "percentage": 64.96, "elapsed_time": "4:55:35", "remaining_time": "2:39:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2220, "total_steps": 3402, "loss": 0.1203, "learning_rate": 1.1387342836542353e-05, "epoch": 1.9576719576719577, "percentage": 65.26, "elapsed_time": "4:56:55", "remaining_time": "2:38:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2230, "total_steps": 3402, "loss": 0.1187, "learning_rate": 1.1215843085461912e-05, "epoch": 1.966490299823633, "percentage": 65.55, "elapsed_time": "4:58:15", "remaining_time": "2:36:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2240, "total_steps": 3402, "loss": 0.1185, "learning_rate": 1.1045139919002181e-05, "epoch": 1.9753086419753085, "percentage": 65.84, "elapsed_time": "4:59:35", "remaining_time": "2:35:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2250, "total_steps": 3402, "loss": 0.1223, "learning_rate": 1.087524881725059e-05, "epoch": 1.9841269841269842, "percentage": 66.14, "elapsed_time": "5:00:54", "remaining_time": "2:34:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2260, "total_steps": 3402, "loss": 0.1195, "learning_rate": 1.0706185186653108e-05, "epoch": 1.9929453262786596, "percentage": 66.43, "elapsed_time": "5:02:14", "remaining_time": "2:32:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2270, "total_steps": 3402, "loss": 0.1145, "learning_rate": 1.0537964358617114e-05, "epoch": 2.001763668430335, "percentage": 66.73, "elapsed_time": "5:04:12", "remaining_time": "2:31:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2280, "total_steps": 3402, "loss": 0.0971, "learning_rate": 1.0370601588121052e-05, "epoch": 2.0105820105820107, "percentage": 67.02, "elapsed_time": "5:05:34", "remaining_time": "2:30:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2290, "total_steps": 3402, "loss": 0.0983, "learning_rate": 1.0204112052331097e-05, "epoch": 2.019400352733686, "percentage": 67.31, "elapsed_time": "5:06:55", "remaining_time": "2:29:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2300, "total_steps": 3402, "loss": 0.097, "learning_rate": 1.0038510849224758e-05, "epoch": 2.0282186948853616, "percentage": 67.61, "elapsed_time": "5:08:17", "remaining_time": "2:27:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2310, "total_steps": 3402, "loss": 0.0942, "learning_rate": 9.87381299622181e-06, "epoch": 2.037037037037037, "percentage": 67.9, "elapsed_time": "5:09:38", "remaining_time": "2:26:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2320, "total_steps": 3402, "loss": 0.0952, "learning_rate": 9.710033428822368e-06, "epoch": 2.0458553791887124, "percentage": 68.2, "elapsed_time": "5:10:58", "remaining_time": "2:25:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2330, "total_steps": 3402, "loss": 0.0966, "learning_rate": 9.547186999252538e-06, "epoch": 2.054673721340388, "percentage": 68.49, "elapsed_time": "5:12:19", "remaining_time": "2:23:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2340, "total_steps": 3402, "loss": 0.0947, "learning_rate": 9.385288475117526e-06, "epoch": 2.0634920634920633, "percentage": 68.78, "elapsed_time": "5:13:40", "remaining_time": "2:22:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2350, "total_steps": 3402, "loss": 0.0961, "learning_rate": 9.224352538062441e-06, "epoch": 2.072310405643739, "percentage": 69.08, "elapsed_time": "5:15:01", "remaining_time": "2:21:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2360, "total_steps": 3402, "loss": 0.0935, "learning_rate": 9.06439378244091e-06, "epoch": 2.0811287477954146, "percentage": 69.37, "elapsed_time": "5:16:21", "remaining_time": "2:19:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2370, "total_steps": 3402, "loss": 0.098, "learning_rate": 8.905426713991609e-06, "epoch": 2.0899470899470898, "percentage": 69.66, "elapsed_time": "5:17:41", "remaining_time": "2:18:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2380, "total_steps": 3402, "loss": 0.0929, "learning_rate": 8.747465748522824e-06, "epoch": 2.0987654320987654, "percentage": 69.96, "elapsed_time": "5:19:01", "remaining_time": "2:16:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2390, "total_steps": 3402, "loss": 0.0938, "learning_rate": 8.590525210605125e-06, "epoch": 2.107583774250441, "percentage": 70.25, "elapsed_time": "5:20:20", "remaining_time": "2:15:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2400, "total_steps": 3402, "loss": 0.0933, "learning_rate": 8.434619332272412e-06, "epoch": 2.1164021164021163, "percentage": 70.55, "elapsed_time": "5:21:40", "remaining_time": "2:14:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2410, "total_steps": 3402, "loss": 0.0944, "learning_rate": 8.279762251731246e-06, "epoch": 2.125220458553792, "percentage": 70.84, "elapsed_time": "5:23:00", "remaining_time": "2:12:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2420, "total_steps": 3402, "loss": 0.092, "learning_rate": 8.125968012078745e-06, "epoch": 2.1340388007054676, "percentage": 71.13, "elapsed_time": "5:24:20", "remaining_time": "2:11:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2430, "total_steps": 3402, "loss": 0.0939, "learning_rate": 7.973250560029132e-06, "epoch": 2.142857142857143, "percentage": 71.43, "elapsed_time": "5:25:40", "remaining_time": "2:10:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2440, "total_steps": 3402, "loss": 0.0917, "learning_rate": 7.821623744648952e-06, "epoch": 2.1516754850088184, "percentage": 71.72, "elapsed_time": "5:27:00", "remaining_time": "2:08:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2450, "total_steps": 3402, "loss": 0.0942, "learning_rate": 7.671101316101172e-06, "epoch": 2.1604938271604937, "percentage": 72.02, "elapsed_time": "5:28:20", "remaining_time": "2:07:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2460, "total_steps": 3402, "loss": 0.0947, "learning_rate": 7.521696924398303e-06, "epoch": 2.1693121693121693, "percentage": 72.31, "elapsed_time": "5:29:39", "remaining_time": "2:06:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2470, "total_steps": 3402, "loss": 0.0944, "learning_rate": 7.373424118164501e-06, "epoch": 2.178130511463845, "percentage": 72.6, "elapsed_time": "5:30:59", "remaining_time": "2:04:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2480, "total_steps": 3402, "loss": 0.0941, "learning_rate": 7.226296343406974e-06, "epoch": 2.18694885361552, "percentage": 72.9, "elapsed_time": "5:32:19", "remaining_time": "2:03:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2490, "total_steps": 3402, "loss": 0.0922, "learning_rate": 7.0803269422966135e-06, "epoch": 2.195767195767196, "percentage": 73.19, "elapsed_time": "5:33:39", "remaining_time": "2:02:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2500, "total_steps": 3402, "loss": 0.0948, "learning_rate": 6.935529151958065e-06, "epoch": 2.204585537918871, "percentage": 73.49, "elapsed_time": "5:34:59", "remaining_time": "2:00:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2510, "total_steps": 3402, "loss": 0.0932, "learning_rate": 6.791916103269333e-06, "epoch": 2.2134038800705467, "percentage": 73.78, "elapsed_time": "5:36:18", "remaining_time": "1:59:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2520, "total_steps": 3402, "loss": 0.0955, "learning_rate": 6.649500819671047e-06, "epoch": 2.2222222222222223, "percentage": 74.07, "elapsed_time": "5:37:38", "remaining_time": "1:58:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2530, "total_steps": 3402, "loss": 0.0898, "learning_rate": 6.5082962159853834e-06, "epoch": 2.2310405643738975, "percentage": 74.37, "elapsed_time": "5:38:58", "remaining_time": "1:56:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2540, "total_steps": 3402, "loss": 0.0917, "learning_rate": 6.368315097244955e-06, "epoch": 2.239858906525573, "percentage": 74.66, "elapsed_time": "5:40:18", "remaining_time": "1:55:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2550, "total_steps": 3402, "loss": 0.0916, "learning_rate": 6.2295701575315594e-06, "epoch": 2.248677248677249, "percentage": 74.96, "elapsed_time": "5:41:38", "remaining_time": "1:54:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2560, "total_steps": 3402, "loss": 0.0927, "learning_rate": 6.092073978825022e-06, "epoch": 2.257495590828924, "percentage": 75.25, "elapsed_time": "5:42:58", "remaining_time": "1:52:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2570, "total_steps": 3402, "loss": 0.0946, "learning_rate": 5.955839029862245e-06, "epoch": 2.2663139329805997, "percentage": 75.54, "elapsed_time": "5:44:17", "remaining_time": "1:51:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2580, "total_steps": 3402, "loss": 0.0926, "learning_rate": 5.820877665006441e-06, "epoch": 2.2751322751322753, "percentage": 75.84, "elapsed_time": "5:45:37", "remaining_time": "1:50:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2590, "total_steps": 3402, "loss": 0.0952, "learning_rate": 5.687202123126832e-06, "epoch": 2.2839506172839505, "percentage": 76.13, "elapsed_time": "5:46:57", "remaining_time": "1:48:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2600, "total_steps": 3402, "loss": 0.0929, "learning_rate": 5.5548245264887515e-06, "epoch": 2.292768959435626, "percentage": 76.43, "elapsed_time": "5:48:17", "remaining_time": "1:47:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2610, "total_steps": 3402, "loss": 0.092, "learning_rate": 5.423756879654343e-06, "epoch": 2.3015873015873014, "percentage": 76.72, "elapsed_time": "5:49:37", "remaining_time": "1:46:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2620, "total_steps": 3402, "loss": 0.0932, "learning_rate": 5.294011068393945e-06, "epoch": 2.310405643738977, "percentage": 77.01, "elapsed_time": "5:50:57", "remaining_time": "1:44:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2630, "total_steps": 3402, "loss": 0.0944, "learning_rate": 5.1655988586082535e-06, "epoch": 2.3192239858906527, "percentage": 77.31, "elapsed_time": "5:52:17", "remaining_time": "1:43:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2640, "total_steps": 3402, "loss": 0.094, "learning_rate": 5.038531895261301e-06, "epoch": 2.328042328042328, "percentage": 77.6, "elapsed_time": "5:53:36", "remaining_time": "1:42:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2650, "total_steps": 3402, "loss": 0.0924, "learning_rate": 4.912821701324479e-06, "epoch": 2.3368606701940036, "percentage": 77.9, "elapsed_time": "5:54:56", "remaining_time": "1:40:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2660, "total_steps": 3402, "loss": 0.0936, "learning_rate": 4.788479676731581e-06, "epoch": 2.3456790123456788, "percentage": 78.19, "elapsed_time": "5:56:16", "remaining_time": "1:39:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2670, "total_steps": 3402, "loss": 0.0935, "learning_rate": 4.665517097344976e-06, "epoch": 2.3544973544973544, "percentage": 78.48, "elapsed_time": "5:57:36", "remaining_time": "1:38:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2680, "total_steps": 3402, "loss": 0.0931, "learning_rate": 4.543945113933099e-06, "epoch": 2.36331569664903, "percentage": 78.78, "elapsed_time": "5:58:56", "remaining_time": "1:36:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2690, "total_steps": 3402, "loss": 0.0937, "learning_rate": 4.423774751159247e-06, "epoch": 2.3721340388007053, "percentage": 79.07, "elapsed_time": "6:00:17", "remaining_time": "1:35:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2700, "total_steps": 3402, "loss": 0.0906, "learning_rate": 4.305016906581811e-06, "epoch": 2.380952380952381, "percentage": 79.37, "elapsed_time": "6:01:39", "remaining_time": "1:34:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2710, "total_steps": 3402, "loss": 0.0919, "learning_rate": 4.1876823496660245e-06, "epoch": 2.3897707231040566, "percentage": 79.66, "elapsed_time": "6:03:01", "remaining_time": "1:32:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2720, "total_steps": 3402, "loss": 0.0929, "learning_rate": 4.071781720807375e-06, "epoch": 2.398589065255732, "percentage": 79.95, "elapsed_time": "6:04:22", "remaining_time": "1:31:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2730, "total_steps": 3402, "loss": 0.0911, "learning_rate": 3.9573255303666554e-06, "epoch": 2.4074074074074074, "percentage": 80.25, "elapsed_time": "6:05:42", "remaining_time": "1:30:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2740, "total_steps": 3402, "loss": 0.0906, "learning_rate": 3.844324157716857e-06, "epoch": 2.416225749559083, "percentage": 80.54, "elapsed_time": "6:07:03", "remaining_time": "1:28:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2750, "total_steps": 3402, "loss": 0.0903, "learning_rate": 3.7327878503019243e-06, "epoch": 2.4250440917107583, "percentage": 80.83, "elapsed_time": "6:08:23", "remaining_time": "1:27:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2760, "total_steps": 3402, "loss": 0.09, "learning_rate": 3.622726722707479e-06, "epoch": 2.433862433862434, "percentage": 81.13, "elapsed_time": "6:09:44", "remaining_time": "1:26:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2770, "total_steps": 3402, "loss": 0.093, "learning_rate": 3.5141507557435504e-06, "epoch": 2.442680776014109, "percentage": 81.42, "elapsed_time": "6:11:05", "remaining_time": "1:24:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2780, "total_steps": 3402, "loss": 0.0897, "learning_rate": 3.4070697955395326e-06, "epoch": 2.451499118165785, "percentage": 81.72, "elapsed_time": "6:12:25", "remaining_time": "1:23:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2790, "total_steps": 3402, "loss": 0.0922, "learning_rate": 3.3014935526512383e-06, "epoch": 2.4603174603174605, "percentage": 82.01, "elapsed_time": "6:13:45", "remaining_time": "1:21:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2800, "total_steps": 3402, "loss": 0.0924, "learning_rate": 3.197431601180343e-06, "epoch": 2.4691358024691357, "percentage": 82.3, "elapsed_time": "6:15:05", "remaining_time": "1:20:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2810, "total_steps": 3402, "loss": 0.0897, "learning_rate": 3.094893377906143e-06, "epoch": 2.4779541446208113, "percentage": 82.6, "elapsed_time": "6:16:25", "remaining_time": "1:19:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2820, "total_steps": 3402, "loss": 0.0901, "learning_rate": 2.9938881814298002e-06, "epoch": 2.4867724867724865, "percentage": 82.89, "elapsed_time": "6:17:44", "remaining_time": "1:17:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2830, "total_steps": 3402, "loss": 0.0918, "learning_rate": 2.894425171331112e-06, "epoch": 2.495590828924162, "percentage": 83.19, "elapsed_time": "6:19:04", "remaining_time": "1:16:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2840, "total_steps": 3402, "loss": 0.0883, "learning_rate": 2.796513367337854e-06, "epoch": 2.504409171075838, "percentage": 83.48, "elapsed_time": "6:20:24", "remaining_time": "1:15:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2850, "total_steps": 3402, "loss": 0.0937, "learning_rate": 2.7001616485078553e-06, "epoch": 2.5132275132275135, "percentage": 83.77, "elapsed_time": "6:21:44", "remaining_time": "1:13:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2860, "total_steps": 3402, "loss": 0.0881, "learning_rate": 2.6053787524238084e-06, "epoch": 2.5220458553791887, "percentage": 84.07, "elapsed_time": "6:23:04", "remaining_time": "1:12:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2870, "total_steps": 3402, "loss": 0.0883, "learning_rate": 2.512173274400904e-06, "epoch": 2.5308641975308643, "percentage": 84.36, "elapsed_time": "6:24:24", "remaining_time": "1:11:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2880, "total_steps": 3402, "loss": 0.0914, "learning_rate": 2.4205536667073572e-06, "epoch": 2.5396825396825395, "percentage": 84.66, "elapsed_time": "6:25:44", "remaining_time": "1:09:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2890, "total_steps": 3402, "loss": 0.0916, "learning_rate": 2.330528237797949e-06, "epoch": 2.548500881834215, "percentage": 84.95, "elapsed_time": "6:27:03", "remaining_time": "1:08:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2900, "total_steps": 3402, "loss": 0.0897, "learning_rate": 2.242105151560554e-06, "epoch": 2.557319223985891, "percentage": 85.24, "elapsed_time": "6:28:23", "remaining_time": "1:07:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2910, "total_steps": 3402, "loss": 0.0883, "learning_rate": 2.1552924265758102e-06, "epoch": 2.566137566137566, "percentage": 85.54, "elapsed_time": "6:29:43", "remaining_time": "1:05:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2920, "total_steps": 3402, "loss": 0.088, "learning_rate": 2.070097935389974e-06, "epoch": 2.5749559082892417, "percentage": 85.83, "elapsed_time": "6:31:03", "remaining_time": "1:04:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2930, "total_steps": 3402, "loss": 0.09, "learning_rate": 1.9865294038009984e-06, "epoch": 2.583774250440917, "percentage": 86.13, "elapsed_time": "6:32:23", "remaining_time": "1:03:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2940, "total_steps": 3402, "loss": 0.0896, "learning_rate": 1.9045944101579073e-06, "epoch": 2.5925925925925926, "percentage": 86.42, "elapsed_time": "6:33:42", "remaining_time": "1:01:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2950, "total_steps": 3402, "loss": 0.0916, "learning_rate": 1.8243003846735807e-06, "epoch": 2.601410934744268, "percentage": 86.71, "elapsed_time": "6:35:02", "remaining_time": "1:00:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2960, "total_steps": 3402, "loss": 0.0882, "learning_rate": 1.7456546087509419e-06, "epoch": 2.6102292768959434, "percentage": 87.01, "elapsed_time": "6:36:22", "remaining_time": "0:59:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2970, "total_steps": 3402, "loss": 0.0892, "learning_rate": 1.6686642143226484e-06, "epoch": 2.619047619047619, "percentage": 87.3, "elapsed_time": "6:37:42", "remaining_time": "0:57:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2980, "total_steps": 3402, "loss": 0.0884, "learning_rate": 1.593336183204346e-06, "epoch": 2.6278659611992943, "percentage": 87.6, "elapsed_time": "6:39:02", "remaining_time": "0:56:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2990, "total_steps": 3402, "loss": 0.0902, "learning_rate": 1.5196773464615167e-06, "epoch": 2.63668430335097, "percentage": 87.89, "elapsed_time": "6:40:22", "remaining_time": "0:55:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3000, "total_steps": 3402, "loss": 0.0915, "learning_rate": 1.4476943837900105e-06, "epoch": 2.6455026455026456, "percentage": 88.18, "elapsed_time": "6:41:41", "remaining_time": "0:53:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3010, "total_steps": 3402, "loss": 0.0904, "learning_rate": 1.377393822910318e-06, "epoch": 2.6543209876543212, "percentage": 88.48, "elapsed_time": "6:43:01", "remaining_time": "0:52:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3020, "total_steps": 3402, "loss": 0.0883, "learning_rate": 1.30878203897558e-06, "epoch": 2.6631393298059964, "percentage": 88.77, "elapsed_time": "6:44:21", "remaining_time": "0:51:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3030, "total_steps": 3402, "loss": 0.0899, "learning_rate": 1.241865253993495e-06, "epoch": 2.671957671957672, "percentage": 89.07, "elapsed_time": "6:45:41", "remaining_time": "0:49:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3040, "total_steps": 3402, "loss": 0.09, "learning_rate": 1.1766495362620555e-06, "epoch": 2.6807760141093473, "percentage": 89.36, "elapsed_time": "6:47:01", "remaining_time": "0:48:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3050, "total_steps": 3402, "loss": 0.089, "learning_rate": 1.1131407998192567e-06, "epoch": 2.689594356261023, "percentage": 89.65, "elapsed_time": "6:48:20", "remaining_time": "0:47:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3060, "total_steps": 3402, "loss": 0.0892, "learning_rate": 1.0513448039067954e-06, "epoch": 2.6984126984126986, "percentage": 89.95, "elapsed_time": "6:49:40", "remaining_time": "0:45:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3070, "total_steps": 3402, "loss": 0.0878, "learning_rate": 9.91267152447779e-07, "epoch": 2.707231040564374, "percentage": 90.24, "elapsed_time": "6:51:00", "remaining_time": "0:44:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3080, "total_steps": 3402, "loss": 0.0899, "learning_rate": 9.329132935385577e-07, "epoch": 2.7160493827160495, "percentage": 90.53, "elapsed_time": "6:52:20", "remaining_time": "0:43:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3090, "total_steps": 3402, "loss": 0.0916, "learning_rate": 8.7628851895466e-07, "epoch": 2.7248677248677247, "percentage": 90.83, "elapsed_time": "6:53:40", "remaining_time": "0:41:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3100, "total_steps": 3402, "loss": 0.0922, "learning_rate": 8.213979636709046e-07, "epoch": 2.7336860670194003, "percentage": 91.12, "elapsed_time": "6:55:00", "remaining_time": "0:40:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3110, "total_steps": 3402, "loss": 0.0888, "learning_rate": 7.682466053957438e-07, "epoch": 2.742504409171076, "percentage": 91.42, "elapsed_time": "6:56:21", "remaining_time": "0:39:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3120, "total_steps": 3402, "loss": 0.0869, "learning_rate": 7.168392641198796e-07, "epoch": 2.751322751322751, "percentage": 91.71, "elapsed_time": "6:57:43", "remaining_time": "0:37:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3130, "total_steps": 3402, "loss": 0.0877, "learning_rate": 6.671806016791337e-07, "epoch": 2.760141093474427, "percentage": 92.0, "elapsed_time": "6:59:04", "remaining_time": "0:36:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3140, "total_steps": 3402, "loss": 0.0869, "learning_rate": 6.192751213317261e-07, "epoch": 2.768959435626102, "percentage": 92.3, "elapsed_time": "7:00:25", "remaining_time": "0:35:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3150, "total_steps": 3402, "loss": 0.0876, "learning_rate": 5.731271673498807e-07, "epoch": 2.7777777777777777, "percentage": 92.59, "elapsed_time": "7:01:46", "remaining_time": "0:33:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3160, "total_steps": 3402, "loss": 0.0867, "learning_rate": 5.287409246258724e-07, "epoch": 2.7865961199294533, "percentage": 92.89, "elapsed_time": "7:03:07", "remaining_time": "0:32:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3170, "total_steps": 3402, "loss": 0.0861, "learning_rate": 4.861204182925238e-07, "epoch": 2.795414462081129, "percentage": 93.18, "elapsed_time": "7:04:28", "remaining_time": "0:31:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3180, "total_steps": 3402, "loss": 0.0897, "learning_rate": 4.452695133581908e-07, "epoch": 2.804232804232804, "percentage": 93.47, "elapsed_time": "7:05:48", "remaining_time": "0:29:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3190, "total_steps": 3402, "loss": 0.0898, "learning_rate": 4.0619191435626647e-07, "epoch": 2.81305114638448, "percentage": 93.77, "elapsed_time": "7:07:08", "remaining_time": "0:28:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3200, "total_steps": 3402, "loss": 0.0892, "learning_rate": 3.688911650092375e-07, "epoch": 2.821869488536155, "percentage": 94.06, "elapsed_time": "7:08:28", "remaining_time": "0:27:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3210, "total_steps": 3402, "loss": 0.0904, "learning_rate": 3.333706479073229e-07, "epoch": 2.8306878306878307, "percentage": 94.36, "elapsed_time": "7:09:49", "remaining_time": "0:25:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3220, "total_steps": 3402, "loss": 0.0915, "learning_rate": 2.996335842017306e-07, "epoch": 2.8395061728395063, "percentage": 94.65, "elapsed_time": "7:11:09", "remaining_time": "0:24:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3230, "total_steps": 3402, "loss": 0.089, "learning_rate": 2.676830333125424e-07, "epoch": 2.8483245149911816, "percentage": 94.94, "elapsed_time": "7:12:29", "remaining_time": "0:23:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3240, "total_steps": 3402, "loss": 0.0868, "learning_rate": 2.3752189265128234e-07, "epoch": 2.857142857142857, "percentage": 95.24, "elapsed_time": "7:13:48", "remaining_time": "0:21:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3250, "total_steps": 3402, "loss": 0.0891, "learning_rate": 2.0915289735816247e-07, "epoch": 2.8659611992945324, "percentage": 95.53, "elapsed_time": "7:15:08", "remaining_time": "0:20:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3260, "total_steps": 3402, "loss": 0.0898, "learning_rate": 1.8257862005404802e-07, "epoch": 2.874779541446208, "percentage": 95.83, "elapsed_time": "7:16:28", "remaining_time": "0:19:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3270, "total_steps": 3402, "loss": 0.0877, "learning_rate": 1.5780147060715955e-07, "epoch": 2.8835978835978837, "percentage": 96.12, "elapsed_time": "7:17:48", "remaining_time": "0:17:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3280, "total_steps": 3402, "loss": 0.0911, "learning_rate": 1.3482369591453882e-07, "epoch": 2.892416225749559, "percentage": 96.41, "elapsed_time": "7:19:08", "remaining_time": "0:16:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3290, "total_steps": 3402, "loss": 0.0909, "learning_rate": 1.1364737969829176e-07, "epoch": 2.9012345679012346, "percentage": 96.71, "elapsed_time": "7:20:27", "remaining_time": "0:14:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3300, "total_steps": 3402, "loss": 0.0862, "learning_rate": 9.427444231662863e-08, "epoch": 2.91005291005291, "percentage": 97.0, "elapsed_time": "7:21:47", "remaining_time": "0:13:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3310, "total_steps": 3402, "loss": 0.0875, "learning_rate": 7.670664058970545e-08, "epoch": 2.9188712522045854, "percentage": 97.3, "elapsed_time": "7:23:07", "remaining_time": "0:12:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3320, "total_steps": 3402, "loss": 0.0886, "learning_rate": 6.094556764032922e-08, "epoch": 2.927689594356261, "percentage": 97.59, "elapsed_time": "7:24:27", "remaining_time": "0:10:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3330, "total_steps": 3402, "loss": 0.0865, "learning_rate": 4.699265274946907e-08, "epoch": 2.9365079365079367, "percentage": 97.88, "elapsed_time": "7:25:47", "remaining_time": "0:09:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3340, "total_steps": 3402, "loss": 0.0889, "learning_rate": 3.484916122664883e-08, "epoch": 2.945326278659612, "percentage": 98.18, "elapsed_time": "7:27:06", "remaining_time": "0:08:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3350, "total_steps": 3402, "loss": 0.0899, "learning_rate": 2.4516194295205466e-08, "epoch": 2.9541446208112876, "percentage": 98.47, "elapsed_time": "7:28:26", "remaining_time": "0:06:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3360, "total_steps": 3402, "loss": 0.0895, "learning_rate": 1.5994688992424513e-08, "epoch": 2.962962962962963, "percentage": 98.77, "elapsed_time": "7:29:46", "remaining_time": "0:05:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3370, "total_steps": 3402, "loss": 0.0886, "learning_rate": 9.285418084565845e-09, "epoch": 2.9717813051146384, "percentage": 99.06, "elapsed_time": "7:31:06", "remaining_time": "0:04:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3380, "total_steps": 3402, "loss": 0.0886, "learning_rate": 4.3889899967797244e-09, "epoch": 2.980599647266314, "percentage": 99.35, "elapsed_time": "7:32:25", "remaining_time": "0:02:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3390, "total_steps": 3402, "loss": 0.0888, "learning_rate": 1.3058487579420409e-09, "epoch": 2.9894179894179893, "percentage": 99.65, "elapsed_time": "7:33:45", "remaining_time": "0:01:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3400, "total_steps": 3402, "loss": 0.0869, "learning_rate": 3.627396038208275e-11, "epoch": 2.998236331569665, "percentage": 99.94, "elapsed_time": "7:35:05", "remaining_time": "0:00:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3402, "total_steps": 3402, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "7:36:20", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0}