|
{"current_steps": 5, "total_steps": 1119, "loss": 1.2958, "learning_rate": 4.4642857142857147e-07, "epoch": 0.013377926421404682, "percentage": 0.45, "elapsed_time": "0:01:08", "remaining_time": "4:15:35"} |
|
{"current_steps": 10, "total_steps": 1119, "loss": 1.2627, "learning_rate": 8.928571428571429e-07, "epoch": 0.026755852842809364, "percentage": 0.89, "elapsed_time": "0:02:17", "remaining_time": "4:14:43"} |
|
{"current_steps": 15, "total_steps": 1119, "loss": 1.2874, "learning_rate": 1.3392857142857143e-06, "epoch": 0.04013377926421405, "percentage": 1.34, "elapsed_time": "0:03:19", "remaining_time": "4:04:48"} |
|
{"current_steps": 20, "total_steps": 1119, "loss": 1.2337, "learning_rate": 1.7857142857142859e-06, "epoch": 0.05351170568561873, "percentage": 1.79, "elapsed_time": "0:04:16", "remaining_time": "3:54:31"} |
|
{"current_steps": 25, "total_steps": 1119, "loss": 1.2754, "learning_rate": 2.2321428571428573e-06, "epoch": 0.06688963210702341, "percentage": 2.23, "elapsed_time": "0:05:11", "remaining_time": "3:47:31"} |
|
{"current_steps": 30, "total_steps": 1119, "loss": 1.238, "learning_rate": 2.6785714285714285e-06, "epoch": 0.0802675585284281, "percentage": 2.68, "elapsed_time": "0:06:12", "remaining_time": "3:45:30"} |
|
{"current_steps": 35, "total_steps": 1119, "loss": 1.2122, "learning_rate": 3.125e-06, "epoch": 0.09364548494983277, "percentage": 3.13, "elapsed_time": "0:07:08", "remaining_time": "3:41:07"} |
|
{"current_steps": 40, "total_steps": 1119, "loss": 1.1821, "learning_rate": 3.5714285714285718e-06, "epoch": 0.10702341137123746, "percentage": 3.57, "elapsed_time": "0:08:07", "remaining_time": "3:39:04"} |
|
{"current_steps": 45, "total_steps": 1119, "loss": 1.1503, "learning_rate": 4.017857142857143e-06, "epoch": 0.12040133779264214, "percentage": 4.02, "elapsed_time": "0:09:05", "remaining_time": "3:37:05"} |
|
{"current_steps": 50, "total_steps": 1119, "loss": 1.1426, "learning_rate": 4.464285714285715e-06, "epoch": 0.13377926421404682, "percentage": 4.47, "elapsed_time": "0:10:02", "remaining_time": "3:34:40"} |
|
{"current_steps": 55, "total_steps": 1119, "loss": 1.1012, "learning_rate": 4.910714285714286e-06, "epoch": 0.14715719063545152, "percentage": 4.92, "elapsed_time": "0:10:59", "remaining_time": "3:32:28"} |
|
{"current_steps": 60, "total_steps": 1119, "loss": 1.1423, "learning_rate": 5.357142857142857e-06, "epoch": 0.1605351170568562, "percentage": 5.36, "elapsed_time": "0:11:55", "remaining_time": "3:30:32"} |
|
{"current_steps": 65, "total_steps": 1119, "loss": 1.1462, "learning_rate": 5.8035714285714295e-06, "epoch": 0.17391304347826086, "percentage": 5.81, "elapsed_time": "0:12:50", "remaining_time": "3:28:21"} |
|
{"current_steps": 70, "total_steps": 1119, "loss": 1.105, "learning_rate": 6.25e-06, "epoch": 0.18729096989966554, "percentage": 6.26, "elapsed_time": "0:13:56", "remaining_time": "3:28:57"} |
|
{"current_steps": 75, "total_steps": 1119, "loss": 1.0921, "learning_rate": 6.696428571428571e-06, "epoch": 0.20066889632107024, "percentage": 6.7, "elapsed_time": "0:14:55", "remaining_time": "3:27:43"} |
|
{"current_steps": 80, "total_steps": 1119, "loss": 1.109, "learning_rate": 7.1428571428571436e-06, "epoch": 0.2140468227424749, "percentage": 7.15, "elapsed_time": "0:15:55", "remaining_time": "3:26:53"} |
|
{"current_steps": 85, "total_steps": 1119, "loss": 1.0625, "learning_rate": 7.589285714285714e-06, "epoch": 0.22742474916387959, "percentage": 7.6, "elapsed_time": "0:17:00", "remaining_time": "3:26:54"} |
|
{"current_steps": 90, "total_steps": 1119, "loss": 1.0792, "learning_rate": 8.035714285714286e-06, "epoch": 0.2408026755852843, "percentage": 8.04, "elapsed_time": "0:18:00", "remaining_time": "3:25:51"} |
|
{"current_steps": 95, "total_steps": 1119, "loss": 1.062, "learning_rate": 8.482142857142858e-06, "epoch": 0.25418060200668896, "percentage": 8.49, "elapsed_time": "0:18:59", "remaining_time": "3:24:44"} |
|
{"current_steps": 100, "total_steps": 1119, "loss": 1.042, "learning_rate": 8.92857142857143e-06, "epoch": 0.26755852842809363, "percentage": 8.94, "elapsed_time": "0:19:59", "remaining_time": "3:23:45"} |
|
{"current_steps": 100, "total_steps": 1119, "eval_loss": 1.0254441499710083, "epoch": 0.26755852842809363, "percentage": 8.94, "elapsed_time": "0:22:29", "remaining_time": "3:49:15"} |
|
{"current_steps": 105, "total_steps": 1119, "loss": 1.0349, "learning_rate": 9.375000000000001e-06, "epoch": 0.2809364548494983, "percentage": 9.38, "elapsed_time": "0:23:26", "remaining_time": "3:46:23"} |
|
{"current_steps": 110, "total_steps": 1119, "loss": 1.0631, "learning_rate": 9.821428571428573e-06, "epoch": 0.29431438127090304, "percentage": 9.83, "elapsed_time": "0:24:23", "remaining_time": "3:43:40"} |
|
{"current_steps": 115, "total_steps": 1119, "loss": 1.0234, "learning_rate": 9.99978101208322e-06, "epoch": 0.3076923076923077, "percentage": 10.28, "elapsed_time": "0:25:21", "remaining_time": "3:41:23"} |
|
{"current_steps": 120, "total_steps": 1119, "loss": 1.0557, "learning_rate": 9.99844282205785e-06, "epoch": 0.3210702341137124, "percentage": 10.72, "elapsed_time": "0:26:22", "remaining_time": "3:39:30"} |
|
{"current_steps": 125, "total_steps": 1119, "loss": 1.0582, "learning_rate": 9.995888427170226e-06, "epoch": 0.33444816053511706, "percentage": 11.17, "elapsed_time": "0:27:20", "remaining_time": "3:37:29"} |
|
{"current_steps": 130, "total_steps": 1119, "loss": 1.0259, "learning_rate": 9.992118448947408e-06, "epoch": 0.34782608695652173, "percentage": 11.62, "elapsed_time": "0:28:20", "remaining_time": "3:35:38"} |
|
{"current_steps": 135, "total_steps": 1119, "loss": 1.0689, "learning_rate": 9.987133804688247e-06, "epoch": 0.3612040133779264, "percentage": 12.06, "elapsed_time": "0:29:20", "remaining_time": "3:33:54"} |
|
{"current_steps": 140, "total_steps": 1119, "loss": 1.0185, "learning_rate": 9.98093570724018e-06, "epoch": 0.3745819397993311, "percentage": 12.51, "elapsed_time": "0:30:21", "remaining_time": "3:32:17"} |
|
{"current_steps": 145, "total_steps": 1119, "loss": 1.0098, "learning_rate": 9.973525664704137e-06, "epoch": 0.3879598662207358, "percentage": 12.96, "elapsed_time": "0:31:19", "remaining_time": "3:30:24"} |
|
{"current_steps": 150, "total_steps": 1119, "loss": 1.0266, "learning_rate": 9.964905480067585e-06, "epoch": 0.4013377926421405, "percentage": 13.4, "elapsed_time": "0:32:23", "remaining_time": "3:29:15"} |
|
{"current_steps": 155, "total_steps": 1119, "loss": 1.0324, "learning_rate": 9.955077250765833e-06, "epoch": 0.41471571906354515, "percentage": 13.85, "elapsed_time": "0:33:22", "remaining_time": "3:27:31"} |
|
{"current_steps": 160, "total_steps": 1119, "loss": 1.0481, "learning_rate": 9.944043368171692e-06, "epoch": 0.4280936454849498, "percentage": 14.3, "elapsed_time": "0:34:22", "remaining_time": "3:26:02"} |
|
{"current_steps": 165, "total_steps": 1119, "loss": 1.0721, "learning_rate": 9.931806517013612e-06, "epoch": 0.4414715719063545, "percentage": 14.75, "elapsed_time": "0:35:23", "remaining_time": "3:24:40"} |
|
{"current_steps": 170, "total_steps": 1119, "loss": 1.0181, "learning_rate": 9.91836967472245e-06, "epoch": 0.45484949832775917, "percentage": 15.19, "elapsed_time": "0:36:21", "remaining_time": "3:22:56"} |
|
{"current_steps": 175, "total_steps": 1119, "loss": 1.0196, "learning_rate": 9.903736110707001e-06, "epoch": 0.4682274247491639, "percentage": 15.64, "elapsed_time": "0:37:17", "remaining_time": "3:21:07"} |
|
{"current_steps": 180, "total_steps": 1119, "loss": 1.0617, "learning_rate": 9.8879093855585e-06, "epoch": 0.4816053511705686, "percentage": 16.09, "elapsed_time": "0:38:14", "remaining_time": "3:19:27"} |
|
{"current_steps": 185, "total_steps": 1119, "loss": 1.0196, "learning_rate": 9.870893350184274e-06, "epoch": 0.49498327759197325, "percentage": 16.53, "elapsed_time": "0:39:12", "remaining_time": "3:17:56"} |
|
{"current_steps": 190, "total_steps": 1119, "loss": 1.0577, "learning_rate": 9.852692144870746e-06, "epoch": 0.5083612040133779, "percentage": 16.98, "elapsed_time": "0:40:09", "remaining_time": "3:16:19"} |
|
{"current_steps": 195, "total_steps": 1119, "loss": 1.036, "learning_rate": 9.833310198276037e-06, "epoch": 0.5217391304347826, "percentage": 17.43, "elapsed_time": "0:41:06", "remaining_time": "3:14:46"} |
|
{"current_steps": 200, "total_steps": 1119, "loss": 0.9872, "learning_rate": 9.812752226352405e-06, "epoch": 0.5351170568561873, "percentage": 17.87, "elapsed_time": "0:42:01", "remaining_time": "3:13:08"} |
|
{"current_steps": 200, "total_steps": 1119, "eval_loss": 1.0063743591308594, "epoch": 0.5351170568561873, "percentage": 17.87, "elapsed_time": "0:44:31", "remaining_time": "3:24:36"} |
|
{"current_steps": 205, "total_steps": 1119, "loss": 1.0283, "learning_rate": 9.791023231198757e-06, "epoch": 0.5484949832775919, "percentage": 18.32, "elapsed_time": "0:47:21", "remaining_time": "3:31:10"} |
|
{"current_steps": 210, "total_steps": 1119, "loss": 1.0278, "learning_rate": 9.768128499843579e-06, "epoch": 0.5618729096989966, "percentage": 18.77, "elapsed_time": "0:48:21", "remaining_time": "3:29:17"} |
|
{"current_steps": 215, "total_steps": 1119, "loss": 1.0498, "learning_rate": 9.744073602958493e-06, "epoch": 0.5752508361204013, "percentage": 19.21, "elapsed_time": "0:49:21", "remaining_time": "3:27:31"} |
|
{"current_steps": 220, "total_steps": 1119, "loss": 1.0187, "learning_rate": 9.718864393502828e-06, "epoch": 0.5886287625418061, "percentage": 19.66, "elapsed_time": "0:50:21", "remaining_time": "3:25:47"} |
|
{"current_steps": 225, "total_steps": 1119, "loss": 1.0398, "learning_rate": 9.692507005299499e-06, "epoch": 0.6020066889632107, "percentage": 20.11, "elapsed_time": "0:51:22", "remaining_time": "3:24:07"} |
|
{"current_steps": 230, "total_steps": 1119, "loss": 1.042, "learning_rate": 9.665007851542541e-06, "epoch": 0.6153846153846154, "percentage": 20.55, "elapsed_time": "0:52:23", "remaining_time": "3:22:28"} |
|
{"current_steps": 235, "total_steps": 1119, "loss": 0.9689, "learning_rate": 9.636373623236672e-06, "epoch": 0.6287625418060201, "percentage": 21.0, "elapsed_time": "0:53:22", "remaining_time": "3:20:45"} |
|
{"current_steps": 240, "total_steps": 1119, "loss": 0.9335, "learning_rate": 9.60661128756926e-06, "epoch": 0.6421404682274248, "percentage": 21.45, "elapsed_time": "0:54:29", "remaining_time": "3:19:33"} |
|
{"current_steps": 245, "total_steps": 1119, "loss": 1.0172, "learning_rate": 9.575728086215093e-06, "epoch": 0.6555183946488294, "percentage": 21.89, "elapsed_time": "0:55:28", "remaining_time": "3:17:54"} |
|
{"current_steps": 250, "total_steps": 1119, "loss": 0.9927, "learning_rate": 9.543731533574349e-06, "epoch": 0.6688963210702341, "percentage": 22.34, "elapsed_time": "0:56:27", "remaining_time": "3:16:16"} |
|
{"current_steps": 255, "total_steps": 1119, "loss": 1.0104, "learning_rate": 9.510629414944229e-06, "epoch": 0.6822742474916388, "percentage": 22.79, "elapsed_time": "0:57:22", "remaining_time": "3:14:23"} |
|
{"current_steps": 260, "total_steps": 1119, "loss": 1.0316, "learning_rate": 9.47642978462465e-06, "epoch": 0.6956521739130435, "percentage": 23.24, "elapsed_time": "0:58:21", "remaining_time": "3:12:50"} |
|
{"current_steps": 265, "total_steps": 1119, "loss": 1.0672, "learning_rate": 9.441140963958515e-06, "epoch": 0.7090301003344481, "percentage": 23.68, "elapsed_time": "0:59:17", "remaining_time": "3:11:05"} |
|
{"current_steps": 270, "total_steps": 1119, "loss": 1.0328, "learning_rate": 9.404771539306978e-06, "epoch": 0.7224080267558528, "percentage": 24.13, "elapsed_time": "1:00:18", "remaining_time": "3:09:39"} |
|
{"current_steps": 275, "total_steps": 1119, "loss": 0.9912, "learning_rate": 9.367330359960239e-06, "epoch": 0.7357859531772575, "percentage": 24.58, "elapsed_time": "1:01:21", "remaining_time": "3:08:17"} |
|
{"current_steps": 280, "total_steps": 1119, "loss": 1.014, "learning_rate": 9.328826535984374e-06, "epoch": 0.7491638795986622, "percentage": 25.02, "elapsed_time": "1:02:19", "remaining_time": "3:06:45"} |
|
{"current_steps": 285, "total_steps": 1119, "loss": 0.9737, "learning_rate": 9.289269436004692e-06, "epoch": 0.7625418060200669, "percentage": 25.47, "elapsed_time": "1:03:20", "remaining_time": "3:05:21"} |
|
{"current_steps": 290, "total_steps": 1119, "loss": 0.9971, "learning_rate": 9.248668684926199e-06, "epoch": 0.7759197324414716, "percentage": 25.92, "elapsed_time": "1:04:24", "remaining_time": "3:04:06"} |
|
{"current_steps": 295, "total_steps": 1119, "loss": 1.0176, "learning_rate": 9.207034161591689e-06, "epoch": 0.7892976588628763, "percentage": 26.36, "elapsed_time": "1:05:30", "remaining_time": "3:02:59"} |
|
{"current_steps": 300, "total_steps": 1119, "loss": 1.008, "learning_rate": 9.16437599637807e-06, "epoch": 0.802675585284281, "percentage": 26.81, "elapsed_time": "1:06:29", "remaining_time": "3:01:30"} |
|
{"current_steps": 300, "total_steps": 1119, "eval_loss": 0.993434488773346, "epoch": 0.802675585284281, "percentage": 26.81, "elapsed_time": "1:08:59", "remaining_time": "3:08:21"} |
|
{"current_steps": 305, "total_steps": 1119, "loss": 1.0055, "learning_rate": 9.120704568731455e-06, "epoch": 0.8160535117056856, "percentage": 27.26, "elapsed_time": "1:10:05", "remaining_time": "3:07:05"} |
|
{"current_steps": 310, "total_steps": 1119, "loss": 0.9808, "learning_rate": 9.07603050464169e-06, "epoch": 0.8294314381270903, "percentage": 27.7, "elapsed_time": "1:11:03", "remaining_time": "3:05:25"} |
|
{"current_steps": 315, "total_steps": 1119, "loss": 1.0094, "learning_rate": 9.030364674056853e-06, "epoch": 0.842809364548495, "percentage": 28.15, "elapsed_time": "1:12:08", "remaining_time": "3:04:07"} |
|
{"current_steps": 320, "total_steps": 1119, "loss": 0.9978, "learning_rate": 8.983718188238428e-06, "epoch": 0.8561872909698997, "percentage": 28.6, "elapsed_time": "1:13:07", "remaining_time": "3:02:36"} |
|
{"current_steps": 325, "total_steps": 1119, "loss": 0.9654, "learning_rate": 8.936102397057737e-06, "epoch": 0.8695652173913043, "percentage": 29.04, "elapsed_time": "1:14:06", "remaining_time": "3:01:03"} |
|
{"current_steps": 330, "total_steps": 1119, "loss": 0.9949, "learning_rate": 8.88752888623434e-06, "epoch": 0.882943143812709, "percentage": 29.49, "elapsed_time": "1:15:02", "remaining_time": "2:59:24"} |
|
{"current_steps": 335, "total_steps": 1119, "loss": 1.0466, "learning_rate": 8.838009474517022e-06, "epoch": 0.8963210702341137, "percentage": 29.94, "elapsed_time": "1:16:03", "remaining_time": "2:57:59"} |
|
{"current_steps": 340, "total_steps": 1119, "loss": 1.0075, "learning_rate": 8.787556210808101e-06, "epoch": 0.9096989966555183, "percentage": 30.38, "elapsed_time": "1:17:01", "remaining_time": "2:56:28"} |
|
{"current_steps": 345, "total_steps": 1119, "loss": 1.0351, "learning_rate": 8.736181371231728e-06, "epoch": 0.9230769230769231, "percentage": 30.83, "elapsed_time": "1:17:58", "remaining_time": "2:54:55"} |
|
{"current_steps": 350, "total_steps": 1119, "loss": 1.0235, "learning_rate": 8.683897456146897e-06, "epoch": 0.9364548494983278, "percentage": 31.28, "elapsed_time": "1:18:55", "remaining_time": "2:53:25"} |
|
{"current_steps": 355, "total_steps": 1119, "loss": 0.9868, "learning_rate": 8.630717187105902e-06, "epoch": 0.9498327759197325, "percentage": 31.72, "elapsed_time": "1:19:52", "remaining_time": "2:51:53"} |
|
{"current_steps": 360, "total_steps": 1119, "loss": 1.0067, "learning_rate": 8.576653503758964e-06, "epoch": 0.9632107023411371, "percentage": 32.17, "elapsed_time": "1:20:53", "remaining_time": "2:50:32"} |
|
{"current_steps": 365, "total_steps": 1119, "loss": 0.9743, "learning_rate": 8.52171956070581e-06, "epoch": 0.9765886287625418, "percentage": 32.62, "elapsed_time": "1:21:51", "remaining_time": "2:49:05"} |
|
{"current_steps": 370, "total_steps": 1119, "loss": 0.96, "learning_rate": 8.465928724294923e-06, "epoch": 0.9899665551839465, "percentage": 33.07, "elapsed_time": "1:22:45", "remaining_time": "2:47:31"} |
|
{"current_steps": 375, "total_steps": 1119, "loss": 0.9897, "learning_rate": 8.409294569371293e-06, "epoch": 1.0033444816053512, "percentage": 33.51, "elapsed_time": "1:23:41", "remaining_time": "2:46:02"} |
|
{"current_steps": 380, "total_steps": 1119, "loss": 0.7912, "learning_rate": 8.351830875973436e-06, "epoch": 1.0167224080267558, "percentage": 33.96, "elapsed_time": "1:24:44", "remaining_time": "2:44:47"} |
|
{"current_steps": 385, "total_steps": 1119, "loss": 0.7677, "learning_rate": 8.293551625980468e-06, "epoch": 1.0301003344481605, "percentage": 34.41, "elapsed_time": "1:25:38", "remaining_time": "2:43:16"} |
|
{"current_steps": 390, "total_steps": 1119, "loss": 0.7457, "learning_rate": 8.234470999710086e-06, "epoch": 1.0434782608695652, "percentage": 34.85, "elapsed_time": "1:26:32", "remaining_time": "2:41:46"} |
|
{"current_steps": 395, "total_steps": 1119, "loss": 0.7489, "learning_rate": 8.174603372468259e-06, "epoch": 1.0568561872909699, "percentage": 35.3, "elapsed_time": "1:27:28", "remaining_time": "2:40:20"} |
|
{"current_steps": 400, "total_steps": 1119, "loss": 0.7473, "learning_rate": 8.113963311051474e-06, "epoch": 1.0702341137123745, "percentage": 35.75, "elapsed_time": "1:28:30", "remaining_time": "2:39:05"} |
|
{"current_steps": 400, "total_steps": 1119, "eval_loss": 1.0105931758880615, "epoch": 1.0702341137123745, "percentage": 35.75, "elapsed_time": "1:31:00", "remaining_time": "2:43:34"} |
|
{"current_steps": 405, "total_steps": 1119, "loss": 0.78, "learning_rate": 8.052565570202394e-06, "epoch": 1.0836120401337792, "percentage": 36.19, "elapsed_time": "1:33:52", "remaining_time": "2:45:30"} |
|
{"current_steps": 410, "total_steps": 1119, "loss": 0.7339, "learning_rate": 7.990425089019774e-06, "epoch": 1.0969899665551839, "percentage": 36.64, "elapsed_time": "1:34:48", "remaining_time": "2:43:57"} |
|
{"current_steps": 415, "total_steps": 1119, "loss": 0.775, "learning_rate": 7.927556987323534e-06, "epoch": 1.1103678929765886, "percentage": 37.09, "elapsed_time": "1:35:47", "remaining_time": "2:42:30"} |
|
{"current_steps": 420, "total_steps": 1119, "loss": 0.7532, "learning_rate": 7.86397656197586e-06, "epoch": 1.1237458193979932, "percentage": 37.53, "elapsed_time": "1:36:44", "remaining_time": "2:41:00"} |
|
{"current_steps": 425, "total_steps": 1119, "loss": 0.792, "learning_rate": 7.799699283159199e-06, "epoch": 1.137123745819398, "percentage": 37.98, "elapsed_time": "1:37:41", "remaining_time": "2:39:31"} |
|
{"current_steps": 430, "total_steps": 1119, "loss": 0.7748, "learning_rate": 7.734740790612137e-06, "epoch": 1.1505016722408028, "percentage": 38.43, "elapsed_time": "1:38:36", "remaining_time": "2:38:00"} |
|
{"current_steps": 435, "total_steps": 1119, "loss": 0.7524, "learning_rate": 7.669116889823955e-06, "epoch": 1.1638795986622075, "percentage": 38.87, "elapsed_time": "1:39:39", "remaining_time": "2:36:42"} |
|
{"current_steps": 440, "total_steps": 1119, "loss": 0.7835, "learning_rate": 7.602843548188915e-06, "epoch": 1.1772575250836121, "percentage": 39.32, "elapsed_time": "1:40:36", "remaining_time": "2:35:15"} |
|
{"current_steps": 445, "total_steps": 1119, "loss": 0.7696, "learning_rate": 7.5359368911211115e-06, "epoch": 1.1906354515050168, "percentage": 39.77, "elapsed_time": "1:41:35", "remaining_time": "2:33:52"} |
|
{"current_steps": 450, "total_steps": 1119, "loss": 0.7652, "learning_rate": 7.468413198130891e-06, "epoch": 1.2040133779264215, "percentage": 40.21, "elapsed_time": "1:42:31", "remaining_time": "2:32:25"} |
|
{"current_steps": 455, "total_steps": 1119, "loss": 0.7223, "learning_rate": 7.400288898863779e-06, "epoch": 1.2173913043478262, "percentage": 40.66, "elapsed_time": "1:43:34", "remaining_time": "2:31:08"} |
|
{"current_steps": 460, "total_steps": 1119, "loss": 0.7756, "learning_rate": 7.3315805691028615e-06, "epoch": 1.2307692307692308, "percentage": 41.11, "elapsed_time": "1:44:32", "remaining_time": "2:29:46"} |
|
{"current_steps": 465, "total_steps": 1119, "loss": 0.8294, "learning_rate": 7.262304926735633e-06, "epoch": 1.2441471571906355, "percentage": 41.55, "elapsed_time": "1:45:30", "remaining_time": "2:28:23"} |
|
{"current_steps": 470, "total_steps": 1119, "loss": 0.7392, "learning_rate": 7.192478827686242e-06, "epoch": 1.2575250836120402, "percentage": 42.0, "elapsed_time": "1:46:24", "remaining_time": "2:26:56"} |
|
{"current_steps": 475, "total_steps": 1119, "loss": 0.7595, "learning_rate": 7.122119261814175e-06, "epoch": 1.2709030100334449, "percentage": 42.45, "elapsed_time": "1:47:26", "remaining_time": "2:25:39"} |
|
{"current_steps": 480, "total_steps": 1119, "loss": 0.7432, "learning_rate": 7.0512433487803245e-06, "epoch": 1.2842809364548495, "percentage": 42.9, "elapsed_time": "1:48:28", "remaining_time": "2:24:23"} |
|
{"current_steps": 485, "total_steps": 1119, "loss": 0.7664, "learning_rate": 6.979868333881499e-06, "epoch": 1.2976588628762542, "percentage": 43.34, "elapsed_time": "1:49:28", "remaining_time": "2:23:06"} |
|
{"current_steps": 490, "total_steps": 1119, "loss": 0.7236, "learning_rate": 6.908011583854353e-06, "epoch": 1.3110367892976589, "percentage": 43.79, "elapsed_time": "1:50:25", "remaining_time": "2:21:44"} |
|
{"current_steps": 495, "total_steps": 1119, "loss": 0.762, "learning_rate": 6.835690582649762e-06, "epoch": 1.3244147157190636, "percentage": 44.24, "elapsed_time": "1:51:23", "remaining_time": "2:20:24"} |
|
{"current_steps": 500, "total_steps": 1119, "loss": 0.7788, "learning_rate": 6.762922927178696e-06, "epoch": 1.3377926421404682, "percentage": 44.68, "elapsed_time": "1:52:21", "remaining_time": "2:19:05"} |
|
{"current_steps": 500, "total_steps": 1119, "eval_loss": 1.0046015977859497, "epoch": 1.3377926421404682, "percentage": 44.68, "elapsed_time": "1:54:50", "remaining_time": "2:22:10"} |
|
{"current_steps": 505, "total_steps": 1119, "loss": 0.7847, "learning_rate": 6.689726323030582e-06, "epoch": 1.351170568561873, "percentage": 45.13, "elapsed_time": "1:55:52", "remaining_time": "2:20:52"} |
|
{"current_steps": 510, "total_steps": 1119, "loss": 0.7676, "learning_rate": 6.6161185801652495e-06, "epoch": 1.3645484949832776, "percentage": 45.58, "elapsed_time": "1:56:56", "remaining_time": "2:19:38"} |
|
{"current_steps": 515, "total_steps": 1119, "loss": 0.7217, "learning_rate": 6.5421176085794645e-06, "epoch": 1.3779264214046822, "percentage": 46.02, "elapsed_time": "1:57:50", "remaining_time": "2:18:12"} |
|
{"current_steps": 520, "total_steps": 1119, "loss": 0.7707, "learning_rate": 6.467741413949124e-06, "epoch": 1.391304347826087, "percentage": 46.47, "elapsed_time": "1:58:53", "remaining_time": "2:16:56"} |
|
{"current_steps": 525, "total_steps": 1119, "loss": 0.7755, "learning_rate": 6.39300809324818e-06, "epoch": 1.4046822742474916, "percentage": 46.92, "elapsed_time": "1:59:53", "remaining_time": "2:15:39"} |
|
{"current_steps": 530, "total_steps": 1119, "loss": 0.7635, "learning_rate": 6.3179358303453386e-06, "epoch": 1.4180602006688963, "percentage": 47.36, "elapsed_time": "2:00:56", "remaining_time": "2:14:24"} |
|
{"current_steps": 535, "total_steps": 1119, "loss": 0.7505, "learning_rate": 6.242542891579619e-06, "epoch": 1.431438127090301, "percentage": 47.81, "elapsed_time": "2:01:59", "remaining_time": "2:13:09"} |
|
{"current_steps": 540, "total_steps": 1119, "loss": 0.7029, "learning_rate": 6.1668476213158525e-06, "epoch": 1.4448160535117056, "percentage": 48.26, "elapsed_time": "2:02:53", "remaining_time": "2:11:45"} |
|
{"current_steps": 545, "total_steps": 1119, "loss": 0.7637, "learning_rate": 6.090868437481185e-06, "epoch": 1.4581939799331103, "percentage": 48.7, "elapsed_time": "2:03:50", "remaining_time": "2:10:25"} |
|
{"current_steps": 550, "total_steps": 1119, "loss": 0.8025, "learning_rate": 6.0146238270836895e-06, "epoch": 1.471571906354515, "percentage": 49.15, "elapsed_time": "2:04:48", "remaining_time": "2:09:06"} |
|
{"current_steps": 555, "total_steps": 1119, "loss": 0.7436, "learning_rate": 5.938132341714173e-06, "epoch": 1.4849498327759196, "percentage": 49.6, "elapsed_time": "2:05:48", "remaining_time": "2:07:50"} |
|
{"current_steps": 560, "total_steps": 1119, "loss": 0.7566, "learning_rate": 5.861412593032247e-06, "epoch": 1.4983277591973243, "percentage": 50.04, "elapsed_time": "2:06:47", "remaining_time": "2:06:33"} |
|
{"current_steps": 565, "total_steps": 1119, "loss": 0.7137, "learning_rate": 5.7844832482378245e-06, "epoch": 1.511705685618729, "percentage": 50.49, "elapsed_time": "2:07:49", "remaining_time": "2:05:19"} |
|
{"current_steps": 570, "total_steps": 1119, "loss": 0.7716, "learning_rate": 5.7073630255290515e-06, "epoch": 1.5250836120401337, "percentage": 50.94, "elapsed_time": "2:08:52", "remaining_time": "2:04:07"} |
|
{"current_steps": 575, "total_steps": 1119, "loss": 0.7631, "learning_rate": 5.630070689547875e-06, "epoch": 1.5384615384615383, "percentage": 51.39, "elapsed_time": "2:10:00", "remaining_time": "2:02:59"} |
|
{"current_steps": 580, "total_steps": 1119, "loss": 0.7737, "learning_rate": 5.552625046814283e-06, "epoch": 1.551839464882943, "percentage": 51.83, "elapsed_time": "2:11:05", "remaining_time": "2:01:49"} |
|
{"current_steps": 585, "total_steps": 1119, "loss": 0.7399, "learning_rate": 5.475044941150361e-06, "epoch": 1.5652173913043477, "percentage": 52.28, "elapsed_time": "2:12:07", "remaining_time": "2:00:35"} |
|
{"current_steps": 590, "total_steps": 1119, "loss": 0.7521, "learning_rate": 5.397349249095279e-06, "epoch": 1.5785953177257523, "percentage": 52.73, "elapsed_time": "2:13:05", "remaining_time": "1:59:19"} |
|
{"current_steps": 595, "total_steps": 1119, "loss": 0.7779, "learning_rate": 5.319556875312313e-06, "epoch": 1.5919732441471572, "percentage": 53.17, "elapsed_time": "2:14:03", "remaining_time": "1:58:03"} |
|
{"current_steps": 600, "total_steps": 1119, "loss": 0.7246, "learning_rate": 5.241686747989023e-06, "epoch": 1.605351170568562, "percentage": 53.62, "elapsed_time": "2:15:01", "remaining_time": "1:56:47"} |
|
{"current_steps": 600, "total_steps": 1119, "eval_loss": 1.00019371509552, "epoch": 1.605351170568562, "percentage": 53.62, "elapsed_time": "2:17:32", "remaining_time": "1:58:58"} |
|
{"current_steps": 605, "total_steps": 1119, "loss": 0.7553, "learning_rate": 5.163757814231708e-06, "epoch": 1.6187290969899666, "percentage": 54.07, "elapsed_time": "2:20:24", "remaining_time": "1:59:17"} |
|
{"current_steps": 610, "total_steps": 1119, "loss": 0.7372, "learning_rate": 5.085789035455256e-06, "epoch": 1.6321070234113713, "percentage": 54.51, "elapsed_time": "2:21:23", "remaining_time": "1:57:58"} |
|
{"current_steps": 615, "total_steps": 1119, "loss": 0.7422, "learning_rate": 5.007799382769516e-06, "epoch": 1.645484949832776, "percentage": 54.96, "elapsed_time": "2:22:22", "remaining_time": "1:56:41"} |
|
{"current_steps": 620, "total_steps": 1119, "loss": 0.7515, "learning_rate": 4.929807832363308e-06, "epoch": 1.6588628762541806, "percentage": 55.41, "elapsed_time": "2:23:21", "remaining_time": "1:55:23"} |
|
{"current_steps": 625, "total_steps": 1119, "loss": 0.758, "learning_rate": 4.8518333608872015e-06, "epoch": 1.6722408026755853, "percentage": 55.85, "elapsed_time": "2:24:21", "remaining_time": "1:54:05"} |
|
{"current_steps": 630, "total_steps": 1119, "loss": 0.749, "learning_rate": 4.773894940836174e-06, "epoch": 1.68561872909699, "percentage": 56.3, "elapsed_time": "2:25:16", "remaining_time": "1:52:45"} |
|
{"current_steps": 635, "total_steps": 1119, "loss": 0.7784, "learning_rate": 4.69601153593329e-06, "epoch": 1.6989966555183946, "percentage": 56.75, "elapsed_time": "2:26:14", "remaining_time": "1:51:27"} |
|
{"current_steps": 640, "total_steps": 1119, "loss": 0.7553, "learning_rate": 4.618202096515505e-06, "epoch": 1.7123745819397993, "percentage": 57.19, "elapsed_time": "2:27:13", "remaining_time": "1:50:11"} |
|
{"current_steps": 645, "total_steps": 1119, "loss": 0.7655, "learning_rate": 4.540485554922729e-06, "epoch": 1.725752508361204, "percentage": 57.64, "elapsed_time": "2:28:12", "remaining_time": "1:48:54"} |
|
{"current_steps": 650, "total_steps": 1119, "loss": 0.7506, "learning_rate": 4.462880820891284e-06, "epoch": 1.7391304347826086, "percentage": 58.09, "elapsed_time": "2:29:14", "remaining_time": "1:47:40"} |
|
{"current_steps": 655, "total_steps": 1119, "loss": 0.7681, "learning_rate": 4.385406776952833e-06, "epoch": 1.7525083612040135, "percentage": 58.53, "elapsed_time": "2:30:08", "remaining_time": "1:46:21"} |
|
{"current_steps": 660, "total_steps": 1119, "loss": 0.7859, "learning_rate": 4.308082273839953e-06, "epoch": 1.7658862876254182, "percentage": 58.98, "elapsed_time": "2:31:07", "remaining_time": "1:45:05"} |
|
{"current_steps": 665, "total_steps": 1119, "loss": 0.7677, "learning_rate": 4.230926125899432e-06, "epoch": 1.779264214046823, "percentage": 59.43, "elapsed_time": "2:32:05", "remaining_time": "1:43:49"} |
|
{"current_steps": 670, "total_steps": 1119, "loss": 0.7224, "learning_rate": 4.153957106514428e-06, "epoch": 1.7926421404682276, "percentage": 59.87, "elapsed_time": "2:33:05", "remaining_time": "1:42:35"} |
|
{"current_steps": 675, "total_steps": 1119, "loss": 0.7286, "learning_rate": 4.0771939435365795e-06, "epoch": 1.8060200668896322, "percentage": 60.32, "elapsed_time": "2:34:05", "remaining_time": "1:41:21"} |
|
{"current_steps": 680, "total_steps": 1119, "loss": 0.7939, "learning_rate": 4.000655314729222e-06, "epoch": 1.819397993311037, "percentage": 60.77, "elapsed_time": "2:35:03", "remaining_time": "1:40:06"} |
|
{"current_steps": 685, "total_steps": 1119, "loss": 0.7843, "learning_rate": 3.924359843222758e-06, "epoch": 1.8327759197324416, "percentage": 61.22, "elapsed_time": "2:36:02", "remaining_time": "1:38:51"} |
|
{"current_steps": 690, "total_steps": 1119, "loss": 0.732, "learning_rate": 3.848326092983356e-06, "epoch": 1.8461538461538463, "percentage": 61.66, "elapsed_time": "2:37:03", "remaining_time": "1:37:38"} |
|
{"current_steps": 695, "total_steps": 1119, "loss": 0.7317, "learning_rate": 3.7725725642960047e-06, "epoch": 1.859531772575251, "percentage": 62.11, "elapsed_time": "2:38:03", "remaining_time": "1:36:25"} |
|
{"current_steps": 700, "total_steps": 1119, "loss": 0.7525, "learning_rate": 3.6971176892631048e-06, "epoch": 1.8729096989966556, "percentage": 62.56, "elapsed_time": "2:39:02", "remaining_time": "1:35:11"} |
|
{"current_steps": 700, "total_steps": 1119, "eval_loss": 0.9970734119415283, "epoch": 1.8729096989966556, "percentage": 62.56, "elapsed_time": "2:41:32", "remaining_time": "1:36:41"} |
|
{"current_steps": 705, "total_steps": 1119, "loss": 0.7621, "learning_rate": 3.6219798273196147e-06, "epoch": 1.8862876254180603, "percentage": 63.0, "elapsed_time": "2:42:30", "remaining_time": "1:35:25"} |
|
{"current_steps": 710, "total_steps": 1119, "loss": 0.7473, "learning_rate": 3.547177260765904e-06, "epoch": 1.899665551839465, "percentage": 63.45, "elapsed_time": "2:43:27", "remaining_time": "1:34:09"} |
|
{"current_steps": 715, "total_steps": 1119, "loss": 0.7279, "learning_rate": 3.47272819031935e-06, "epoch": 1.9130434782608696, "percentage": 63.9, "elapsed_time": "2:44:32", "remaining_time": "1:32:58"} |
|
{"current_steps": 720, "total_steps": 1119, "loss": 0.7681, "learning_rate": 3.398650730685813e-06, "epoch": 1.9264214046822743, "percentage": 64.34, "elapsed_time": "2:45:29", "remaining_time": "1:31:42"} |
|
{"current_steps": 725, "total_steps": 1119, "loss": 0.7551, "learning_rate": 3.3249629061520126e-06, "epoch": 1.939799331103679, "percentage": 64.79, "elapsed_time": "2:46:33", "remaining_time": "1:30:30"} |
|
{"current_steps": 730, "total_steps": 1119, "loss": 0.7567, "learning_rate": 3.2516826461999287e-06, "epoch": 1.9531772575250836, "percentage": 65.24, "elapsed_time": "2:47:29", "remaining_time": "1:29:15"} |
|
{"current_steps": 735, "total_steps": 1119, "loss": 0.7621, "learning_rate": 3.1788277811442436e-06, "epoch": 1.9665551839464883, "percentage": 65.68, "elapsed_time": "2:48:25", "remaining_time": "1:27:59"} |
|
{"current_steps": 740, "total_steps": 1119, "loss": 0.7707, "learning_rate": 3.1064160377939457e-06, "epoch": 1.979933110367893, "percentage": 66.13, "elapsed_time": "2:49:26", "remaining_time": "1:26:46"} |
|
{"current_steps": 745, "total_steps": 1119, "loss": 0.7902, "learning_rate": 3.0344650351390797e-06, "epoch": 1.9933110367892977, "percentage": 66.58, "elapsed_time": "2:50:22", "remaining_time": "1:25:31"} |
|
{"current_steps": 750, "total_steps": 1119, "loss": 0.6413, "learning_rate": 2.962992280063771e-06, "epoch": 2.0066889632107023, "percentage": 67.02, "elapsed_time": "2:51:16", "remaining_time": "1:24:16"} |
|
{"current_steps": 755, "total_steps": 1119, "loss": 0.5334, "learning_rate": 2.8920151630864906e-06, "epoch": 2.020066889632107, "percentage": 67.47, "elapsed_time": "2:52:11", "remaining_time": "1:23:00"} |
|
{"current_steps": 760, "total_steps": 1119, "loss": 0.5353, "learning_rate": 2.821550954128667e-06, "epoch": 2.0334448160535117, "percentage": 67.92, "elapsed_time": "2:53:08", "remaining_time": "1:21:47"} |
|
{"current_steps": 765, "total_steps": 1119, "loss": 0.5371, "learning_rate": 2.7516167983126053e-06, "epoch": 2.0468227424749164, "percentage": 68.36, "elapsed_time": "2:54:07", "remaining_time": "1:20:34"} |
|
{"current_steps": 770, "total_steps": 1119, "loss": 0.535, "learning_rate": 2.6822297117898144e-06, "epoch": 2.060200668896321, "percentage": 68.81, "elapsed_time": "2:55:19", "remaining_time": "1:19:27"} |
|
{"current_steps": 775, "total_steps": 1119, "loss": 0.5595, "learning_rate": 2.61340657760067e-06, "epoch": 2.0735785953177257, "percentage": 69.26, "elapsed_time": "2:56:18", "remaining_time": "1:18:15"} |
|
{"current_steps": 780, "total_steps": 1119, "loss": 0.5129, "learning_rate": 2.5451641415665097e-06, "epoch": 2.0869565217391304, "percentage": 69.71, "elapsed_time": "2:57:16", "remaining_time": "1:17:02"} |
|
{"current_steps": 785, "total_steps": 1119, "loss": 0.5391, "learning_rate": 2.4775190082150747e-06, "epoch": 2.100334448160535, "percentage": 70.15, "elapsed_time": "2:58:18", "remaining_time": "1:15:51"} |
|
{"current_steps": 790, "total_steps": 1119, "loss": 0.5462, "learning_rate": 2.4104876367403602e-06, "epoch": 2.1137123745819397, "percentage": 70.6, "elapsed_time": "2:59:19", "remaining_time": "1:14:40"} |
|
{"current_steps": 795, "total_steps": 1119, "loss": 0.5001, "learning_rate": 2.344086336997819e-06, "epoch": 2.1270903010033444, "percentage": 71.05, "elapsed_time": "3:00:18", "remaining_time": "1:13:29"} |
|
{"current_steps": 800, "total_steps": 1119, "loss": 0.529, "learning_rate": 2.278331265535898e-06, "epoch": 2.140468227424749, "percentage": 71.49, "elapsed_time": "3:01:15", "remaining_time": "1:12:16"} |
|
{"current_steps": 800, "total_steps": 1119, "eval_loss": 1.0470257997512817, "epoch": 2.140468227424749, "percentage": 71.49, "elapsed_time": "3:03:45", "remaining_time": "1:13:16"} |
|
{"current_steps": 805, "total_steps": 1119, "loss": 0.5773, "learning_rate": 2.2132384216648783e-06, "epoch": 2.1538461538461537, "percentage": 71.94, "elapsed_time": "3:06:38", "remaining_time": "1:12:48"} |
|
{"current_steps": 810, "total_steps": 1119, "loss": 0.5209, "learning_rate": 2.148823643563973e-06, "epoch": 2.1672240802675584, "percentage": 72.39, "elapsed_time": "3:07:45", "remaining_time": "1:11:37"} |
|
{"current_steps": 815, "total_steps": 1119, "loss": 0.5338, "learning_rate": 2.0851026044276405e-06, "epoch": 2.180602006688963, "percentage": 72.83, "elapsed_time": "3:08:42", "remaining_time": "1:10:23"} |
|
{"current_steps": 820, "total_steps": 1119, "loss": 0.5502, "learning_rate": 2.022090808652024e-06, "epoch": 2.1939799331103678, "percentage": 73.28, "elapsed_time": "3:09:40", "remaining_time": "1:09:09"} |
|
{"current_steps": 825, "total_steps": 1119, "loss": 0.5352, "learning_rate": 1.9598035880624832e-06, "epoch": 2.2073578595317724, "percentage": 73.73, "elapsed_time": "3:10:37", "remaining_time": "1:07:55"} |
|
{"current_steps": 830, "total_steps": 1119, "loss": 0.5474, "learning_rate": 1.8982560981830911e-06, "epoch": 2.220735785953177, "percentage": 74.17, "elapsed_time": "3:11:35", "remaining_time": "1:06:42"} |
|
{"current_steps": 835, "total_steps": 1119, "loss": 0.4991, "learning_rate": 1.8374633145490566e-06, "epoch": 2.234113712374582, "percentage": 74.62, "elapsed_time": "3:12:39", "remaining_time": "1:05:31"} |
|
{"current_steps": 840, "total_steps": 1119, "loss": 0.532, "learning_rate": 1.7774400290629095e-06, "epoch": 2.2474916387959865, "percentage": 75.07, "elapsed_time": "3:13:43", "remaining_time": "1:04:20"} |
|
{"current_steps": 845, "total_steps": 1119, "loss": 0.5582, "learning_rate": 1.7182008463953986e-06, "epoch": 2.260869565217391, "percentage": 75.51, "elapsed_time": "3:14:46", "remaining_time": "1:03:09"} |
|
{"current_steps": 850, "total_steps": 1119, "loss": 0.508, "learning_rate": 1.6597601804319186e-06, "epoch": 2.274247491638796, "percentage": 75.96, "elapsed_time": "3:15:46", "remaining_time": "1:01:57"} |
|
{"current_steps": 855, "total_steps": 1119, "loss": 0.5539, "learning_rate": 1.602132250765378e-06, "epoch": 2.2876254180602005, "percentage": 76.41, "elapsed_time": "3:16:43", "remaining_time": "1:00:44"} |
|
{"current_steps": 860, "total_steps": 1119, "loss": 0.545, "learning_rate": 1.5453310792363275e-06, "epoch": 2.3010033444816056, "percentage": 76.85, "elapsed_time": "3:17:41", "remaining_time": "0:59:32"} |
|
{"current_steps": 865, "total_steps": 1119, "loss": 0.5266, "learning_rate": 1.489370486521219e-06, "epoch": 2.3143812709030103, "percentage": 77.3, "elapsed_time": "3:18:36", "remaining_time": "0:58:19"} |
|
{"current_steps": 870, "total_steps": 1119, "loss": 0.5175, "learning_rate": 1.4342640887695935e-06, "epoch": 2.327759197324415, "percentage": 77.75, "elapsed_time": "3:19:36", "remaining_time": "0:57:07"} |
|
{"current_steps": 875, "total_steps": 1119, "loss": 0.5132, "learning_rate": 1.380025294291057e-06, "epoch": 2.3411371237458196, "percentage": 78.19, "elapsed_time": "3:20:38", "remaining_time": "0:55:56"} |
|
{"current_steps": 880, "total_steps": 1119, "loss": 0.5381, "learning_rate": 1.3266673002927993e-06, "epoch": 2.3545150501672243, "percentage": 78.64, "elapsed_time": "3:21:42", "remaining_time": "0:54:46"} |
|
{"current_steps": 885, "total_steps": 1119, "loss": 0.5151, "learning_rate": 1.2742030896685075e-06, "epoch": 2.367892976588629, "percentage": 79.09, "elapsed_time": "3:22:39", "remaining_time": "0:53:34"} |
|
{"current_steps": 890, "total_steps": 1119, "loss": 0.5314, "learning_rate": 1.2226454278393956e-06, "epoch": 2.3812709030100336, "percentage": 79.54, "elapsed_time": "3:23:41", "remaining_time": "0:52:24"} |
|
{"current_steps": 895, "total_steps": 1119, "loss": 0.5083, "learning_rate": 1.1720068596481765e-06, "epoch": 2.3946488294314383, "percentage": 79.98, "elapsed_time": "3:24:40", "remaining_time": "0:51:13"} |
|
{"current_steps": 900, "total_steps": 1119, "loss": 0.5365, "learning_rate": 1.1222997063066855e-06, "epoch": 2.408026755852843, "percentage": 80.43, "elapsed_time": "3:25:40", "remaining_time": "0:50:02"} |
|
{"current_steps": 900, "total_steps": 1119, "eval_loss": 1.0517374277114868, "epoch": 2.408026755852843, "percentage": 80.43, "elapsed_time": "3:28:10", "remaining_time": "0:50:39"} |
|
{"current_steps": 905, "total_steps": 1119, "loss": 0.5308, "learning_rate": 1.0735360623979201e-06, "epoch": 2.4214046822742477, "percentage": 80.88, "elapsed_time": "3:29:10", "remaining_time": "0:49:27"} |
|
{"current_steps": 910, "total_steps": 1119, "loss": 0.5204, "learning_rate": 1.0257277929332332e-06, "epoch": 2.4347826086956523, "percentage": 81.32, "elapsed_time": "3:30:13", "remaining_time": "0:48:17"} |
|
{"current_steps": 915, "total_steps": 1119, "loss": 0.5391, "learning_rate": 9.788865304653727e-07, "epoch": 2.448160535117057, "percentage": 81.77, "elapsed_time": "3:31:11", "remaining_time": "0:47:05"} |
|
{"current_steps": 920, "total_steps": 1119, "loss": 0.5106, "learning_rate": 9.330236722580832e-07, "epoch": 2.4615384615384617, "percentage": 82.22, "elapsed_time": "3:32:12", "remaining_time": "0:45:53"} |
|
{"current_steps": 925, "total_steps": 1119, "loss": 0.5413, "learning_rate": 8.881503775129696e-07, "epoch": 2.4749163879598663, "percentage": 82.66, "elapsed_time": "3:33:13", "remaining_time": "0:44:43"} |
|
{"current_steps": 930, "total_steps": 1119, "loss": 0.5388, "learning_rate": 8.442775646542656e-07, "epoch": 2.488294314381271, "percentage": 83.11, "elapsed_time": "3:34:09", "remaining_time": "0:43:31"} |
|
{"current_steps": 935, "total_steps": 1119, "loss": 0.5242, "learning_rate": 8.014159086722101e-07, "epoch": 2.5016722408026757, "percentage": 83.56, "elapsed_time": "3:35:09", "remaining_time": "0:42:20"} |
|
{"current_steps": 940, "total_steps": 1119, "loss": 0.5477, "learning_rate": 7.595758385256325e-07, "epoch": 2.5150501672240804, "percentage": 84.0, "elapsed_time": "3:36:11", "remaining_time": "0:41:10"} |
|
{"current_steps": 945, "total_steps": 1119, "loss": 0.5078, "learning_rate": 7.187675346044165e-07, "epoch": 2.528428093645485, "percentage": 84.45, "elapsed_time": "3:37:05", "remaining_time": "0:39:58"} |
|
{"current_steps": 950, "total_steps": 1119, "loss": 0.5414, "learning_rate": 6.790009262524455e-07, "epoch": 2.5418060200668897, "percentage": 84.9, "elapsed_time": "3:38:05", "remaining_time": "0:38:47"} |
|
{"current_steps": 955, "total_steps": 1119, "loss": 0.5165, "learning_rate": 6.40285689351619e-07, "epoch": 2.5551839464882944, "percentage": 85.34, "elapsed_time": "3:39:00", "remaining_time": "0:37:36"} |
|
{"current_steps": 960, "total_steps": 1119, "loss": 0.5129, "learning_rate": 6.026312439675553e-07, "epoch": 2.568561872909699, "percentage": 85.79, "elapsed_time": "3:39:56", "remaining_time": "0:36:25"} |
|
{"current_steps": 965, "total_steps": 1119, "loss": 0.503, "learning_rate": 5.66046752057523e-07, "epoch": 2.5819397993311037, "percentage": 86.24, "elapsed_time": "3:40:55", "remaining_time": "0:35:15"} |
|
{"current_steps": 970, "total_steps": 1119, "loss": 0.5241, "learning_rate": 5.305411152411943e-07, "epoch": 2.5953177257525084, "percentage": 86.68, "elapsed_time": "3:41:50", "remaining_time": "0:34:04"} |
|
{"current_steps": 975, "total_steps": 1119, "loss": 0.5176, "learning_rate": 4.961229726347233e-07, "epoch": 2.608695652173913, "percentage": 87.13, "elapsed_time": "3:42:47", "remaining_time": "0:32:54"} |
|
{"current_steps": 980, "total_steps": 1119, "loss": 0.4961, "learning_rate": 4.628006987487088e-07, "epoch": 2.6220735785953178, "percentage": 87.58, "elapsed_time": "3:43:45", "remaining_time": "0:31:44"} |
|
{"current_steps": 985, "total_steps": 1119, "loss": 0.5436, "learning_rate": 4.3058240145053223e-07, "epoch": 2.6354515050167224, "percentage": 88.03, "elapsed_time": "3:44:44", "remaining_time": "0:30:34"} |
|
{"current_steps": 990, "total_steps": 1119, "loss": 0.5004, "learning_rate": 3.994759199915821e-07, "epoch": 2.648829431438127, "percentage": 88.47, "elapsed_time": "3:45:44", "remaining_time": "0:29:24"} |
|
{"current_steps": 995, "total_steps": 1119, "loss": 0.5275, "learning_rate": 3.694888230998289e-07, "epoch": 2.6622073578595318, "percentage": 88.92, "elapsed_time": "3:46:43", "remaining_time": "0:28:15"} |
|
{"current_steps": 1000, "total_steps": 1119, "loss": 0.5256, "learning_rate": 3.406284071382288e-07, "epoch": 2.6755852842809364, "percentage": 89.37, "elapsed_time": "3:47:41", "remaining_time": "0:27:05"} |
|
{"current_steps": 1000, "total_steps": 1119, "eval_loss": 1.0514318943023682, "epoch": 2.6755852842809364, "percentage": 89.37, "elapsed_time": "3:50:11", "remaining_time": "0:27:23"} |
|
{"current_steps": 1005, "total_steps": 1119, "loss": 0.5022, "learning_rate": 3.1290169432939556e-07, "epoch": 2.688963210702341, "percentage": 89.81, "elapsed_time": "3:53:08", "remaining_time": "0:26:26"} |
|
{"current_steps": 1010, "total_steps": 1119, "loss": 0.5397, "learning_rate": 2.863154310469768e-07, "epoch": 2.702341137123746, "percentage": 90.26, "elapsed_time": "3:54:09", "remaining_time": "0:25:16"} |
|
{"current_steps": 1015, "total_steps": 1119, "loss": 0.5359, "learning_rate": 2.6087608617414715e-07, "epoch": 2.7157190635451505, "percentage": 90.71, "elapsed_time": "3:55:08", "remaining_time": "0:24:05"} |
|
{"current_steps": 1020, "total_steps": 1119, "loss": 0.5013, "learning_rate": 2.365898495296226e-07, "epoch": 2.729096989966555, "percentage": 91.15, "elapsed_time": "3:56:02", "remaining_time": "0:22:54"} |
|
{"current_steps": 1025, "total_steps": 1119, "loss": 0.5468, "learning_rate": 2.1346263036157112e-07, "epoch": 2.74247491638796, "percentage": 91.6, "elapsed_time": "3:57:01", "remaining_time": "0:21:44"} |
|
{"current_steps": 1030, "total_steps": 1119, "loss": 0.52, "learning_rate": 1.9150005590979682e-07, "epoch": 2.7558528428093645, "percentage": 92.05, "elapsed_time": "3:57:55", "remaining_time": "0:20:33"} |
|
{"current_steps": 1035, "total_steps": 1119, "loss": 0.4959, "learning_rate": 1.707074700365341e-07, "epoch": 2.769230769230769, "percentage": 92.49, "elapsed_time": "3:58:55", "remaining_time": "0:19:23"} |
|
{"current_steps": 1040, "total_steps": 1119, "loss": 0.5014, "learning_rate": 1.5108993192620268e-07, "epoch": 2.782608695652174, "percentage": 92.94, "elapsed_time": "3:59:53", "remaining_time": "0:18:13"} |
|
{"current_steps": 1045, "total_steps": 1119, "loss": 0.5043, "learning_rate": 1.326522148544157e-07, "epoch": 2.7959866220735785, "percentage": 93.39, "elapsed_time": "4:00:56", "remaining_time": "0:17:03"} |
|
{"current_steps": 1050, "total_steps": 1119, "loss": 0.5492, "learning_rate": 1.153988050265692e-07, "epoch": 2.809364548494983, "percentage": 93.83, "elapsed_time": "4:01:56", "remaining_time": "0:15:53"} |
|
{"current_steps": 1055, "total_steps": 1119, "loss": 0.5247, "learning_rate": 9.933390048626645e-08, "epoch": 2.822742474916388, "percentage": 94.28, "elapsed_time": "4:02:50", "remaining_time": "0:14:43"} |
|
{"current_steps": 1060, "total_steps": 1119, "loss": 0.52, "learning_rate": 8.446141009386955e-08, "epoch": 2.8361204013377925, "percentage": 94.73, "elapsed_time": "4:03:47", "remaining_time": "0:13:34"} |
|
{"current_steps": 1065, "total_steps": 1119, "loss": 0.5146, "learning_rate": 7.078495257540341e-08, "epoch": 2.849498327759197, "percentage": 95.17, "elapsed_time": "4:04:49", "remaining_time": "0:12:24"} |
|
{"current_steps": 1070, "total_steps": 1119, "loss": 0.5674, "learning_rate": 5.830785564206298e-08, "epoch": 2.862876254180602, "percentage": 95.62, "elapsed_time": "4:05:43", "remaining_time": "0:11:15"} |
|
{"current_steps": 1075, "total_steps": 1119, "loss": 0.544, "learning_rate": 4.7033155180522535e-08, "epoch": 2.8762541806020065, "percentage": 96.07, "elapsed_time": "4:06:46", "remaining_time": "0:10:06"} |
|
{"current_steps": 1080, "total_steps": 1119, "loss": 0.5008, "learning_rate": 3.696359451425491e-08, "epoch": 2.8896321070234112, "percentage": 96.51, "elapsed_time": "4:07:47", "remaining_time": "0:08:56"} |
|
{"current_steps": 1085, "total_steps": 1119, "loss": 0.5273, "learning_rate": 2.8101623736035422e-08, "epoch": 2.903010033444816, "percentage": 96.96, "elapsed_time": "4:08:46", "remaining_time": "0:07:47"} |
|
{"current_steps": 1090, "total_steps": 1119, "loss": 0.5461, "learning_rate": 2.0449399111791003e-08, "epoch": 2.9163879598662206, "percentage": 97.41, "elapsed_time": "4:09:41", "remaining_time": "0:06:38"} |
|
{"current_steps": 1095, "total_steps": 1119, "loss": 0.5118, "learning_rate": 1.400878255594762e-08, "epoch": 2.9297658862876252, "percentage": 97.86, "elapsed_time": "4:10:33", "remaining_time": "0:05:29"} |
|
{"current_steps": 1100, "total_steps": 1119, "loss": 0.518, "learning_rate": 8.781341178393244e-09, "epoch": 2.94314381270903, "percentage": 98.3, "elapsed_time": "4:11:31", "remaining_time": "0:04:20"} |
|
{"current_steps": 1100, "total_steps": 1119, "eval_loss": 1.0516117811203003, "epoch": 2.94314381270903, "percentage": 98.3, "elapsed_time": "4:14:03", "remaining_time": "0:04:23"} |
|
{"current_steps": 1105, "total_steps": 1119, "loss": 0.5003, "learning_rate": 4.76834690317396e-09, "epoch": 2.9565217391304346, "percentage": 98.75, "elapsed_time": "4:15:00", "remaining_time": "0:03:13"} |
|
{"current_steps": 1110, "total_steps": 1119, "loss": 0.5345, "learning_rate": 1.9707761590148642e-09, "epoch": 2.9698996655518393, "percentage": 99.2, "elapsed_time": "4:15:57", "remaining_time": "0:02:04"} |
|
{"current_steps": 1115, "total_steps": 1119, "loss": 0.5564, "learning_rate": 3.8930964173733434e-10, "epoch": 2.983277591973244, "percentage": 99.64, "elapsed_time": "4:17:04", "remaining_time": "0:00:55"} |
|
{"current_steps": 1119, "total_steps": 1119, "epoch": 2.993979933110368, "percentage": 100.0, "elapsed_time": "4:19:48", "remaining_time": "0:00:00"} |
|
|