{"step": 1, "l2_params": 207.83166265038426, "train/loss": 6.9062498807907104, "l2_grads": 0.58984375, "lr": 0.0, "uptime": 76.64550542500001, "examples_seen": 1024.0, "progress": 8.88075806150813e-06, "epoch": 0.0007992712893791364} {"step": 2, "l2_params": 207.83166265038912, "train/loss": 6.90625, "l2_grads": 0.5859375, "lr": 1.0000000000000001e-07, "uptime": 78.4814042879998, "examples_seen": 2048.0, "progress": 1.776151612301626e-05, "epoch": 0.0015985425787582727} {"step": 50, "l2_params": 207.83166336385142, "train/loss": 6.9063109159469604, "l2_grads": 0.58203125, "lr": 4.9e-06, "uptime": 162.29491573999985, "examples_seen": 51200.0, "progress": 0.0004440379030754065, "epoch": 0.03996356446895682, "img/sec/core": 586.4448243306131, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 0.023281530958888904, "core_hours": 0.023281530958888904} {"step": 100, "l2_params": 207.83168220795426, "train/loss": 6.906715393066406, "l2_grads": 0.609375, "lr": 9.900000000000002e-06, "uptime": 251.76883455999996, "examples_seen": 102400.0, "progress": 0.000888075806150813, "epoch": 0.07992712893791364, "img/sec/core": 572.23379366005, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 0.04813539729777783, "core_hours": 0.04813539729777783} {"step": 150, "l2_params": 207.83179455781215, "train/loss": 6.902469515800476, "l2_grads": 0.60546875, "lr": 1.49e-05, "uptime": 342.78957389399966, "examples_seen": 153600.0, "progress": 0.0013321137092262196, "epoch": 0.11989069340687046, "img/sec/core": 562.5091641161264, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 0.07341893600166663, "core_hours": 0.07341893600166663} {"step": 200, "l2_params": 207.83198534026928, "train/loss": 6.892016053199768, "l2_grads": 0.58203125, "lr": 1.9900000000000003e-05, "uptime": 434.61464481999974, "examples_seen": 204800.0, "progress": 0.001776151612301626, "epoch": 0.15985425787582727, "img/sec/core": 557.5819270671843, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 0.09892590014777776, "core_hours": 0.09892590014777776} {"step": 250, "l2_params": 207.84188168640515, "train/loss": 6.8753063678741455, "l2_grads": 0.6171875, "lr": 2.49e-05, "uptime": 526.6235965229998, "examples_seen": 256000.0, "progress": 0.0022201895153770327, "epoch": 0.1998178223447841, "img/sec/core": 556.4675942105158, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 0.12448394228750001, "core_hours": 0.12448394228750001} {"step": 300, "l2_params": 207.85191426224992, "train/loss": 6.857430577278137, "l2_grads": 0.60546875, "lr": 2.9900000000000002e-05, "uptime": 618.6865964640001, "examples_seen": 307200.0, "progress": 0.0026642274184524393, "epoch": 0.23978138681374092, "img/sec/core": 556.1409038681355, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 0.15005699782666676, "core_hours": 0.15005699782666676} {"step": 350, "l2_params": 207.85244201462604, "train/loss": 6.825409412384033, "l2_grads": 0.81640625, "lr": 3.49e-05, "uptime": 710.7981772719995, "examples_seen": 358400.0, "progress": 0.003108265321527846, "epoch": 0.2797449512826977, "img/sec/core": 555.8475877937983, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 0.17564354805111104, "core_hours": 0.17564354805111104} {"step": 400, "l2_params": 207.86274322508382, "train/loss": 6.83647346496582, "l2_grads": 1.3359375, "lr": 3.99e-05, "uptime": 802.9022893679994, "examples_seen": 409600.0, "progress": 0.003552303224603252, "epoch": 0.31970851575165454, "img/sec/core": 555.8926614116248, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 0.20122802363333323, "core_hours": 0.20122802363333323} {"step": 450, "l2_params": 207.86354326985054, "train/loss": 6.811252474784851, "l2_grads": 0.93359375, "lr": 4.49e-05, "uptime": 895.0891182219993, "examples_seen": 460800.0, "progress": 0.003996341127678659, "epoch": 0.35967208022061137, "img/sec/core": 555.3938739023938, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 0.22683547609277765, "core_hours": 0.22683547609277765} {"step": 500, "l2_params": 207.86442018746402, "train/loss": 6.74031388759613, "l2_grads": 0.9453125, "lr": 4.99e-05, "uptime": 987.2726819929994, "examples_seen": 512000.0, "progress": 0.0044403790307540655, "epoch": 0.3996356446895682, "img/sec/core": 555.4135455989709, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 0.2524420215847221, "core_hours": 0.2524420215847221} {"step": 550, "l2_params": 207.86531294813565, "train/loss": 6.748172402381897, "l2_grads": 1.359375, "lr": 5.49e-05, "uptime": 1079.549124319, "examples_seen": 563200.0, "progress": 0.004884416933829472, "epoch": 0.439599209158525, "img/sec/core": 554.8545079264884, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 0.2780743666752778, "core_hours": 0.2780743666752778} {"step": 600, "l2_params": 207.8661053487031, "train/loss": 6.730957627296448, "l2_grads": 1.5625, "lr": 5.9900000000000006e-05, "uptime": 1171.758201097, "examples_seen": 614400.0, "progress": 0.0053284548369048786, "epoch": 0.47956277362748184, "img/sec/core": 555.2598701673119, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 0.30368799911361116, "core_hours": 0.30368799911361116} {"step": 650, "l2_params": 207.87182660642566, "train/loss": 6.777011513710022, "l2_grads": 2.625, "lr": 6.49e-05, "uptime": 1264.0831543109998, "examples_seen": 665600.0, "progress": 0.005772492739980285, "epoch": 0.5195263380964387, "img/sec/core": 554.5629671896353, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 0.32933381945083334, "core_hours": 0.32933381945083334} {"step": 700, "l2_params": 207.87262058788716, "train/loss": 6.692772388458252, "l2_grads": 2.3125, "lr": 6.99e-05, "uptime": 1356.4102695789998, "examples_seen": 716800.0, "progress": 0.006216530643055692, "epoch": 0.5594899025653954, "img/sec/core": 554.5499808087866, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 0.35498024035861114, "core_hours": 0.35498024035861114} {"step": 750, "l2_params": 207.87340416126537, "train/loss": 6.703240394592285, "l2_grads": 3.15625, "lr": 7.489999999999999e-05, "uptime": 1448.7562060999999, "examples_seen": 768000.0, "progress": 0.006660568546131097, "epoch": 0.5994534670343523, "img/sec/core": 554.4369566099615, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 0.38063188939222226, "core_hours": 0.38063188939222226} {"step": 800, "l2_params": 207.8935486299435, "train/loss": 6.670055031776428, "l2_grads": 3.828125, "lr": 7.99e-05, "uptime": 1541.0975852329993, "examples_seen": 819200.0, "progress": 0.007104606449206504, "epoch": 0.6394170315033091, "img/sec/core": 554.4643201208479, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 0.4062822724847221, "core_hours": 0.4062822724847221} {"step": 850, "l2_params": 207.90423266499886, "train/loss": 6.616488099098206, "l2_grads": 2.125, "lr": 8.49e-05, "uptime": 1633.4763670439997, "examples_seen": 870400.0, "progress": 0.00754864435228191, "epoch": 0.679380595972266, "img/sec/core": 554.2398264652494, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 0.43194304521, "core_hours": 0.43194304521} {"step": 900, "l2_params": 207.90517420786415, "train/loss": 6.667346835136414, "l2_grads": 2.828125, "lr": 8.989999999999999e-05, "uptime": 1725.9126851929996, "examples_seen": 921600.0, "progress": 0.007992682255357318, "epoch": 0.7193441604412227, "img/sec/core": 553.8948437720093, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 0.4576198002513888, "core_hours": 0.4576198002513888} {"step": 950, "l2_params": 207.91582522581945, "train/loss": 6.637000560760498, "l2_grads": 2.484375, "lr": 9.49e-05, "uptime": 1818.443458533, "examples_seen": 972800.0, "progress": 0.008436720158432724, "epoch": 0.7593077249101795, "img/sec/core": 553.3294292469354, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 0.4833227928458334, "core_hours": 0.4833227928458334} {"step": 1000, "l2_params": 207.91694593187842, "train/loss": 6.770874381065369, "l2_grads": 1.8515625, "lr": 9.99e-05, "uptime": 1910.9521817599998, "examples_seen": 1024000.0, "progress": 0.008880758061508131, "epoch": 0.7992712893791364, "img/sec/core": 553.4613192570434, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 0.5090196604088889, "core_hours": 0.5090196604088889} {"step": 1050, "l2_params": 207.9469364044235, "train/loss": 6.7737027406692505, "l2_grads": 5.78125, "lr": 0.0001049, "uptime": 2003.6342478299994, "examples_seen": 1075200.0, "progress": 0.009324795964583537, "epoch": 0.8392348538480932, "img/sec/core": 552.4261830905929, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 0.5347646787616666, "core_hours": 0.5347646787616666} {"step": 1100, "l2_params": 207.94837811757742, "train/loss": 6.756062746047974, "l2_grads": 2.953125, "lr": 0.0001099, "uptime": 2096.1618790149996, "examples_seen": 1126400.0, "progress": 0.009768833867658944, "epoch": 0.87919841831705, "img/sec/core": 553.348219815878, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 0.5604667985352777, "core_hours": 0.5604667985352777} {"step": 1150, "l2_params": 207.94943246179258, "train/loss": 6.629732012748718, "l2_grads": 2.34375, "lr": 0.0001149, "uptime": 2188.6601942429998, "examples_seen": 1177600.0, "progress": 0.01021287177073435, "epoch": 0.9191619827860068, "img/sec/core": 553.5235952546437, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 0.5861607749875, "core_hours": 0.5861607749875} {"step": 1200, "l2_params": 207.96538640833893, "train/loss": 6.661787509918213, "l2_grads": 2.609375, "lr": 0.00011990000000000001, "uptime": 2281.1378932609996, "examples_seen": 1228800.0, "progress": 0.010656909673809757, "epoch": 0.9591255472549637, "img/sec/core": 553.6469932068103, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 0.6118490247147221, "core_hours": 0.6118490247147221} {"step": 1250, "l2_params": 207.97659404816446, "train/loss": 6.573065638542175, "l2_grads": 3.09375, "lr": 0.0001249, "uptime": 2373.5472992709992, "examples_seen": 1280000.0, "progress": 0.011100947576885163, "epoch": 0.9990891117239205, "img/sec/core": 554.0561530550216, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 0.6375183041619442, "core_hours": 0.6375183041619442} {"step": 1300, "l2_params": 207.97796200498874, "train/loss": 6.6279871463775635, "l2_grads": 3.828125, "lr": 0.00012989999999999999, "uptime": 2465.9966982139995, "examples_seen": 1331200.0, "progress": 0.01154498547996057, "epoch": 1.0390526761928773, "img/sec/core": 553.8164724204147, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 0.6631986927572221, "core_hours": 0.6631986927572221} {"step": 1350, "l2_params": 207.98917157156964, "train/loss": 6.577640175819397, "l2_grads": 2.265625, "lr": 0.0001349, "uptime": 2558.4841390779993, "examples_seen": 1382400.0, "progress": 0.011989023383035976, "epoch": 1.079016240661834, "img/sec/core": 553.5886767078803, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 0.6888896485527777, "core_hours": 0.6888896485527777} {"step": 1400, "l2_params": 207.99109282128686, "train/loss": 6.519563555717468, "l2_grads": 2.140625, "lr": 0.0001399, "uptime": 2650.9473517399992, "examples_seen": 1433600.0, "progress": 0.012433061286111383, "epoch": 1.1189798051307909, "img/sec/core": 553.7337339462997, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 0.7145738742922221, "core_hours": 0.7145738742922221} {"step": 1450, "l2_params": 208.00308982681588, "train/loss": 6.72875714302063, "l2_grads": 2.65625, "lr": 0.0001449, "uptime": 2743.5134343219997, "examples_seen": 1484800.0, "progress": 0.012877099189186789, "epoch": 1.1589433695997478, "img/sec/core": 553.1183622753401, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 0.7402866750094445, "core_hours": 0.7402866750094445} {"step": 1500, "l2_params": 208.02439176151682, "train/loss": 6.517720699310303, "l2_grads": 2.671875, "lr": 0.0001499, "uptime": 2836.0809853359997, "examples_seen": 1536000.0, "progress": 0.013321137092262195, "epoch": 1.1989069340687046, "img/sec/core": 553.1095879619468, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 0.7659998836244444, "core_hours": 0.7659998836244444} {"step": 1550, "l2_params": 208.05530733445417, "train/loss": 6.478211522102356, "l2_grads": 3.171875, "lr": 0.00015490000000000002, "uptime": 2928.7093405329997, "examples_seen": 1587200.0, "progress": 0.013765174995337602, "epoch": 1.2388704985376613, "img/sec/core": 552.7465093286924, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 0.7917299822902778, "core_hours": 0.7917299822902778} {"step": 1600, "l2_params": 208.05707982784844, "train/loss": 6.5447447299957275, "l2_grads": 4.03125, "lr": 0.00015989999999999998, "uptime": 3021.341463768, "examples_seen": 1638400.0, "progress": 0.014209212898413008, "epoch": 1.2788340630066182, "img/sec/core": 552.7240250135452, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 0.8174611276333333, "core_hours": 0.8174611276333333} {"step": 1650, "l2_params": 208.05865711480268, "train/loss": 6.491197109222412, "l2_grads": 2.3125, "lr": 0.0001649, "uptime": 3114.0000376049993, "examples_seen": 1689600.0, "progress": 0.014653250801488415, "epoch": 1.318797627475575, "img/sec/core": 552.5662427102383, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 0.8431996203658332, "core_hours": 0.8431996203658332} {"step": 1700, "l2_params": 208.08957366487584, "train/loss": 6.528055548667908, "l2_grads": 3.140625, "lr": 0.0001699, "uptime": 3206.7147506679994, "examples_seen": 1740800.0, "progress": 0.01509728870456382, "epoch": 1.358761191944532, "img/sec/core": 552.2316610655889, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 0.8689537073277777, "core_hours": 0.8689537073277777} {"step": 1750, "l2_params": 208.111380594847, "train/loss": 6.468620181083679, "l2_grads": 2.171875, "lr": 0.0001749, "uptime": 3299.3660535849995, "examples_seen": 1792000.0, "progress": 0.015541326607639228, "epoch": 1.3987247564134886, "img/sec/core": 552.6096059962218, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 0.8946901803602777, "core_hours": 0.8946901803602777} {"step": 1800, "l2_params": 208.14247201890845, "train/loss": 6.403588175773621, "l2_grads": 2.609375, "lr": 0.0001799, "uptime": 3392.081024153, "examples_seen": 1843200.0, "progress": 0.015985364510714636, "epoch": 1.4386883208824455, "img/sec/core": 552.2301273066593, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 0.9204443388513889, "core_hours": 0.9204443388513889} {"step": 1850, "l2_params": 208.16856009989237, "train/loss": 6.457463383674622, "l2_grads": 2.578125, "lr": 0.00018490000000000002, "uptime": 3484.759300733999, "examples_seen": 1894400.0, "progress": 0.01642940241379004, "epoch": 1.4786518853514024, "img/sec/core": 552.4487710477867, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 0.9461883045683331, "core_hours": 0.9461883045683331} {"step": 1900, "l2_params": 208.2188457252343, "train/loss": 6.571776628494263, "l2_grads": 4.1875, "lr": 0.0001899, "uptime": 3577.4941135299996, "examples_seen": 1945600.0, "progress": 0.016873440316865447, "epoch": 1.518615449820359, "img/sec/core": 552.1119680548732, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 0.9719479747894444, "core_hours": 0.9719479747894444} {"step": 1951, "l2_params": 208.25562008604788, "train/loss": 6.361223936080933, "l2_grads": 2.09375, "lr": 0.0001949, "uptime": 3670.199842039, "examples_seen": 1996800.0, "progress": 0.017317478219940854, "epoch": 1.558579014289316, "img/sec/core": 552.2851804678844, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 0.9976995660419445, "core_hours": 0.9976995660419445} {"step": 2000, "l2_params": 208.306189110972, "train/loss": 6.467161417007446, "l2_grads": 3.21875, "lr": 0.0001999, "uptime": 3762.8970891179997, "examples_seen": 2048000.0, "progress": 0.017761516123016262, "epoch": 1.5985425787582728, "img/sec/core": 552.3357123687358, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 1.0234488013416667, "core_hours": 1.0234488013416667} {"step": 2050, "l2_params": 208.337572019055, "train/loss": 6.29259181022644, "l2_grads": 2.546875, "lr": 0.0002049, "uptime": 3855.832939674, "examples_seen": 2099200.0, "progress": 0.018205554026091666, "epoch": 1.6385061432272296, "img/sec/core": 550.9176458136403, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 1.049264315385, "core_hours": 1.049264315385} {"step": 2100, "l2_params": 208.37435799484345, "train/loss": 6.565992832183838, "l2_grads": 5.59375, "lr": 0.0002099, "uptime": 3948.5116849469996, "examples_seen": 2150400.0, "progress": 0.018649591929167073, "epoch": 1.6784697076961863, "img/sec/core": 552.4459772214492, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 1.0750084112941667, "core_hours": 1.0750084112941667} {"step": 2150, "l2_params": 208.41565480292297, "train/loss": 6.372379779815674, "l2_grads": 2.375, "lr": 0.00021490000000000002, "uptime": 4041.259481489, "examples_seen": 2201600.0, "progress": 0.01909362983224248, "epoch": 1.7184332721651432, "img/sec/core": 552.0346780078423, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 1.100771688111389, "core_hours": 1.100771688111389} {"step": 2200, "l2_params": 208.44794322879733, "train/loss": 6.325015068054199, "l2_grads": 2.328125, "lr": 0.0002199, "uptime": 4133.997703793, "examples_seen": 2252800.0, "progress": 0.019537667735317888, "epoch": 1.7583968366341, "img/sec/core": 552.0916697342324, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 1.1265323054180558, "core_hours": 1.1265323054180558} {"step": 2250, "l2_params": 208.48951762536112, "train/loss": 6.298551559448242, "l2_grads": 3.28125, "lr": 0.0002249, "uptime": 4226.7670098710005, "examples_seen": 2304000.0, "progress": 0.019981705638393292, "epoch": 1.7983604011030567, "img/sec/core": 551.9066829814503, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 1.1523015571063893, "core_hours": 1.1523015571063893} {"step": 2300, "l2_params": 208.530786414012, "train/loss": 6.723063111305237, "l2_grads": 2.390625, "lr": 0.0002299, "uptime": 4319.515562504999, "examples_seen": 2355200.0, "progress": 0.0204257435414687, "epoch": 1.8383239655720136, "img/sec/core": 552.0301777866413, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 1.1780650439491667, "core_hours": 1.1780650439491667} {"step": 2350, "l2_params": 208.56342044543763, "train/loss": 6.323840975761414, "l2_grads": 2.265625, "lr": 0.0002349, "uptime": 4412.328786967999, "examples_seen": 2406400.0, "progress": 0.020869781444544107, "epoch": 1.8782875300409705, "img/sec/core": 551.6455256913424, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 1.2038464951888885, "core_hours": 1.2038464951888885} {"step": 2400, "l2_params": 208.63439945830865, "train/loss": 6.206691384315491, "l2_grads": 4.0625, "lr": 0.0002399, "uptime": 4505.155586445999, "examples_seen": 2457600.0, "progress": 0.021313819347619514, "epoch": 1.9182510945099274, "img/sec/core": 551.5648529079632, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 1.2296317172661106, "core_hours": 1.2296317172661106} {"step": 2450, "l2_params": 208.6576826987071, "train/loss": 6.2512664794921875, "l2_grads": 2.21875, "lr": 0.0002449, "uptime": 4598.015483064999, "examples_seen": 2508800.0, "progress": 0.021757857250694918, "epoch": 1.958214658978884, "img/sec/core": 551.3682640642083, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 1.255426132993611, "core_hours": 1.255426132993611} {"step": 2500, "l2_params": 208.69035717155597, "train/loss": 6.172760248184204, "l2_grads": 2.546875, "lr": 0.0002499, "uptime": 4690.872886716999, "examples_seen": 2560000.0, "progress": 0.022201895153770326, "epoch": 1.998178223447841, "img/sec/core": 551.3830667921872, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 1.2812198562302775, "core_hours": 1.2812198562302775, "val/acc@1": 0.0418327487244898, "val/loss": 5.893508444027025, "z/secs/eval/val": 35.79783149399918} {"step": 2550, "l2_params": 208.73796670003622, "train/loss": 6.172629952430725, "l2_grads": 2.1875, "lr": 0.0002549, "uptime": 4819.046039171999, "examples_seen": 2611200.0, "progress": 0.022645933056845733, "epoch": 2.0381417879167976, "img/sec/core": 399.45962956615153, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 1.3168235096899998, "core_hours": 1.3168235096899998} {"step": 2600, "l2_params": 208.8095522423867, "train/loss": 6.7525928020477295, "l2_grads": 4.15625, "lr": 0.00025990000000000003, "uptime": 4911.710485681, "examples_seen": 2662400.0, "progress": 0.02308997095992114, "epoch": 2.0781053523857547, "img/sec/core": 552.5312234506958, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 1.342563633720278, "core_hours": 1.342563633720278} {"step": 2650, "l2_params": 208.90028678468965, "train/loss": 6.1548038721084595, "l2_grads": 2.75, "lr": 0.00026490000000000004, "uptime": 5004.468038735, "examples_seen": 2713600.0, "progress": 0.023534008862996544, "epoch": 2.1180689168547113, "img/sec/core": 551.9766133782483, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 1.3683296206797224, "core_hours": 1.3683296206797224} {"step": 2700, "l2_params": 208.9467065570316, "train/loss": 6.193925499916077, "l2_grads": 1.953125, "lr": 0.0002699, "uptime": 5097.342757054999, "examples_seen": 2764800.0, "progress": 0.023978046766071952, "epoch": 2.158032481323668, "img/sec/core": 551.2802722436331, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 1.3941281535463887, "core_hours": 1.3941281535463887} {"step": 2750, "l2_params": 208.999119478406, "train/loss": 6.34933602809906, "l2_grads": 2.1875, "lr": 0.00027489999999999996, "uptime": 5191.812308523, "examples_seen": 2816000.0, "progress": 0.02442208466914736, "epoch": 2.197996045792625, "img/sec/core": 541.9735693075964, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 1.4203696956208334, "core_hours": 1.4203696956208334} {"step": 2800, "l2_params": 209.08027804612917, "train/loss": 6.177191972732544, "l2_grads": 2.09375, "lr": 0.0002799, "uptime": 5284.643352461, "examples_seen": 2867200.0, "progress": 0.024866122572222767, "epoch": 2.2379596102615817, "img/sec/core": 551.5396340279802, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 1.4461560967147224, "core_hours": 1.4461560967147224} {"step": 2850, "l2_params": 209.14291270461524, "train/loss": 6.1803261041641235, "l2_grads": 2.625, "lr": 0.0002849, "uptime": 5378.428653122999, "examples_seen": 2918400.0, "progress": 0.02531016047529817, "epoch": 2.277923174730539, "img/sec/core": 545.9277694755618, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 1.4722075691208332, "core_hours": 1.4722075691208332} {"step": 2900, "l2_params": 209.26289162067948, "train/loss": 6.603275537490845, "l2_grads": 2.5625, "lr": 0.0002899, "uptime": 5471.243591699, "examples_seen": 2969600.0, "progress": 0.025754198378373578, "epoch": 2.3178867391994955, "img/sec/core": 551.6353378618606, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 1.4979894965030556, "core_hours": 1.4979894965030556} {"step": 2950, "l2_params": 209.38340635817895, "train/loss": 6.585144400596619, "l2_grads": 2.84375, "lr": 0.0002949, "uptime": 5565.7198283180005, "examples_seen": 3020800.0, "progress": 0.026198236281448985, "epoch": 2.357850303668452, "img/sec/core": 541.9352191861424, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 1.524232895563889, "core_hours": 1.524232895563889} {"step": 3000, "l2_params": 209.47095821718528, "train/loss": 6.313150644302368, "l2_grads": 2.109375, "lr": 0.0002999, "uptime": 5658.554794797999, "examples_seen": 3072000.0, "progress": 0.02664227418452439, "epoch": 2.3978138681374093, "img/sec/core": 551.5163299060481, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 1.5500203862527777, "core_hours": 1.5500203862527777} {"step": 3050, "l2_params": 209.51559772558133, "train/loss": 6.440333127975464, "l2_grads": 1.578125, "lr": 0.0003049, "uptime": 5752.333795541999, "examples_seen": 3123200.0, "progress": 0.027086312087599797, "epoch": 2.437777432606366, "img/sec/core": 545.9644439992165, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 1.5760701086816664, "core_hours": 1.5760701086816664} {"step": 3101, "l2_params": 209.64492959701482, "train/loss": 6.5341551303863525, "l2_grads": 2.390625, "lr": 0.0003099, "uptime": 5845.18022126, "examples_seen": 3174400.0, "progress": 0.027530349990675204, "epoch": 2.4777409970753226, "img/sec/core": 551.4482609756916, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 1.601860782492222, "core_hours": 1.601860782492222} {"step": 3150, "l2_params": 209.74082961285686, "train/loss": 6.56733512878418, "l2_grads": 2.140625, "lr": 0.0003149, "uptime": 5939.11454911, "examples_seen": 3225600.0, "progress": 0.02797438789375061, "epoch": 2.5177045615442797, "img/sec/core": 545.0616528790116, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 1.6279536513394446, "core_hours": 1.6279536513394446} {"step": 3200, "l2_params": 209.8462267674828, "train/loss": 6.137189030647278, "l2_grads": 2.1875, "lr": 0.0003199, "uptime": 6032.632072626, "examples_seen": 3276800.0, "progress": 0.028418425796826016, "epoch": 2.5576681260132363, "img/sec/core": 547.4909736167244, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 1.653930741205, "core_hours": 1.653930741205} {"step": 3250, "l2_params": 209.95826426350536, "train/loss": 6.004402279853821, "l2_grads": 1.5, "lr": 0.00032490000000000004, "uptime": 6126.206545849, "examples_seen": 3328000.0, "progress": 0.028862463699901423, "epoch": 2.597631690482193, "img/sec/core": 547.1577689567544, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 1.679923650433611, "core_hours": 1.679923650433611} {"step": 3300, "l2_params": 210.06837109683676, "train/loss": 6.039193153381348, "l2_grads": 1.9140625, "lr": 0.00032990000000000005, "uptime": 6219.7810245069995, "examples_seen": 3379200.0, "progress": 0.02930650160297683, "epoch": 2.63759525495115, "img/sec/core": 547.1577371766934, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 1.7059165611719442, "core_hours": 1.7059165611719442} {"step": 3350, "l2_params": 210.25331760832603, "train/loss": 5.93924355506897, "l2_grads": 2.453125, "lr": 0.0003349, "uptime": 6313.329685073, "examples_seen": 3430400.0, "progress": 0.029750539506052238, "epoch": 2.6775588194201068, "img/sec/core": 547.3087448844573, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 1.7319023002180558, "core_hours": 1.7319023002180558} {"step": 3400, "l2_params": 210.34548240835716, "train/loss": 5.961772799491882, "l2_grads": 1.6640625, "lr": 0.00033989999999999997, "uptime": 6406.870920915999, "examples_seen": 3481600.0, "progress": 0.03019457740912764, "epoch": 2.717522383889064, "img/sec/core": 547.3521868573034, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 1.7578859768411108, "core_hours": 1.7578859768411108} {"step": 3450, "l2_params": 210.48522853897722, "train/loss": 6.0102821588516235, "l2_grads": 1.90625, "lr": 0.0003449, "uptime": 6499.821574374, "examples_seen": 3532800.0, "progress": 0.03063861531220305, "epoch": 2.7574859483580205, "img/sec/core": 550.8299091531841, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 1.783705602801667, "core_hours": 1.783705602801667} {"step": 3500, "l2_params": 210.62131652327838, "train/loss": 5.9398651123046875, "l2_grads": 2.03125, "lr": 0.0003499, "uptime": 6593.9737908179995, "examples_seen": 3584000.0, "progress": 0.031082653215278457, "epoch": 2.797449512826977, "img/sec/core": 543.8002623172782, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 1.8098589962583334, "core_hours": 1.8098589962583334} {"step": 3550, "l2_params": 210.78937569035747, "train/loss": 5.911717414855957, "l2_grads": 1.78125, "lr": 0.0003549, "uptime": 6686.859120097999, "examples_seen": 3635200.0, "progress": 0.031526691118353864, "epoch": 2.8374130772959343, "img/sec/core": 551.2172955285482, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 1.8356604766138886, "core_hours": 1.8356604766138886} {"step": 3600, "l2_params": 210.90033193953732, "train/loss": 5.828477501869202, "l2_grads": 2.34375, "lr": 0.0003599, "uptime": 6780.667459095999, "examples_seen": 3686400.0, "progress": 0.03197072902142927, "epoch": 2.877376641764891, "img/sec/core": 545.7936953887595, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 1.8617183485577775, "core_hours": 1.8617183485577775} {"step": 3650, "l2_params": 211.0824501249036, "train/loss": 6.5171051025390625, "l2_grads": 1.875, "lr": 0.00036490000000000003, "uptime": 6873.966830027999, "examples_seen": 3737600.0, "progress": 0.03241476692450468, "epoch": 2.9173402062338476, "img/sec/core": 548.7711169812335, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 1.8876348404833332, "core_hours": 1.8876348404833332} {"step": 3700, "l2_params": 211.21817300522702, "train/loss": 6.194607853889465, "l2_grads": 1.9453125, "lr": 0.0003699, "uptime": 6967.387267394, "examples_seen": 3788800.0, "progress": 0.03285880482758008, "epoch": 2.9573037707028047, "img/sec/core": 548.0599475188637, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 1.9135849619738892, "core_hours": 1.9135849619738892} {"step": 3750, "l2_params": 211.39873953798084, "train/loss": 5.875433564186096, "l2_grads": 1.8828125, "lr": 0.0003749, "uptime": 7060.863945498, "examples_seen": 3840000.0, "progress": 0.03330284273065549, "epoch": 2.9972673351717614, "img/sec/core": 547.7302043514658, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 1.9395507058916668, "core_hours": 1.9395507058916668} {"step": 3800, "l2_params": 211.64301123810495, "train/loss": 5.971150636672974, "l2_grads": 1.984375, "lr": 0.0003799, "uptime": 7154.354507562, "examples_seen": 3891200.0, "progress": 0.033746880633730894, "epoch": 3.037230899640718, "img/sec/core": 547.6488628333453, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 1.9655203064650002, "core_hours": 1.9655203064650002} {"step": 3851, "l2_params": 211.80320635161593, "train/loss": 6.5460532903671265, "l2_grads": 2.34375, "lr": 0.00038490000000000003, "uptime": 7247.799266443, "examples_seen": 3942400.0, "progress": 0.0341909185368063, "epoch": 3.077194464109675, "img/sec/core": 547.9173001580776, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 1.9914771839319445, "core_hours": 1.9914771839319445} {"step": 3900, "l2_params": 211.97751066293677, "train/loss": 5.79978883266449, "l2_grads": 1.5625, "lr": 0.00038990000000000004, "uptime": 7341.718325137999, "examples_seen": 3993600.0, "progress": 0.03463495643988171, "epoch": 3.117158028578632, "img/sec/core": 545.150267809555, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 2.017565811347222, "core_hours": 2.017565811347222} {"step": 3950, "l2_params": 212.15169402594026, "train/loss": 6.271235108375549, "l2_grads": 1.7109375, "lr": 0.0003949, "uptime": 7436.1067443209995, "examples_seen": 4044800.0, "progress": 0.035078994342957116, "epoch": 3.1571215930475884, "img/sec/core": 542.4394268192316, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 2.0437848166758332, "core_hours": 2.0437848166758332} {"step": 4000, "l2_params": 212.317341144877, "train/loss": 5.8193511962890625, "l2_grads": 1.4453125, "lr": 0.00039989999999999996, "uptime": 7529.211817198, "examples_seen": 4096000.0, "progress": 0.035523032246032524, "epoch": 3.1970851575165455, "img/sec/core": 549.9163302051156, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 2.0696473369194446, "core_hours": 2.0696473369194446} {"step": 4050, "l2_params": 212.49488619765947, "train/loss": 5.776368975639343, "l2_grads": 1.9609375, "lr": 0.0004049, "uptime": 7623.751285266, "examples_seen": 4147200.0, "progress": 0.03596707014910793, "epoch": 3.237048721985502, "img/sec/core": 541.572753119078, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 2.0959083002716667, "core_hours": 2.0959083002716667} {"step": 4100, "l2_params": 212.7132119132729, "train/loss": 6.173025727272034, "l2_grads": 1.4765625, "lr": 0.0004099, "uptime": 7716.86988563, "examples_seen": 4198400.0, "progress": 0.03641110805218333, "epoch": 3.2770122864544593, "img/sec/core": 549.8364429862537, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 2.1217745781505557, "core_hours": 2.1217745781505557} {"step": 4150, "l2_params": 212.87615088411002, "train/loss": 6.276281118392944, "l2_grads": 2.015625, "lr": 0.0004149, "uptime": 7811.390791733, "examples_seen": 4249600.0, "progress": 0.03685514595525874, "epoch": 3.316975850923416, "img/sec/core": 541.6791068867562, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 2.148030385401389, "core_hours": 2.148030385401389} {"step": 4200, "l2_params": 213.05070830457717, "train/loss": 6.196481823921204, "l2_grads": 1.5703125, "lr": 0.0004199, "uptime": 7905.6806502300005, "examples_seen": 4300800.0, "progress": 0.037299183858334146, "epoch": 3.3569394153923726, "img/sec/core": 543.0064358578777, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 2.1742220127616667, "core_hours": 2.1742220127616667} {"step": 4250, "l2_params": 213.267507355442, "train/loss": 5.6738317012786865, "l2_grads": 1.734375, "lr": 0.00042490000000000003, "uptime": 7999.8460541019995, "examples_seen": 4352000.0, "progress": 0.037743221761409554, "epoch": 3.3969029798613297, "img/sec/core": 543.724105613111, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 2.200379069392778, "core_hours": 2.200379069392778} {"step": 4300, "l2_params": 213.50744122797406, "train/loss": 5.729138374328613, "l2_grads": 1.7421875, "lr": 0.0004299, "uptime": 8093.814674682999, "examples_seen": 4403200.0, "progress": 0.03818725966448496, "epoch": 3.4368665443302864, "img/sec/core": 544.8627391083861, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 2.226481463998611, "core_hours": 2.226481463998611} {"step": 4350, "l2_params": 213.72833477671082, "train/loss": 6.495797753334045, "l2_grads": 1.6640625, "lr": 0.0004349, "uptime": 8188.1465573820005, "examples_seen": 4454400.0, "progress": 0.03863129756756037, "epoch": 3.476830108799243, "img/sec/core": 542.764530242349, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 2.2526847647483335, "core_hours": 2.2526847647483335} {"step": 4400, "l2_params": 213.93732554244457, "train/loss": 5.6654052734375, "l2_grads": 1.671875, "lr": 0.0004399, "uptime": 8282.07590346, "examples_seen": 4505600.0, "progress": 0.039075335470635776, "epoch": 3.5167936732682, "img/sec/core": 545.0905615533983, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 2.2787762497699995, "core_hours": 2.2787762497699995} {"step": 4450, "l2_params": 214.09473219069787, "train/loss": 5.790745377540588, "l2_grads": 1.9453125, "lr": 0.0004449, "uptime": 8375.797256124, "examples_seen": 4556800.0, "progress": 0.03951937337371118, "epoch": 3.556757237737157, "img/sec/core": 546.3002671713082, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 2.3048099588433333, "core_hours": 2.3048099588433333} {"step": 4500, "l2_params": 214.31267094820848, "train/loss": 6.129344820976257, "l2_grads": 1.359375, "lr": 0.00044990000000000004, "uptime": 8468.717184221, "examples_seen": 4608000.0, "progress": 0.039963411276786584, "epoch": 3.5967208022061135, "img/sec/core": 551.0120492834702, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 2.3306210499813886, "core_hours": 2.3306210499813886} {"step": 4550, "l2_params": 214.58880341998895, "train/loss": 5.621910095214844, "l2_grads": 1.59375, "lr": 0.00045490000000000005, "uptime": 8563.063544964, "examples_seen": 4659200.0, "progress": 0.04040744917986199, "epoch": 3.6366843666750706, "img/sec/core": 542.6812396025417, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 2.35682837241, "core_hours": 2.35682837241} {"step": 4600, "l2_params": 214.76912411322834, "train/loss": 5.71711802482605, "l2_grads": 1.7890625, "lr": 0.0004599, "uptime": 8655.980487036, "examples_seen": 4710400.0, "progress": 0.0408514870829374, "epoch": 3.676647931144027, "img/sec/core": 551.0297568803477, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 2.3826386340966663, "core_hours": 2.3826386340966663} {"step": 4650, "l2_params": 215.02594157007127, "train/loss": 6.2231467962265015, "l2_grads": 1.6640625, "lr": 0.00046489999999999997, "uptime": 8750.135854077, "examples_seen": 4761600.0, "progress": 0.041295524986012806, "epoch": 3.7166114956129843, "img/sec/core": 543.7820658455429, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 2.408792902719166, "core_hours": 2.408792902719166} {"step": 4700, "l2_params": 215.2547109267806, "train/loss": 6.154559850692749, "l2_grads": 1.3203125, "lr": 0.0004699, "uptime": 8843.191988278999, "examples_seen": 4812800.0, "progress": 0.041739562889088214, "epoch": 3.756575060081941, "img/sec/core": 550.2055338862342, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 2.4346418288863885, "core_hours": 2.4346418288863885} {"step": 4750, "l2_params": 215.38808854373409, "train/loss": 5.582153558731079, "l2_grads": 1.453125, "lr": 0.0004749, "uptime": 8937.972314585999, "examples_seen": 4864000.0, "progress": 0.04218360079216362, "epoch": 3.7965386245508976, "img/sec/core": 540.1964943036774, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 2.4609696973049995, "core_hours": 2.4609696973049995} {"step": 4800, "l2_params": 215.68603210922464, "train/loss": 5.60210919380188, "l2_grads": 1.578125, "lr": 0.0004799, "uptime": 9031.891876459, "examples_seen": 4915200.0, "progress": 0.04262763869523903, "epoch": 3.8365021890198547, "img/sec/core": 545.1473471440721, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 2.4870584644919442, "core_hours": 2.4870584644919442} {"step": 4850, "l2_params": 215.9257625586244, "train/loss": 5.632081985473633, "l2_grads": 1.53125, "lr": 0.0004849, "uptime": 9124.896679004, "examples_seen": 4966400.0, "progress": 0.04307167659831443, "epoch": 3.8764657534888114, "img/sec/core": 550.509205965222, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 2.512893131865555, "core_hours": 2.512893131865555} {"step": 4900, "l2_params": 216.15835841596765, "train/loss": 5.6318395137786865, "l2_grads": 1.421875, "lr": 0.0004899, "uptime": 9218.342372879999, "examples_seen": 5017600.0, "progress": 0.043515714501389836, "epoch": 3.916429317957768, "img/sec/core": 547.911817830165, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 2.538850269053333, "core_hours": 2.538850269053333} {"step": 4950, "l2_params": 216.42523883014556, "train/loss": 5.47230339050293, "l2_grads": 1.75, "lr": 0.0004949, "uptime": 9312.451566677999, "examples_seen": 5068800.0, "progress": 0.043959752404465244, "epoch": 3.956392882426725, "img/sec/core": 544.0488642363453, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 2.5649917117749994, "core_hours": 2.5649917117749994} {"step": 5000, "l2_params": 216.65960230339127, "train/loss": 5.437730193138123, "l2_grads": 1.4453125, "lr": 0.0004999000000000001, "uptime": 9405.972115751, "examples_seen": 5120000.0, "progress": 0.04440379030754065, "epoch": 3.996356446895682, "img/sec/core": 547.4732613046809, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 2.590969642073055, "core_hours": 2.590969642073055, "val/acc@1": 0.11356026785714286, "val/loss": 4.886652255544857, "z/secs/eval/val": 32.29485458399904} {"step": 5050, "l2_params": 216.9512325634289, "train/loss": 5.543553352355957, "l2_grads": 1.6015625, "lr": 0.0005049000000000001, "uptime": 9531.296599522999, "examples_seen": 5171200.0, "progress": 0.04484782821061606, "epoch": 4.036320011364639, "img/sec/core": 408.5394845363754, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 2.625781998676388, "core_hours": 2.625781998676388} {"step": 5100, "l2_params": 217.23798845489637, "train/loss": 5.441771745681763, "l2_grads": 1.8203125, "lr": 0.0005099, "uptime": 9624.483154615, "examples_seen": 5222400.0, "progress": 0.045291866113691466, "epoch": 4.076283575833595, "img/sec/core": 549.4354840078737, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 2.651667152868611, "core_hours": 2.651667152868611} {"step": 5150, "l2_params": 217.51056387667523, "train/loss": 6.3921799659729, "l2_grads": 1.3984375, "lr": 0.0005149, "uptime": 9718.781610464, "examples_seen": 5273600.0, "progress": 0.04573590401676687, "epoch": 4.116247140302552, "img/sec/core": 542.9569290295286, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 2.677861168382222, "core_hours": 2.677861168382222} {"step": 5200, "l2_params": 217.76660590461705, "train/loss": 5.642182946205139, "l2_grads": 1.734375, "lr": 0.0005199, "uptime": 9812.563974982999, "examples_seen": 5324800.0, "progress": 0.04617994191984228, "epoch": 4.156210704771509, "img/sec/core": 545.944861409716, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 2.703911825193055, "core_hours": 2.703911825193055} {"step": 5250, "l2_params": 218.0751656254073, "train/loss": 5.489780426025391, "l2_grads": 1.4921875, "lr": 0.0005249, "uptime": 9906.33552666, "examples_seen": 5376000.0, "progress": 0.04662397982291768, "epoch": 4.1961742692404655, "img/sec/core": 546.0078145700342, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 2.7299594784366663, "core_hours": 2.7299594784366663} {"step": 5300, "l2_params": 218.298709707951, "train/loss": 5.577523350715637, "l2_grads": 1.4921875, "lr": 0.0005299, "uptime": 9999.990479324999, "examples_seen": 5427200.0, "progress": 0.04706801772599309, "epoch": 4.236137833709423, "img/sec/core": 546.6875861134705, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 2.755974743065833, "core_hours": 2.755974743065833} {"step": 5350, "l2_params": 218.58119470342942, "train/loss": 5.454126000404358, "l2_grads": 1.5, "lr": 0.0005349, "uptime": 10093.707487085, "examples_seen": 5478400.0, "progress": 0.047512055629068496, "epoch": 4.27610139817838, "img/sec/core": 546.3255947214827, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 2.782007245221388, "core_hours": 2.782007245221388} {"step": 5400, "l2_params": 218.85881800937102, "train/loss": 5.663575649261475, "l2_grads": 1.6796875, "lr": 0.0005399000000000001, "uptime": 10187.382280878, "examples_seen": 5529600.0, "progress": 0.047956093532143904, "epoch": 4.316064962647336, "img/sec/core": 546.571792974956, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 2.8080280212749997, "core_hours": 2.8080280212749997} {"step": 5450, "l2_params": 219.20022954163053, "train/loss": 5.3195167779922485, "l2_grads": 1.6796875, "lr": 0.0005449000000000001, "uptime": 10281.212453815, "examples_seen": 5580800.0, "progress": 0.04840013143521931, "epoch": 4.356028527116293, "img/sec/core": 545.6666911866104, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 2.8340919582019444, "core_hours": 2.8340919582019444} {"step": 5500, "l2_params": 219.48406006931737, "train/loss": 5.670673370361328, "l2_grads": 1.5859375, "lr": 0.0005499000000000001, "uptime": 10375.807136194999, "examples_seen": 5632000.0, "progress": 0.04884416933829472, "epoch": 4.39599209158525, "img/sec/core": 541.2566405617096, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 2.860368258863055, "core_hours": 2.860368258863055} {"step": 5550, "l2_params": 219.75376060835382, "train/loss": 5.277057409286499, "l2_grads": 1.875, "lr": 0.0005549, "uptime": 10469.559592251999, "examples_seen": 5683200.0, "progress": 0.049288207241370126, "epoch": 4.435955656054206, "img/sec/core": 546.1190261391254, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 2.886410607767777, "core_hours": 2.886410607767777} {"step": 5600, "l2_params": 220.11653782069163, "train/loss": 5.279862761497498, "l2_grads": 1.4375, "lr": 0.0005599, "uptime": 10564.247375810999, "examples_seen": 5734400.0, "progress": 0.04973224514444553, "epoch": 4.4759192205231635, "img/sec/core": 540.7244533091969, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 2.9127127698674995, "core_hours": 2.9127127698674995} {"step": 5650, "l2_params": 220.40596608638936, "train/loss": 5.474686503410339, "l2_grads": 1.8515625, "lr": 0.0005649, "uptime": 10658.536149006999, "examples_seen": 5785600.0, "progress": 0.050176283047520934, "epoch": 4.515882784992121, "img/sec/core": 543.0126860763108, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 2.9389040957552774, "core_hours": 2.9389040957552774} {"step": 5700, "l2_params": 220.7018059280272, "train/loss": 5.493955373764038, "l2_grads": 1.9609375, "lr": 0.0005698999999999999, "uptime": 10752.545453378, "examples_seen": 5836800.0, "progress": 0.05062032095059634, "epoch": 4.555846349461078, "img/sec/core": 544.6269424347959, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 2.965017791413888, "core_hours": 2.965017791413888} {"step": 5750, "l2_params": 220.9928243861682, "train/loss": 5.197087645530701, "l2_grads": 1.4140625, "lr": 0.0005748999999999999, "uptime": 10846.495962963, "examples_seen": 5888000.0, "progress": 0.05106435885367175, "epoch": 4.595809913930034, "img/sec/core": 544.9677732048676, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 2.9911151551874995, "core_hours": 2.9911151551874995} {"step": 5800, "l2_params": 221.29715025489483, "train/loss": 5.268111228942871, "l2_grads": 1.6171875, "lr": 0.0005799, "uptime": 10940.68320311, "examples_seen": 5939200.0, "progress": 0.051508396756747156, "epoch": 4.635773478398991, "img/sec/core": 543.5980491634598, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 3.0172782774505555, "core_hours": 3.0172782774505555} {"step": 5850, "l2_params": 221.6596214761921, "train/loss": 5.233166456222534, "l2_grads": 1.640625, "lr": 0.0005849, "uptime": 11035.107427666, "examples_seen": 5990400.0, "progress": 0.05195243465982256, "epoch": 4.675737042867948, "img/sec/core": 542.2337354715046, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 3.043507228716111, "core_hours": 3.043507228716111} {"step": 5900, "l2_params": 221.96286291226068, "train/loss": 5.272388577461243, "l2_grads": 1.546875, "lr": 0.0005899, "uptime": 11128.256257048, "examples_seen": 6041600.0, "progress": 0.05239647256289797, "epoch": 4.715700607336904, "img/sec/core": 549.6580079394288, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 3.0693819035444445, "core_hours": 3.0693819035444445} {"step": 5950, "l2_params": 222.34244443573127, "train/loss": 6.399750113487244, "l2_grads": 1.2265625, "lr": 0.0005949, "uptime": 11222.219559678999, "examples_seen": 6092800.0, "progress": 0.05284051046597338, "epoch": 4.755664171805861, "img/sec/core": 544.8935761769313, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 3.0954828209419443, "core_hours": 3.0954828209419443} {"step": 6000, "l2_params": 222.63568147868946, "train/loss": 5.301631450653076, "l2_grads": 2.421875, "lr": 0.0005999, "uptime": 11315.324415973, "examples_seen": 6144000.0, "progress": 0.05328454836904878, "epoch": 4.7956277362748185, "img/sec/core": 549.9176094351456, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 3.121345281023611, "core_hours": 3.121345281023611} {"step": 6050, "l2_params": 222.98697559314914, "train/loss": 5.152811765670776, "l2_grads": 1.7109375, "lr": 0.0006049, "uptime": 11408.4627535, "examples_seen": 6195200.0, "progress": 0.053728586272124186, "epoch": 4.835591300743775, "img/sec/core": 549.7199258592918, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 3.1472170414477776, "core_hours": 3.1472170414477776} {"step": 6100, "l2_params": 223.2839794379185, "train/loss": 5.176834344863892, "l2_grads": 1.59375, "lr": 0.0006099, "uptime": 11501.607854912, "examples_seen": 6246400.0, "progress": 0.054172624175199593, "epoch": 4.875554865212732, "img/sec/core": 549.6800070411883, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 3.1730906807288886, "core_hours": 3.1730906807288886} {"step": 6150, "l2_params": 223.64815763400765, "train/loss": 5.161349058151245, "l2_grads": 1.546875, "lr": 0.0006149, "uptime": 11594.361535109, "examples_seen": 6297600.0, "progress": 0.054616662078275, "epoch": 4.915518429681689, "img/sec/core": 551.9996607278123, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 3.1988555918947217, "core_hours": 3.1988555918947217} {"step": 6200, "l2_params": 223.94910969984133, "train/loss": 5.222040176391602, "l2_grads": 1.703125, "lr": 0.0006199, "uptime": 11687.073492312, "examples_seen": 6348800.0, "progress": 0.05506069998135041, "epoch": 4.955481994150645, "img/sec/core": 552.2480761342717, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 3.2246089133399995, "core_hours": 3.2246089133399995} {"step": 6250, "l2_params": 224.3029113063578, "train/loss": 5.0808398723602295, "l2_grads": 1.34375, "lr": 0.0006249000000000001, "uptime": 11779.729427238, "examples_seen": 6400000.0, "progress": 0.055504737884425816, "epoch": 4.995445558619602, "img/sec/core": 552.5819802141197, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 3.250346673041667, "core_hours": 3.250346673041667} {"step": 6300, "l2_params": 224.65173635858187, "train/loss": 5.120813250541687, "l2_grads": 1.8203125, "lr": 0.0006299000000000001, "uptime": 11872.435139125, "examples_seen": 6451200.0, "progress": 0.05594877578750122, "epoch": 5.035409123088559, "img/sec/core": 552.285279491822, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 3.276098259676944, "core_hours": 3.276098259676944} {"step": 6350, "l2_params": 224.99098262095347, "train/loss": 5.557651519775391, "l2_grads": 1.359375, "lr": 0.0006349, "uptime": 11965.115794504, "examples_seen": 6502400.0, "progress": 0.05639281369057663, "epoch": 5.075372687557516, "img/sec/core": 552.4345915620437, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 3.3018428861711104, "core_hours": 3.3018428861711104} {"step": 6400, "l2_params": 225.28986022048144, "train/loss": 5.671110987663269, "l2_grads": 1.5625, "lr": 0.0006399, "uptime": 12057.815020328, "examples_seen": 6553600.0, "progress": 0.05683685159365203, "epoch": 5.115336252026473, "img/sec/core": 552.3239222861325, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 3.3275926711222223, "core_hours": 3.3275926711222223} {"step": 6450, "l2_params": 225.70814952545916, "train/loss": 4.998944640159607, "l2_grads": 1.5078125, "lr": 0.0006449, "uptime": 12150.472979514001, "examples_seen": 6604800.0, "progress": 0.05728088949672744, "epoch": 5.15529981649543, "img/sec/core": 552.569908184806, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 3.3533309931183335, "core_hours": 3.3533309931183335} {"step": 6500, "l2_params": 226.0593848062592, "train/loss": 5.12208092212677, "l2_grads": 1.6796875, "lr": 0.0006499, "uptime": 12243.091376312, "examples_seen": 6656000.0, "progress": 0.057724927399802846, "epoch": 5.195263380964386, "img/sec/core": 552.8059410450282, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 3.379058325562222, "core_hours": 3.379058325562222} {"step": 6550, "l2_params": 226.4013915325845, "train/loss": 5.278810620307922, "l2_grads": 1.328125, "lr": 0.0006549, "uptime": 12335.763149045, "examples_seen": 6707200.0, "progress": 0.05816896530287825, "epoch": 5.235226945433343, "img/sec/core": 552.4875427549482, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 3.404800484654722, "core_hours": 3.404800484654722} {"step": 6600, "l2_params": 226.76902211741762, "train/loss": 5.376396656036377, "l2_grads": 1.3671875, "lr": 0.0006599, "uptime": 12428.362127068001, "examples_seen": 6758400.0, "progress": 0.05861300320595366, "epoch": 5.2751905099023, "img/sec/core": 552.9218690435458, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 3.4305224229944447, "core_hours": 3.4305224229944447} {"step": 6650, "l2_params": 227.13185276406975, "train/loss": 5.1128658056259155, "l2_grads": 1.5546875, "lr": 0.0006649000000000001, "uptime": 12520.953865213, "examples_seen": 6809600.0, "progress": 0.05905704110902907, "epoch": 5.315154074371256, "img/sec/core": 552.9651027807807, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 3.456242350256944, "core_hours": 3.456242350256944} {"step": 6700, "l2_params": 227.533591135935, "train/loss": 6.413294792175293, "l2_grads": 1.6875, "lr": 0.0006699000000000001, "uptime": 12613.650583237999, "examples_seen": 6860800.0, "progress": 0.059501079012104476, "epoch": 5.3551176388402135, "img/sec/core": 552.3388647502261, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 3.4819914385972215, "core_hours": 3.4819914385972215} {"step": 6750, "l2_params": 227.89942601170554, "train/loss": 5.104199528694153, "l2_grads": 1.5625, "lr": 0.0006749000000000001, "uptime": 12706.214385249, "examples_seen": 6912000.0, "progress": 0.05994511691517988, "epoch": 5.395081203309171, "img/sec/core": 553.1319899102085, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 3.5077036058225, "core_hours": 3.5077036058225} {"step": 6800, "l2_params": 228.33944089568647, "train/loss": 5.065725803375244, "l2_grads": 1.28125, "lr": 0.0006799, "uptime": 12798.747604157, "examples_seen": 6963200.0, "progress": 0.06038915481825528, "epoch": 5.435044767778128, "img/sec/core": 553.3148052582605, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 3.533407277741389, "core_hours": 3.533407277741389} {"step": 6850, "l2_params": 228.72601626211375, "train/loss": 5.239918351173401, "l2_grads": 1.4296875, "lr": 0.0006849, "uptime": 12891.253855985, "examples_seen": 7014400.0, "progress": 0.06083319272133069, "epoch": 5.475008332247084, "img/sec/core": 553.4761055414754, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 3.559103458804722, "core_hours": 3.559103458804722} {"step": 6900, "l2_params": 229.14684708032854, "train/loss": 4.9919188022613525, "l2_grads": 1.8671875, "lr": 0.0006899, "uptime": 12983.727625427, "examples_seen": 7065600.0, "progress": 0.0612772306244061, "epoch": 5.514971896716041, "img/sec/core": 553.6705198560427, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 3.5847906169830552, "core_hours": 3.5847906169830552} {"step": 6950, "l2_params": 229.5581148654648, "train/loss": 5.903771996498108, "l2_grads": 1.1640625, "lr": 0.0006948999999999999, "uptime": 13076.249635265998, "examples_seen": 7116800.0, "progress": 0.061721268527481506, "epoch": 5.554935461184998, "img/sec/core": 553.3818395114359, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 3.610491175271666, "core_hours": 3.610491175271666} {"step": 7001, "l2_params": 229.9207489141639, "train/loss": 5.606208443641663, "l2_grads": 1.2109375, "lr": 0.0006998999999999999, "uptime": 13168.750386570999, "examples_seen": 7168000.0, "progress": 0.06216530643055691, "epoch": 5.594899025653954, "img/sec/core": 553.5090177935907, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 3.636185828411944, "core_hours": 3.636185828411944} {"step": 7050, "l2_params": 230.3742122046775, "train/loss": 6.322555065155029, "l2_grads": 1.21875, "lr": 0.0007049, "uptime": 13261.48165228, "examples_seen": 7219200.0, "progress": 0.06260934433363231, "epoch": 5.6348625901229115, "img/sec/core": 552.1330870288173, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 3.6619445133311106, "core_hours": 3.6619445133311106} {"step": 7100, "l2_params": 230.75309419055603, "train/loss": 4.902190685272217, "l2_grads": 1.6015625, "lr": 0.0007099, "uptime": 13354.012959503998, "examples_seen": 7270400.0, "progress": 0.06305338223670773, "epoch": 5.674826154591869, "img/sec/core": 553.3262366655604, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 3.687647654226666, "core_hours": 3.687647654226666} {"step": 7150, "l2_params": 231.1442538257444, "train/loss": 4.8130784034729, "l2_grads": 1.734375, "lr": 0.0007149, "uptime": 13446.580173848, "examples_seen": 7321600.0, "progress": 0.06349742013978313, "epoch": 5.714789719060825, "img/sec/core": 553.1115996396767, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 3.713360769322222, "core_hours": 3.713360769322222} {"step": 7200, "l2_params": 231.5820968428367, "train/loss": 4.914934873580933, "l2_grads": 1.7421875, "lr": 0.0007199, "uptime": 13539.047351271998, "examples_seen": 7372800.0, "progress": 0.06394145804285854, "epoch": 5.754753283529782, "img/sec/core": 553.7099912245423, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 3.7390460963844436, "core_hours": 3.7390460963844436} {"step": 7250, "l2_params": 231.95494431334342, "train/loss": 6.011101007461548, "l2_grads": 1.4609375, "lr": 0.0007249, "uptime": 13631.561541583, "examples_seen": 7424000.0, "progress": 0.06438549594593394, "epoch": 5.794716847998739, "img/sec/core": 553.4286127120912, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 3.7647444825819445, "core_hours": 3.7647444825819445} {"step": 7300, "l2_params": 232.37877830482995, "train/loss": 5.275770664215088, "l2_grads": 1.6328125, "lr": 0.0007299, "uptime": 13724.063733384999, "examples_seen": 7475200.0, "progress": 0.06482953384900936, "epoch": 5.834680412467695, "img/sec/core": 553.5003982348167, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 3.7904395358602776, "core_hours": 3.7904395358602776} {"step": 7350, "l2_params": 232.81453124113892, "train/loss": 5.785489320755005, "l2_grads": 1.1875, "lr": 0.0007349, "uptime": 13816.595854701998, "examples_seen": 7526400.0, "progress": 0.06527357175208476, "epoch": 5.874643976936652, "img/sec/core": 553.3213685288551, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 3.816142902892777, "core_hours": 3.816142902892777} {"step": 7400, "l2_params": 233.25387717210685, "train/loss": 5.524191498756409, "l2_grads": 1.2265625, "lr": 0.0007399, "uptime": 13909.084935683, "examples_seen": 7577600.0, "progress": 0.06571760965516016, "epoch": 5.914607541405609, "img/sec/core": 553.5788598712186, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 3.841834314276389, "core_hours": 3.841834314276389} {"step": 7450, "l2_params": 233.66688576042725, "train/loss": 5.150023341178894, "l2_grads": 1.578125, "lr": 0.0007449000000000001, "uptime": 14001.564660611999, "examples_seen": 7628800.0, "progress": 0.06616164755823557, "epoch": 5.954571105874566, "img/sec/core": 553.6348647155778, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 3.8675231267566663, "core_hours": 3.8675231267566663} {"step": 7500, "l2_params": 234.16011451251816, "train/loss": 5.851511001586914, "l2_grads": 1.2734375, "lr": 0.0007499000000000001, "uptime": 14094.076509076, "examples_seen": 7680000.0, "progress": 0.06660568546131097, "epoch": 5.994534670343523, "img/sec/core": 553.4426222163702, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 3.893220862441111, "core_hours": 3.893220862441111, "val/acc@1": 0.21291055484693877, "val/loss": 4.004948556423187, "z/secs/eval/val": 31.51998823199756} {"step": 7550, "l2_params": 234.6182495511825, "train/loss": 5.967741250991821, "l2_grads": 1.21875, "lr": 0.0007549000000000001, "uptime": 14217.771079035, "examples_seen": 7731200.0, "progress": 0.06704972336438639, "epoch": 6.03449823481248, "img/sec/core": 413.92277783067584, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 3.9275804652074995, "core_hours": 3.9275804652074995} {"step": 7600, "l2_params": 235.04147739016193, "train/loss": 4.593119263648987, "l2_grads": 1.5703125, "lr": 0.0007599, "uptime": 14310.161035057, "examples_seen": 7782400.0, "progress": 0.06749376126746179, "epoch": 6.074461799281436, "img/sec/core": 554.1727932829335, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 3.953244341880278, "core_hours": 3.953244341880278} {"step": 7650, "l2_params": 235.46812349576575, "train/loss": 4.953213572502136, "l2_grads": 1.4140625, "lr": 0.0007649, "uptime": 14402.578509726001, "examples_seen": 7833600.0, "progress": 0.0679377991705372, "epoch": 6.114425363750393, "img/sec/core": 554.0077802750648, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 3.978915862621667, "core_hours": 3.978915862621667} {"step": 7700, "l2_params": 235.9531542302644, "train/loss": 5.283560037612915, "l2_grads": 1.4375, "lr": 0.0007699, "uptime": 14495.035726716, "examples_seen": 7884800.0, "progress": 0.0683818370736126, "epoch": 6.15438892821935, "img/sec/core": 553.7696425097737, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 4.004598422896667, "core_hours": 4.004598422896667} {"step": 7750, "l2_params": 236.28955857837659, "train/loss": 5.0648432970047, "l2_grads": 1.578125, "lr": 0.0007749, "uptime": 14587.47622071, "examples_seen": 7936000.0, "progress": 0.068825874976688, "epoch": 6.1943524926883065, "img/sec/core": 553.8698224970916, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 4.030276337895, "core_hours": 4.030276337895} {"step": 7800, "l2_params": 236.70544491280125, "train/loss": 6.317407131195068, "l2_grads": 1.1328125, "lr": 0.0007799, "uptime": 14679.911409272001, "examples_seen": 7987200.0, "progress": 0.06926991287976342, "epoch": 6.234316057157264, "img/sec/core": 553.9016125407387, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 4.055952779162222, "core_hours": 4.055952779162222} {"step": 7850, "l2_params": 237.1923346427562, "train/loss": 4.727930426597595, "l2_grads": 1.5625, "lr": 0.0007849, "uptime": 14772.361408483, "examples_seen": 8038400.0, "progress": 0.06971395078283882, "epoch": 6.274279621626221, "img/sec/core": 553.8128765490387, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 4.081633334498611, "core_hours": 4.081633334498611} {"step": 7900, "l2_params": 237.75415959615393, "train/loss": 5.701470494270325, "l2_grads": 1.265625, "lr": 0.0007899000000000001, "uptime": 14864.796777544001, "examples_seen": 8089600.0, "progress": 0.07015798868591423, "epoch": 6.314243186095177, "img/sec/core": 553.9005309343415, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 4.107309825904445, "core_hours": 4.107309825904445} {"step": 7950, "l2_params": 238.19282913752684, "train/loss": 4.879296779632568, "l2_grads": 1.421875, "lr": 0.0007949000000000001, "uptime": 14957.226475139, "examples_seen": 8140800.0, "progress": 0.07060202658898963, "epoch": 6.354206750564134, "img/sec/core": 553.934518149615, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 4.132984741903055, "core_hours": 4.132984741903055} {"step": 8000, "l2_params": 238.70193959579984, "train/loss": 4.754421830177307, "l2_grads": 1.5234375, "lr": 0.0007999000000000001, "uptime": 15049.661760025, "examples_seen": 8192000.0, "progress": 0.07104606449206505, "epoch": 6.394170315033091, "img/sec/core": 553.9010353367202, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 4.158661209926944, "core_hours": 4.158661209926944} {"step": 8050, "l2_params": 239.14746141404314, "train/loss": 4.574748992919922, "l2_grads": 1.5390625, "lr": 0.0008049, "uptime": 15142.296924587, "examples_seen": 8243200.0, "progress": 0.07149010239514045, "epoch": 6.434133879502048, "img/sec/core": 552.7058784003277, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 4.184393200083056, "core_hours": 4.184393200083056} {"step": 8100, "l2_params": 239.61716241013366, "train/loss": 4.663712501525879, "l2_grads": 1.671875, "lr": 0.0008099, "uptime": 15234.701932429998, "examples_seen": 8294400.0, "progress": 0.07193414029821586, "epoch": 6.474097443971004, "img/sec/core": 554.0825242609411, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 4.210061257817221, "core_hours": 4.210061257817221} {"step": 8150, "l2_params": 240.08998531759855, "train/loss": 5.266080856323242, "l2_grads": 1.4375, "lr": 0.0008149, "uptime": 15327.154479828998, "examples_seen": 8345600.0, "progress": 0.07237817820129126, "epoch": 6.5140610084399615, "img/sec/core": 553.7976122933087, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 4.23574252098361, "core_hours": 4.23574252098361} {"step": 8200, "l2_params": 240.5991313712532, "train/loss": 4.681001543998718, "l2_grads": 1.5859375, "lr": 0.0008198999999999999, "uptime": 15419.572282295998, "examples_seen": 8396800.0, "progress": 0.07282221610436666, "epoch": 6.554024572908919, "img/sec/core": 554.0058152571004, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 4.26141413278, "core_hours": 4.26141413278} {"step": 8250, "l2_params": 241.0864556070051, "train/loss": 4.731106996536255, "l2_grads": 1.296875, "lr": 0.0008248999999999999, "uptime": 15512.016706364, "examples_seen": 8448000.0, "progress": 0.07326625400744208, "epoch": 6.593988137377875, "img/sec/core": 553.8462759239778, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 4.287093139465555, "core_hours": 4.287093139465555} {"step": 8300, "l2_params": 241.56058274627247, "train/loss": 5.235134124755859, "l2_grads": 1.375, "lr": 0.0008299, "uptime": 15604.440332307, "examples_seen": 8499200.0, "progress": 0.07371029191051748, "epoch": 6.633951701846832, "img/sec/core": 553.970908169913, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 4.312766368894166, "core_hours": 4.312766368894166} {"step": 8350, "l2_params": 242.02145013245985, "train/loss": 4.609705567359924, "l2_grads": 1.421875, "lr": 0.0008349, "uptime": 15696.887076181, "examples_seen": 8550400.0, "progress": 0.07415432981359289, "epoch": 6.673915266315789, "img/sec/core": 553.8323780206173, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 4.338446019970277, "core_hours": 4.338446019970277} {"step": 8400, "l2_params": 242.5185987753375, "train/loss": 4.54434597492218, "l2_grads": 1.5234375, "lr": 0.0008399, "uptime": 15789.320716514001, "examples_seen": 8601600.0, "progress": 0.07459836771666829, "epoch": 6.713878830784745, "img/sec/core": 553.9108901861567, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 4.364122031173889, "core_hours": 4.364122031173889} {"step": 8450, "l2_params": 243.00653318562948, "train/loss": 5.228797078132629, "l2_grads": 1.2734375, "lr": 0.0008449, "uptime": 15881.697927218, "examples_seen": 8652800.0, "progress": 0.07504240561974371, "epoch": 6.753842395253702, "img/sec/core": 554.2492527086423, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 4.389782367480555, "core_hours": 4.389782367480555} {"step": 8500, "l2_params": 243.54270106330623, "train/loss": 4.703230381011963, "l2_grads": 1.5859375, "lr": 0.0008499, "uptime": 15974.068719553, "examples_seen": 8704000.0, "progress": 0.07548644352281911, "epoch": 6.793805959722659, "img/sec/core": 554.2877646249146, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 4.415440920906945, "core_hours": 4.415440920906945} {"step": 8550, "l2_params": 243.97526524980137, "train/loss": 4.985008716583252, "l2_grads": 1.3828125, "lr": 0.0008549, "uptime": 16066.446721519998, "examples_seen": 8755200.0, "progress": 0.07593048142589451, "epoch": 6.833769524191616, "img/sec/core": 554.2445052913293, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 4.441101477008888, "core_hours": 4.441101477008888} {"step": 8600, "l2_params": 244.5175952157987, "train/loss": 4.61015522480011, "l2_grads": 1.40625, "lr": 0.0008599, "uptime": 16158.845288585999, "examples_seen": 8806400.0, "progress": 0.07637451932896992, "epoch": 6.873733088660573, "img/sec/core": 554.1211473921212, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 4.466767745638333, "core_hours": 4.466767745638333} {"step": 8650, "l2_params": 244.97302869915916, "train/loss": 4.641776204109192, "l2_grads": 1.5234375, "lr": 0.0008649, "uptime": 16251.242448175999, "examples_seen": 8857600.0, "progress": 0.07681855723204532, "epoch": 6.91369665312953, "img/sec/core": 554.1295882599964, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 4.4924336233022215, "core_hours": 4.4924336233022215} {"step": 8700, "l2_params": 245.4726462731833, "train/loss": 4.6044957637786865, "l2_grads": 1.3671875, "lr": 0.0008699000000000001, "uptime": 16343.570847611998, "examples_seen": 8908800.0, "progress": 0.07726259513512074, "epoch": 6.953660217598486, "img/sec/core": 554.5422677395296, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 4.518080400923333, "core_hours": 4.518080400923333} {"step": 8750, "l2_params": 246.02381694839906, "train/loss": 4.755034804344177, "l2_grads": 1.421875, "lr": 0.0008749000000000001, "uptime": 16435.976794195, "examples_seen": 8960000.0, "progress": 0.07770663303819614, "epoch": 6.993623782067443, "img/sec/core": 554.0768954085636, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 4.543748719418612, "core_hours": 4.543748719418612} {"step": 8800, "l2_params": 246.5821619120941, "train/loss": 5.165970802307129, "l2_grads": 1.28125, "lr": 0.0008799000000000001, "uptime": 16528.267483912, "examples_seen": 9011200.0, "progress": 0.07815067094127155, "epoch": 7.0335873465364, "img/sec/core": 554.7688521669932, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 4.5693850221177765, "core_hours": 4.5693850221177765} {"step": 8850, "l2_params": 247.10660417747843, "train/loss": 4.4800578355789185, "l2_grads": 1.546875, "lr": 0.0008849, "uptime": 16620.600862843, "examples_seen": 9062400.0, "progress": 0.07859470884434695, "epoch": 7.0735509110053565, "img/sec/core": 554.5123615400491, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 4.595033182931943, "core_hours": 4.595033182931943} {"step": 8900, "l2_params": 247.61378874954895, "train/loss": 5.226345658302307, "l2_grads": 1.6171875, "lr": 0.0008899, "uptime": 16712.978410097, "examples_seen": 9113600.0, "progress": 0.07903874674742235, "epoch": 7.113514475474314, "img/sec/core": 554.2472334670366, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 4.620693612724721, "core_hours": 4.620693612724721} {"step": 8950, "l2_params": 248.09601530959742, "train/loss": 4.6051799058914185, "l2_grads": 1.4375, "lr": 0.0008949, "uptime": 16805.424737006, "examples_seen": 9164800.0, "progress": 0.07948278465049777, "epoch": 7.153478039943271, "img/sec/core": 553.8348759967324, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 4.646373147977221, "core_hours": 4.646373147977221} {"step": 9000, "l2_params": 248.64138990016198, "train/loss": 5.737058401107788, "l2_grads": 1.0859375, "lr": 0.0008999, "uptime": 16897.815688013, "examples_seen": 9216000.0, "progress": 0.07992682255357317, "epoch": 7.193441604412227, "img/sec/core": 554.1668252350865, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 4.672037301034722, "core_hours": 4.672037301034722} {"step": 9050, "l2_params": 249.12115202983443, "train/loss": 4.580302596092224, "l2_grads": 1.3359375, "lr": 0.0009049, "uptime": 16990.4711599, "examples_seen": 9267200.0, "progress": 0.08037086045664858, "epoch": 7.233405168881184, "img/sec/core": 552.5847417024919, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 4.697774932114443, "core_hours": 4.697774932114443} {"step": 9100, "l2_params": 249.63636786756328, "train/loss": 4.504965901374817, "l2_grads": 1.4296875, "lr": 0.0009099, "uptime": 17082.90682756, "examples_seen": 9318400.0, "progress": 0.08081489835972398, "epoch": 7.273368733350141, "img/sec/core": 553.8987416451142, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 4.723451506464444, "core_hours": 4.723451506464444} {"step": 9150, "l2_params": 250.27071231640224, "train/loss": 4.760912179946899, "l2_grads": 1.3828125, "lr": 0.0009149000000000001, "uptime": 17175.348333977, "examples_seen": 9369600.0, "progress": 0.0812589362627994, "epoch": 7.313332297819097, "img/sec/core": 553.8637564930998, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 4.749129702691389, "core_hours": 4.749129702691389} {"step": 9200, "l2_params": 250.83943298966796, "train/loss": 4.585180878639221, "l2_grads": 1.4140625, "lr": 0.0009199000000000001, "uptime": 17267.725464117, "examples_seen": 9420800.0, "progress": 0.0817029741658748, "epoch": 7.353295862288054, "img/sec/core": 554.2497360808289, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 4.774790016619166, "core_hours": 4.774790016619166} {"step": 9250, "l2_params": 251.3830017606973, "train/loss": 4.846356272697449, "l2_grads": 1.3046875, "lr": 0.0009249000000000001, "uptime": 17360.149649465, "examples_seen": 9472000.0, "progress": 0.08214701206895021, "epoch": 7.3932594267570115, "img/sec/core": 553.9675552153411, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 4.800463401438054, "core_hours": 4.800463401438054} {"step": 9300, "l2_params": 251.9054659381794, "train/loss": 4.493746519088745, "l2_grads": 1.5390625, "lr": 0.0009299, "uptime": 17452.520519575, "examples_seen": 9523200.0, "progress": 0.08259104997202561, "epoch": 7.433222991225969, "img/sec/core": 554.2872979222582, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 4.8261219764686105, "core_hours": 4.8261219764686105} {"step": 9350, "l2_params": 252.4507208448376, "train/loss": 4.766923189163208, "l2_grads": 1.421875, "lr": 0.0009349, "uptime": 17544.894573463, "examples_seen": 9574400.0, "progress": 0.08303508787510101, "epoch": 7.473186555694925, "img/sec/core": 554.2681937730853, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 4.851781435881944, "core_hours": 4.851781435881944} {"step": 9400, "l2_params": 253.05406702885404, "train/loss": 4.441660404205322, "l2_grads": 1.4296875, "lr": 0.0009399, "uptime": 17637.306847177, "examples_seen": 9625600.0, "progress": 0.08347912577817643, "epoch": 7.513150120163882, "img/sec/core": 554.0389597864007, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 4.87745151191361, "core_hours": 4.87745151191361} {"step": 9450, "l2_params": 253.56525900874487, "train/loss": 4.647918462753296, "l2_grads": 1.4375, "lr": 0.0009448999999999999, "uptime": 17729.732623281, "examples_seen": 9676800.0, "progress": 0.08392316368125183, "epoch": 7.553113684632839, "img/sec/core": 553.9580207840174, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 4.903125338609167, "core_hours": 4.903125338609167} {"step": 9500, "l2_params": 254.11488879832362, "train/loss": 4.435158848762512, "l2_grads": 1.4375, "lr": 0.0009498999999999999, "uptime": 17822.360053251, "examples_seen": 9728000.0, "progress": 0.08436720158432724, "epoch": 7.593077249101795, "img/sec/core": 552.7520305441233, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 4.928855180267499, "core_hours": 4.928855180267499} {"step": 9550, "l2_params": 254.61239594326264, "train/loss": 6.155918836593628, "l2_grads": 1.0, "lr": 0.0009549, "uptime": 17914.740375725, "examples_seen": 9779200.0, "progress": 0.08481123948740264, "epoch": 7.633040813570752, "img/sec/core": 554.2305831895072, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 4.954516380954721, "core_hours": 4.954516380954721} {"step": 9600, "l2_params": 255.23412821383846, "train/loss": 5.527473449707031, "l2_grads": 1.2109375, "lr": 0.0009599, "uptime": 18007.126016247, "examples_seen": 9830400.0, "progress": 0.08525527739047806, "epoch": 7.6730043780397095, "img/sec/core": 554.1986796942533, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 4.980179058877499, "core_hours": 4.980179058877499} {"step": 9650, "l2_params": 255.86978700188624, "train/loss": 4.438668847084045, "l2_grads": 1.3515625, "lr": 0.0009649, "uptime": 18099.540703268, "examples_seen": 9881600.0, "progress": 0.08569931529355346, "epoch": 7.712967942508666, "img/sec/core": 554.0244916737544, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 5.005849805272222, "core_hours": 5.005849805272222} {"step": 9700, "l2_params": 256.3832913624516, "train/loss": 4.600859999656677, "l2_grads": 1.515625, "lr": 0.0009699, "uptime": 18191.917110727998, "examples_seen": 9932800.0, "progress": 0.08614335319662886, "epoch": 7.752931506977623, "img/sec/core": 554.2540720927256, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 5.031509918455554, "core_hours": 5.031509918455554} {"step": 9750, "l2_params": 257.00081459242864, "train/loss": 5.376337885856628, "l2_grads": 1.234375, "lr": 0.0009749, "uptime": 18284.26197973, "examples_seen": 9984000.0, "progress": 0.08658739109970427, "epoch": 7.79289507144658, "img/sec/core": 554.4433659751076, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 5.057161270956111, "core_hours": 5.057161270956111} {"step": 9801, "l2_params": 257.5387983702953, "train/loss": 5.034173965454102, "l2_grads": 1.3984375, "lr": 0.0009799, "uptime": 18376.643639276, "examples_seen": 10035200.0, "progress": 0.08703142900277967, "epoch": 7.832858635915536, "img/sec/core": 554.2225616168447, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 5.082822843052222, "core_hours": 5.082822843052222} {"step": 9850, "l2_params": 258.15791018637583, "train/loss": 4.334225058555603, "l2_grads": 1.484375, "lr": 0.0009849, "uptime": 18469.07312969, "examples_seen": 10086400.0, "progress": 0.08747546690585509, "epoch": 7.872822200384493, "img/sec/core": 553.9357597956048, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 5.108497701500555, "core_hours": 5.108497701500555} {"step": 9900, "l2_params": 258.77532664018486, "train/loss": 6.163599729537964, "l2_grads": 1.109375, "lr": 0.0009899, "uptime": 18561.555780635, "examples_seen": 10137600.0, "progress": 0.08791950480893049, "epoch": 7.91278576485345, "img/sec/core": 553.6173485170667, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 5.134187326763055, "core_hours": 5.134187326763055} {"step": 9950, "l2_params": 259.24825922676774, "train/loss": 4.751848578453064, "l2_grads": 1.2578125, "lr": 0.0009949, "uptime": 18654.038211311, "examples_seen": 10188800.0, "progress": 0.0883635427120059, "epoch": 7.9527493293224065, "img/sec/core": 553.618667089032, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 5.159876890839722, "core_hours": 5.159876890839722} {"step": 10000, "l2_params": 259.858939536494, "train/loss": 6.220222234725952, "l2_grads": 1.15625, "lr": 0.0009999, "uptime": 18746.638982165, "examples_seen": 10240000.0, "progress": 0.0888075806150813, "epoch": 7.992712893791364, "img/sec/core": 552.9111639980188, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 5.185599327188055, "core_hours": 5.185599327188055, "val/acc@1": 0.28981983418367346, "val/loss": 3.461851012950041, "z/secs/eval/val": 31.52187673300068} {"step": 10050, "l2_params": 260.4412904504283, "train/loss": 4.458603501319885, "l2_grads": 1.4921875, "lr": 0.0009999994372549106, "uptime": 18870.600756177, "examples_seen": 10291200.0, "progress": 0.08925161851815672, "epoch": 8.03267645826032, "img/sec/core": 413.03055242694955, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 5.220033153302499, "core_hours": 5.220033153302499} {"step": 10100, "l2_params": 261.09137538193045, "train/loss": 4.5124815702438354, "l2_grads": 1.3828125, "lr": 0.000999997702848216, "uptime": 18963.071580021, "examples_seen": 10342400.0, "progress": 0.08969565642123212, "epoch": 8.072640022729278, "img/sec/core": 553.6881566706429, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 5.245719493259165, "core_hours": 5.245719493259165} {"step": 10150, "l2_params": 261.6404836331359, "train/loss": 5.405255913734436, "l2_grads": 1.09375, "lr": 0.0009999947965496018, "uptime": 19055.678627058, "examples_seen": 10393600.0, "progress": 0.09013969432430752, "epoch": 8.112603587198235, "img/sec/core": 552.8736919938922, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 5.2714436729916665, "core_hours": 5.2714436729916665} {"step": 10200, "l2_params": 262.234181817095, "train/loss": 4.280034065246582, "l2_grads": 1.375, "lr": 0.0009999907183658799, "uptime": 19148.358274231, "examples_seen": 10444800.0, "progress": 0.09058373222738293, "epoch": 8.15256715166719, "img/sec/core": 552.4406011648822, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 5.297188019428611, "core_hours": 5.297188019428611} {"step": 10250, "l2_params": 262.7659464750962, "train/loss": 4.938976764678955, "l2_grads": 1.203125, "lr": 0.0009999854683066078, "uptime": 19241.011639392, "examples_seen": 10496000.0, "progress": 0.09102777013045833, "epoch": 8.192530716136147, "img/sec/core": 552.5973062179819, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 5.3229250653066655, "core_hours": 5.3229250653066655} {"step": 10300, "l2_params": 263.38355393679194, "train/loss": 4.393300890922546, "l2_grads": 1.4609375, "lr": 0.0009999790463840923, "uptime": 19333.703801806, "examples_seen": 10547200.0, "progress": 0.09147180803353375, "epoch": 8.232494280605104, "img/sec/core": 552.3660109613121, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 5.348672888199444, "core_hours": 5.348672888199444} {"step": 10350, "l2_params": 263.92406689413053, "train/loss": 4.497364282608032, "l2_grads": 1.265625, "lr": 0.0009999714526133829, "uptime": 19426.521955448, "examples_seen": 10598400.0, "progress": 0.09191584593660915, "epoch": 8.272457845074062, "img/sec/core": 551.6162301340291, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 5.374455708655555, "core_hours": 5.374455708655555} {"step": 10400, "l2_params": 264.4899074309122, "train/loss": 4.401048541069031, "l2_grads": 1.6171875, "lr": 0.0009999626870122785, "uptime": 19519.465961279, "examples_seen": 10649600.0, "progress": 0.09235988383968456, "epoch": 8.312421409543019, "img/sec/core": 550.8693061185392, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 5.400273488053054, "core_hours": 5.400273488053054} {"step": 10450, "l2_params": 264.9525739733021, "train/loss": 4.422258138656616, "l2_grads": 1.3046875, "lr": 0.0009999527496013254, "uptime": 19612.356412728, "examples_seen": 10700800.0, "progress": 0.09280392174275996, "epoch": 8.352384974011976, "img/sec/core": 551.1869002823103, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 5.426076391233333, "core_hours": 5.426076391233333} {"step": 10500, "l2_params": 265.5463426737824, "train/loss": 4.234377443790436, "l2_grads": 1.40625, "lr": 0.0009999416404038136, "uptime": 19705.290008018, "examples_seen": 10752000.0, "progress": 0.09324795964583536, "epoch": 8.392348538480931, "img/sec/core": 550.9310152074711, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 5.451891278813888, "core_hours": 5.451891278813888} {"step": 10550, "l2_params": 266.0523657630674, "train/loss": 4.51037335395813, "l2_grads": 1.2109375, "lr": 0.0009999293594457805, "uptime": 19798.112667491, "examples_seen": 10803200.0, "progress": 0.09369199754891078, "epoch": 8.432312102949888, "img/sec/core": 551.589453380106, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 5.477675350889722, "core_hours": 5.477675350889722} {"step": 10600, "l2_params": 266.61389818073064, "train/loss": 4.1244789361953735, "l2_grads": 1.2734375, "lr": 0.0009999159067560098, "uptime": 19891.21349204, "examples_seen": 10854400.0, "progress": 0.09413603545198618, "epoch": 8.472275667418845, "img/sec/core": 549.9414236987155, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 5.50353669104222, "core_hours": 5.50353669104222} {"step": 10650, "l2_params": 266.9793528599461, "train/loss": 4.3804545402526855, "l2_grads": 1.34375, "lr": 0.0009999012823660334, "uptime": 19984.158262938, "examples_seen": 10905600.0, "progress": 0.09458007335506159, "epoch": 8.512239231887802, "img/sec/core": 550.8647716845512, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 5.529354682958332, "core_hours": 5.529354682958332} {"step": 10700, "l2_params": 267.5121821116283, "train/loss": 6.283819913864136, "l2_grads": 1.2265625, "lr": 0.0009998854863101274, "uptime": 20077.237966123, "examples_seen": 10956800.0, "progress": 0.09502411125813699, "epoch": 8.55220279635676, "img/sec/core": 550.0662147389629, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 5.555210156065277, "core_hours": 5.555210156065277} {"step": 10750, "l2_params": 268.0591155941633, "train/loss": 4.381614565849304, "l2_grads": 1.3203125, "lr": 0.0009998685186253136, "uptime": 20170.322938219, "examples_seen": 11008000.0, "progress": 0.0954681491612124, "epoch": 8.592166360825717, "img/sec/core": 550.0350792091003, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 5.581067092758611, "core_hours": 5.581067092758611} {"step": 10800, "l2_params": 268.5008869973419, "train/loss": 4.335466623306274, "l2_grads": 1.53125, "lr": 0.000999850379351362, "uptime": 20263.392729825, "examples_seen": 11059200.0, "progress": 0.09591218706428781, "epoch": 8.632129925294672, "img/sec/core": 550.1247946997695, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 5.606919812649165, "core_hours": 5.606919812649165} {"step": 10850, "l2_params": 269.0123955235381, "train/loss": 4.185073614120483, "l2_grads": 1.40625, "lr": 0.000999831068530787, "uptime": 20356.44201406, "examples_seen": 11110400.0, "progress": 0.09635622496736321, "epoch": 8.672093489763629, "img/sec/core": 550.2460381177189, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 5.632766836047778, "core_hours": 5.632766836047778} {"step": 10900, "l2_params": 269.61939138522195, "train/loss": 4.522606015205383, "l2_grads": 1.484375, "lr": 0.0009998105862088493, "uptime": 20449.523379252, "examples_seen": 11161600.0, "progress": 0.09680026287043862, "epoch": 8.712057054232586, "img/sec/core": 550.0563930749113, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 5.6586227708233325, "core_hours": 5.6586227708233325} {"step": 10950, "l2_params": 270.1065115614406, "train/loss": 5.650220990180969, "l2_grads": 1.140625, "lr": 0.0009997889324335543, "uptime": 20542.542969175, "examples_seen": 11212800.0, "progress": 0.09724430077351402, "epoch": 8.752020618701543, "img/sec/core": 550.4216911984169, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 5.684461545801943, "core_hours": 5.684461545801943} {"step": 11001, "l2_params": 270.6334939306467, "train/loss": 6.12806510925293, "l2_grads": 0.9921875, "lr": 0.0009997661072556545, "uptime": 20635.590012831, "examples_seen": 11264000.0, "progress": 0.09768833867658944, "epoch": 8.7919841831705, "img/sec/core": 550.2592880789393, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 5.710307946817498, "core_hours": 5.710307946817498} {"step": 11050, "l2_params": 271.0930070234775, "train/loss": 5.317749857902527, "l2_grads": 1.1328125, "lr": 0.000999742110728648, "uptime": 20728.820207411, "examples_seen": 11315200.0, "progress": 0.09813237657966484, "epoch": 8.831947747639457, "img/sec/core": 549.1783024872295, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 5.736205223089722, "core_hours": 5.736205223089722} {"step": 11100, "l2_params": 271.47079057740035, "train/loss": 6.116182088851929, "l2_grads": 0.9765625, "lr": 0.0009997169429087768, "uptime": 20821.922187096, "examples_seen": 11366400.0, "progress": 0.09857641448274025, "epoch": 8.871911312108413, "img/sec/core": 549.9346004588798, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 5.762066884113333, "core_hours": 5.762066884113333} {"step": 11150, "l2_params": 271.99153886986426, "train/loss": 4.1429537534713745, "l2_grads": 1.4765625, "lr": 0.0009996906038550288, "uptime": 20915.004467313, "examples_seen": 11417600.0, "progress": 0.09902045238581565, "epoch": 8.91187487657737, "img/sec/core": 550.0509858658238, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 5.787923073062499, "core_hours": 5.787923073062499} {"step": 11200, "l2_params": 272.50742759730997, "train/loss": 6.099519371986389, "l2_grads": 1.0546875, "lr": 0.0009996630936291385, "uptime": 21008.061879177, "examples_seen": 11468800.0, "progress": 0.09946449028889107, "epoch": 8.951838441046327, "img/sec/core": 550.1979796604173, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 5.813772354135833, "core_hours": 5.813772354135833} {"step": 11250, "l2_params": 272.9894275225004, "train/loss": 5.730342507362366, "l2_grads": 1.109375, "lr": 0.0009996344122955843, "uptime": 21101.110577557, "examples_seen": 11520000.0, "progress": 0.09990852819196647, "epoch": 8.991802005515284, "img/sec/core": 550.2495025873991, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 5.839619214796944, "core_hours": 5.839619214796944} {"step": 11300, "l2_params": 273.43771696419964, "train/loss": 5.577448725700378, "l2_grads": 1.0234375, "lr": 0.0009996045599215883, "uptime": 21194.263855544, "examples_seen": 11571200.0, "progress": 0.10035256609504187, "epoch": 9.031765569984241, "img/sec/core": 549.6317586069865, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 5.865495125348888, "core_hours": 5.865495125348888} {"step": 11350, "l2_params": 273.8958301640425, "train/loss": 4.461811780929565, "l2_grads": 1.265625, "lr": 0.0009995735365771188, "uptime": 21287.435182382, "examples_seen": 11622400.0, "progress": 0.10079660399811728, "epoch": 9.071729134453198, "img/sec/core": 549.5252857032148, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 5.891376049470555, "core_hours": 5.891376049470555} {"step": 11400, "l2_params": 274.36093180049795, "train/loss": 4.231853127479553, "l2_grads": 1.53125, "lr": 0.0009995413423348884, "uptime": 21380.568023771, "examples_seen": 11673600.0, "progress": 0.10124064190119268, "epoch": 9.111692698922155, "img/sec/core": 549.7523670103228, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 5.917246283189722, "core_hours": 5.917246283189722} {"step": 11450, "l2_params": 274.84333605710725, "train/loss": 4.087203919887543, "l2_grads": 1.28125, "lr": 0.0009995079772703531, "uptime": 21473.713353384, "examples_seen": 11724800.0, "progress": 0.1016846798042681, "epoch": 9.15165626339111, "img/sec/core": 549.6786603550224, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 5.943119985859998, "core_hours": 5.943119985859998} {"step": 11500, "l2_params": 275.29197302165613, "train/loss": 4.154758930206299, "l2_grads": 1.359375, "lr": 0.000999473441461715, "uptime": 21566.873658941, "examples_seen": 11776000.0, "progress": 0.1021287177073435, "epoch": 9.191619827860068, "img/sec/core": 549.5902970034019, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 5.9689978485147215, "core_hours": 5.9689978485147215} {"step": 11550, "l2_params": 275.73263647309915, "train/loss": 4.108599662780762, "l2_grads": 1.453125, "lr": 0.0009994377349899174, "uptime": 21660.048370693, "examples_seen": 11827200.0, "progress": 0.10257275561041891, "epoch": 9.231583392329025, "img/sec/core": 549.505322176664, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 5.994879712890277, "core_hours": 5.994879712890277} {"step": 11600, "l2_params": 276.16552724317347, "train/loss": 4.114003419876099, "l2_grads": 1.59375, "lr": 0.0009994008579386508, "uptime": 21753.14052043, "examples_seen": 11878400.0, "progress": 0.10301679351349431, "epoch": 9.271546956797982, "img/sec/core": 549.992670108576, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 6.020738643372777, "core_hours": 6.020738643372777} {"step": 11650, "l2_params": 276.65877120307204, "train/loss": 5.355946063995361, "l2_grads": 1.140625, "lr": 0.000999362810394347, "uptime": 21846.253861731, "examples_seen": 11929600.0, "progress": 0.10346083141656971, "epoch": 9.31151052126694, "img/sec/core": 549.8674978754146, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 6.046603460400832, "core_hours": 6.046603460400832} {"step": 11700, "l2_params": 277.07212402921823, "train/loss": 4.0554699301719666, "l2_grads": 1.6015625, "lr": 0.0009993235924461805, "uptime": 21939.723744195, "examples_seen": 11980800.0, "progress": 0.10390486931964513, "epoch": 9.351474085735896, "img/sec/core": 547.7700265614407, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 6.072567316640832, "core_hours": 6.072567316640832} {"step": 11750, "l2_params": 277.51312961619493, "train/loss": 4.148345053195953, "l2_grads": 1.3984375, "lr": 0.0009992832041860712, "uptime": 22032.85635787, "examples_seen": 12032000.0, "progress": 0.10434890722272053, "epoch": 9.391437650204852, "img/sec/core": 549.7537111829403, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 6.098437487106111, "core_hours": 6.098437487106111} {"step": 11800, "l2_params": 277.9181472700753, "train/loss": 4.0646162033081055, "l2_grads": 1.4140625, "lr": 0.0009992416457086796, "uptime": 22126.010221925, "examples_seen": 12083200.0, "progress": 0.10479294512579594, "epoch": 9.431401214673809, "img/sec/core": 549.628300655044, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 6.124313560454722, "core_hours": 6.124313560454722} {"step": 11850, "l2_params": 278.30389260774814, "train/loss": 4.567654728889465, "l2_grads": 1.234375, "lr": 0.000999198917111411, "uptime": 22219.181401215, "examples_seen": 12134400.0, "progress": 0.10523698302887134, "epoch": 9.471364779142766, "img/sec/core": 549.5261559439764, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 6.1501944435908324, "core_hours": 6.1501944435908324} {"step": 11900, "l2_params": 278.75046682275934, "train/loss": 5.757549405097961, "l2_grads": 1.0625, "lr": 0.0009991550184944118, "uptime": 22312.282536264, "examples_seen": 12185600.0, "progress": 0.10568102093194676, "epoch": 9.511328343611723, "img/sec/core": 549.9395895984786, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 6.176055869993332, "core_hours": 6.176055869993332} {"step": 11950, "l2_params": 279.14619405653735, "train/loss": 4.186077356338501, "l2_grads": 1.3125, "lr": 0.0009991099499605718, "uptime": 22405.430070079, "examples_seen": 12236800.0, "progress": 0.10612505883502216, "epoch": 9.55129190808068, "img/sec/core": 549.6656530025526, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 6.201930184941944, "core_hours": 6.201930184941944} {"step": 12000, "l2_params": 279.5701106651849, "train/loss": 5.941460371017456, "l2_grads": 0.98046875, "lr": 0.0009990637116155227, "uptime": 22498.564881113, "examples_seen": 12288000.0, "progress": 0.10656909673809756, "epoch": 9.591255472549637, "img/sec/core": 549.740740670087, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 6.227800965784722, "core_hours": 6.227800965784722} {"step": 12050, "l2_params": 279.9609522158849, "train/loss": 4.081629157066345, "l2_grads": 1.3046875, "lr": 0.000999016303567638, "uptime": 22591.946018648, "examples_seen": 12339200.0, "progress": 0.10701313464117297, "epoch": 9.631219037018592, "img/sec/core": 548.2906007737486, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 6.253740170655555, "core_hours": 6.253740170655555} {"step": 12100, "l2_params": 280.4301488060351, "train/loss": 6.0744253396987915, "l2_grads": 0.87890625, "lr": 0.0009989677259280318, "uptime": 22685.09386201, "examples_seen": 12390400.0, "progress": 0.10745717254424837, "epoch": 9.67118260148755, "img/sec/core": 549.6638263649535, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 6.279614571589444, "core_hours": 6.279614571589444} {"step": 12150, "l2_params": 280.85204397594964, "train/loss": 3.97029310464859, "l2_grads": 1.4140625, "lr": 0.0009989179788105597, "uptime": 22778.214294196, "examples_seen": 12441600.0, "progress": 0.10790121044732379, "epoch": 9.711146165956507, "img/sec/core": 549.8256268584662, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 6.305481358307777, "core_hours": 6.305481358307777} {"step": 12200, "l2_params": 281.24784547785873, "train/loss": 4.047131717205048, "l2_grads": 1.4296875, "lr": 0.0009988670623318197, "uptime": 22871.385650031, "examples_seen": 12492800.0, "progress": 0.10834524835039919, "epoch": 9.751109730425464, "img/sec/core": 549.5251146787273, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 6.331362290484166, "core_hours": 6.331362290484166} {"step": 12250, "l2_params": 281.62976270662074, "train/loss": 4.097707152366638, "l2_grads": 1.28125, "lr": 0.0009988149766111487, "uptime": 22964.582737847, "examples_seen": 12544000.0, "progress": 0.1087892862534746, "epoch": 9.79107329489442, "img/sec/core": 549.373389231702, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 6.3572503704330545, "core_hours": 6.3572503704330545} {"step": 12300, "l2_params": 282.0174191553267, "train/loss": 6.070562481880188, "l2_grads": 1.203125, "lr": 0.0009987617217706254, "uptime": 23057.950239779, "examples_seen": 12595200.0, "progress": 0.10923332415655, "epoch": 9.831036859363378, "img/sec/core": 548.370674383998, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 6.383185787636388, "core_hours": 6.383185787636388} {"step": 12350, "l2_params": 282.4192647700954, "train/loss": 6.102233409881592, "l2_grads": 1.0078125, "lr": 0.0009987072979350687, "uptime": 23151.392122652, "examples_seen": 12646400.0, "progress": 0.10967736205962542, "epoch": 9.871000423832333, "img/sec/core": 547.9341642717851, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 6.409141866212222, "core_hours": 6.409141866212222} {"step": 12400, "l2_params": 282.80630172765774, "train/loss": 4.12807959318161, "l2_grads": 1.46875, "lr": 0.0009986517052320355, "uptime": 23244.568288257, "examples_seen": 12697600.0, "progress": 0.11012139996270082, "epoch": 9.91096398830129, "img/sec/core": 549.4967480959783, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 6.4350241344358325, "core_hours": 6.4350241344358325} {"step": 12450, "l2_params": 283.1537642328259, "train/loss": 3.990184187889099, "l2_grads": 1.3671875, "lr": 0.0009985949437918255, "uptime": 23337.74188594, "examples_seen": 12748800.0, "progress": 0.11056543786577622, "epoch": 9.950927552770247, "img/sec/core": 549.511892566347, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 6.460905689347777, "core_hours": 6.460905689347777} {"step": 12500, "l2_params": 283.51115877234446, "train/loss": 3.9562981128692627, "l2_grads": 1.2734375, "lr": 0.0009985370137474742, "uptime": 23430.908542017, "examples_seen": 12800000.0, "progress": 0.11100947576885163, "epoch": 9.990891117239205, "img/sec/core": 549.5528352727713, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 6.486785316035833, "core_hours": 6.486785316035833, "val/acc@1": 0.3560068558673469, "val/loss": 3.0686384433386276, "z/secs/eval/val": 31.74769531399943} {"step": 12550, "l2_params": 283.93906318356846, "train/loss": 3.8697966933250427, "l2_grads": 1.3203125, "lr": 0.0009984779152347589, "uptime": 23555.419134452, "examples_seen": 12851200.0, "progress": 0.11145351367192703, "epoch": 10.030854681708162, "img/sec/core": 411.2099942559426, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 6.521371591712222, "core_hours": 6.521371591712222} {"step": 12601, "l2_params": 284.3591230114549, "train/loss": 3.9100040793418884, "l2_grads": 1.4296875, "lr": 0.0009984176483921936, "uptime": 23648.479607467998, "examples_seen": 12902400.0, "progress": 0.11189755157500245, "epoch": 10.070818246177119, "img/sec/core": 550.1798813251086, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 6.5472217231055545, "core_hours": 6.5472217231055545} {"step": 12650, "l2_params": 284.7365164306512, "train/loss": 4.046851277351379, "l2_grads": 1.3984375, "lr": 0.0009983562133610326, "uptime": 23741.598492294, "examples_seen": 12953600.0, "progress": 0.11234158947807785, "epoch": 10.110781810646076, "img/sec/core": 549.8347633315177, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 6.573088080001666, "core_hours": 6.573088080001666} {"step": 12700, "l2_params": 285.08170686637146, "train/loss": 3.882240056991577, "l2_grads": 1.375, "lr": 0.0009982936102852647, "uptime": 23834.751786479, "examples_seen": 13004800.0, "progress": 0.11278562738115326, "epoch": 10.150745375115031, "img/sec/core": 549.6316630340427, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 6.5989639950530545, "core_hours": 6.5989639950530545} {"step": 12750, "l2_params": 285.3847757236601, "train/loss": 3.9380346536636353, "l2_grads": 1.46875, "lr": 0.0009982298393116204, "uptime": 23927.887672774, "examples_seen": 13056000.0, "progress": 0.11322966528422866, "epoch": 10.190708939583988, "img/sec/core": 549.7343938707826, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 6.624835074579443, "core_hours": 6.624835074579443} {"step": 12800, "l2_params": 285.85534168034627, "train/loss": 4.226554751396179, "l2_grads": 1.390625, "lr": 0.0009981649005895668, "uptime": 24021.337593148, "examples_seen": 13107200.0, "progress": 0.11367370318730406, "epoch": 10.230672504052945, "img/sec/core": 547.8870371969223, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 6.650793385794444, "core_hours": 6.650793385794444} {"step": 12850, "l2_params": 286.1605909084312, "train/loss": 4.22257936000824, "l2_grads": 1.4296875, "lr": 0.000998098794271305, "uptime": 24114.539509991, "examples_seen": 13158400.0, "progress": 0.11411774109037948, "epoch": 10.270636068521902, "img/sec/core": 549.3449248071615, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 6.676682807139722, "core_hours": 6.676682807139722} {"step": 12900, "l2_params": 286.54264857630704, "train/loss": 3.8997915983200073, "l2_grads": 1.421875, "lr": 0.000998031520511775, "uptime": 24207.752174424, "examples_seen": 13209600.0, "progress": 0.11456177899345488, "epoch": 10.31059963299086, "img/sec/core": 549.2815843366521, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 6.702575213926666, "core_hours": 6.702575213926666} {"step": 12950, "l2_params": 286.9236861260434, "train/loss": 4.665942072868347, "l2_grads": 1.21875, "lr": 0.0009979630794686534, "uptime": 24300.951885107, "examples_seen": 13260800.0, "progress": 0.11500581689653029, "epoch": 10.350563197459817, "img/sec/core": 549.3579285256287, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 6.728464022449722, "core_hours": 6.728464022449722} {"step": 13000, "l2_params": 287.22798612883287, "train/loss": 5.189697265625, "l2_grads": 1.140625, "lr": 0.0009978934713023501, "uptime": 24394.214725482, "examples_seen": 13312000.0, "progress": 0.11544985479960569, "epoch": 10.390526761928772, "img/sec/core": 548.9860676999433, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 6.754370366998333, "core_hours": 6.754370366998333} {"step": 13050, "l2_params": 287.5596685703356, "train/loss": 4.730173349380493, "l2_grads": 1.1640625, "lr": 0.0009978226961760148, "uptime": 24487.686385249, "examples_seen": 13363200.0, "progress": 0.1158938927026811, "epoch": 10.430490326397729, "img/sec/core": 547.7596110695937, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 6.78033471693361, "core_hours": 6.78033471693361} {"step": 13100, "l2_params": 287.94320542562076, "train/loss": 5.968930006027222, "l2_grads": 1.0078125, "lr": 0.0009977507542555282, "uptime": 24580.974044075, "examples_seen": 13414400.0, "progress": 0.1163379306057565, "epoch": 10.470453890866686, "img/sec/core": 548.8400142563108, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 6.806247955496388, "core_hours": 6.806247955496388} {"step": 13150, "l2_params": 288.2465976802133, "train/loss": 5.424035906791687, "l2_grads": 1.046875, "lr": 0.0009976776457095075, "uptime": 24674.203726503998, "examples_seen": 13465600.0, "progress": 0.11678196850883191, "epoch": 10.510417455335643, "img/sec/core": 549.1813193613798, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 6.832145089504443, "core_hours": 6.832145089504443} {"step": 13200, "l2_params": 288.52867346271887, "train/loss": 4.145103216171265, "l2_grads": 1.28125, "lr": 0.0009976033707093054, "uptime": 24767.470656581998, "examples_seen": 13516800.0, "progress": 0.11722600641190732, "epoch": 10.5503810198046, "img/sec/core": 548.961994966287, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 6.858052570081665, "core_hours": 6.858052570081665} {"step": 13250, "l2_params": 288.9038568045821, "train/loss": 4.259054183959961, "l2_grads": 1.3046875, "lr": 0.0009975279294290053, "uptime": 24860.672030435, "examples_seen": 13568000.0, "progress": 0.11767004431498272, "epoch": 10.590344584273558, "img/sec/core": 549.3481252835817, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 6.883941840596388, "core_hours": 6.883941840596388} {"step": 13300, "l2_params": 289.24756913412426, "train/loss": 3.8683144450187683, "l2_grads": 1.4140625, "lr": 0.0009974513220454282, "uptime": 24955.770002672, "examples_seen": 13619200.0, "progress": 0.11811408221805814, "epoch": 10.630308148742513, "img/sec/core": 538.3921317733196, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 6.910357943995555, "core_hours": 6.910357943995555} {"step": 13350, "l2_params": 289.663343450742, "train/loss": 3.8664812445640564, "l2_grads": 1.3828125, "lr": 0.0009973735487381237, "uptime": 25048.846709311998, "examples_seen": 13670400.0, "progress": 0.11855812012113354, "epoch": 10.67027171321147, "img/sec/core": 550.0839237687258, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 6.936212584728888, "core_hours": 6.936212584728888} {"step": 13400, "l2_params": 289.836864810405, "train/loss": 3.9336403012275696, "l2_grads": 1.3203125, "lr": 0.00099729460968938, "uptime": 25142.03014021, "examples_seen": 13721600.0, "progress": 0.11900215802420895, "epoch": 10.710235277680427, "img/sec/core": 549.4539051265723, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 6.962096871089444, "core_hours": 6.962096871089444} {"step": 13450, "l2_params": 290.28622055438666, "train/loss": 3.986761152744293, "l2_grads": 1.3984375, "lr": 0.0009972145050842099, "uptime": 25235.212487737, "examples_seen": 13772800.0, "progress": 0.11944619592728435, "epoch": 10.750198842149384, "img/sec/core": 549.4602932724454, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 6.987980856513611, "core_hours": 6.987980856513611} {"step": 13500, "l2_params": 290.56653729852695, "train/loss": 3.7751710414886475, "l2_grads": 1.3515625, "lr": 0.0009971332351103644, "uptime": 25328.424547492, "examples_seen": 13824000.0, "progress": 0.11989023383035977, "epoch": 10.790162406618341, "img/sec/core": 549.2851475933026, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 7.013873095334444, "core_hours": 7.013873095334444} {"step": 13550, "l2_params": 290.9421950144801, "train/loss": 5.962488174438477, "l2_grads": 1.0625, "lr": 0.0009970507999583227, "uptime": 25423.677935273, "examples_seen": 13875200.0, "progress": 0.12033427173343517, "epoch": 10.830125971087298, "img/sec/core": 537.5136905126614, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 7.0403323697180555, "core_hours": 7.0403323697180555} {"step": 13600, "l2_params": 291.2835364946198, "train/loss": 3.8867709636688232, "l2_grads": 1.3671875, "lr": 0.0009969671998212965, "uptime": 25516.87148156, "examples_seen": 13926400.0, "progress": 0.12077830963651057, "epoch": 10.870089535556255, "img/sec/core": 549.3942664476415, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 7.066219465908888, "core_hours": 7.066219465908888} {"step": 13650, "l2_params": 291.59004927455516, "train/loss": 3.7679266929626465, "l2_grads": 1.4375, "lr": 0.0009968824348952274, "uptime": 25610.122169427, "examples_seen": 13977600.0, "progress": 0.12122234753958598, "epoch": 10.91005310002521, "img/sec/core": 549.0576120256088, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 7.0921224347608325, "core_hours": 7.0921224347608325} {"step": 13700, "l2_params": 291.9410156874587, "train/loss": 4.01311856508255, "l2_grads": 1.2890625, "lr": 0.0009967965053787867, "uptime": 25703.384506078, "examples_seen": 14028800.0, "progress": 0.12166638544266138, "epoch": 10.950016664494168, "img/sec/core": 548.9890328568148, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 7.118028639386111, "core_hours": 7.118028639386111} {"step": 13750, "l2_params": 292.21597956124424, "train/loss": 3.785797417163849, "l2_grads": 1.4765625, "lr": 0.000996709411473376, "uptime": 25796.554541283, "examples_seen": 14080000.0, "progress": 0.1221104233457368, "epoch": 10.989980228963125, "img/sec/core": 549.5329038713588, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 7.143909204720832, "core_hours": 7.143909204720832} {"step": 13800, "l2_params": 292.5488607694448, "train/loss": 4.735183119773865, "l2_grads": 1.328125, "lr": 0.0009966211533831257, "uptime": 25890.568707595, "examples_seen": 14131200.0, "progress": 0.1225544612488122, "epoch": 11.029943793432082, "img/sec/core": 544.5987770617945, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 7.170024250918611, "core_hours": 7.170024250918611} {"step": 13850, "l2_params": 292.8267539220076, "train/loss": 4.177849888801575, "l2_grads": 1.390625, "lr": 0.0009965317313148938, "uptime": 25983.971651634998, "examples_seen": 14182400.0, "progress": 0.12299849915188761, "epoch": 11.06990735790104, "img/sec/core": 548.1625930128606, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 7.195969513151943, "core_hours": 7.195969513151943} {"step": 13900, "l2_params": 293.1896425590547, "train/loss": 5.332221746444702, "l2_grads": 1.03125, "lr": 0.000996441145478268, "uptime": 26077.426501923, "examples_seen": 14233600.0, "progress": 0.12344253705496301, "epoch": 11.109870922369996, "img/sec/core": 547.8581351552701, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 7.2219291937875, "core_hours": 7.2219291937875} {"step": 13950, "l2_params": 293.46343984786887, "train/loss": 5.930721879005432, "l2_grads": 1.0546875, "lr": 0.000996349396085562, "uptime": 26170.871734654, "examples_seen": 14284800.0, "progress": 0.12388657495803841, "epoch": 11.149834486838952, "img/sec/core": 547.9145217326334, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 7.247886202879443, "core_hours": 7.247886202879443} {"step": 14000, "l2_params": 293.8154356971503, "train/loss": 3.8002726435661316, "l2_grads": 1.4453125, "lr": 0.0009962564833518185, "uptime": 26264.35732109, "examples_seen": 14336000.0, "progress": 0.12433061286111383, "epoch": 11.189798051307909, "img/sec/core": 547.6780106102403, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 7.273854421333889, "core_hours": 7.273854421333889} {"step": 14050, "l2_params": 294.0103417478499, "train/loss": 3.6948934197425842, "l2_grads": 1.4140625, "lr": 0.0009961624074948058, "uptime": 26359.17068676, "examples_seen": 14387200.0, "progress": 0.12477465076418923, "epoch": 11.229761615776866, "img/sec/core": 540.0082534587175, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 7.300191467353333, "core_hours": 7.300191467353333} {"step": 14100, "l2_params": 294.33759133991236, "train/loss": 5.3041932582855225, "l2_grads": 1.046875, "lr": 0.0009960671687350175, "uptime": 26454.179416657, "examples_seen": 14438400.0, "progress": 0.12521868866726463, "epoch": 11.269725180245823, "img/sec/core": 538.8978471294887, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 7.32658278121361, "core_hours": 7.32658278121361} {"step": 14150, "l2_params": 294.5762308159278, "train/loss": 5.75753390789032, "l2_grads": 1.140625, "lr": 0.0009959707672956735, "uptime": 26547.360451401, "examples_seen": 14489600.0, "progress": 0.12566272657034006, "epoch": 11.30968874471478, "img/sec/core": 549.4680343555268, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 7.352466401975833, "core_hours": 7.352466401975833} {"step": 14200, "l2_params": 294.92677686323685, "train/loss": 3.741651237010956, "l2_grads": 1.4453125, "lr": 0.0009958732034027198, "uptime": 26640.611492734, "examples_seen": 14540800.0, "progress": 0.12610676447341546, "epoch": 11.349652309183737, "img/sec/core": 549.0555308349367, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 7.378369469012777, "core_hours": 7.378369469012777} {"step": 14250, "l2_params": 295.20884010703975, "train/loss": 3.7325358390808105, "l2_grads": 1.375, "lr": 0.0009957744772848263, "uptime": 26735.248980049, "examples_seen": 14592000.0, "progress": 0.12655080237649086, "epoch": 11.389615873652692, "img/sec/core": 541.0118278983929, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 7.40465765993361, "core_hours": 7.40465765993361} {"step": 14300, "l2_params": 295.5213258022274, "train/loss": 5.9431471824646, "l2_grads": 0.96875, "lr": 0.0009956745891733876, "uptime": 26828.445243472, "examples_seen": 14643200.0, "progress": 0.12699484027956626, "epoch": 11.42957943812165, "img/sec/core": 549.378248864043, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 7.430545510884444, "core_hours": 7.430545510884444} {"step": 14350, "l2_params": 295.7522362618857, "train/loss": 4.224802851676941, "l2_grads": 1.265625, "lr": 0.0009955735393025191, "uptime": 26922.622660145, "examples_seen": 14694400.0, "progress": 0.12743887818264166, "epoch": 11.469543002590607, "img/sec/core": 543.6547508812597, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 7.456705904404722, "core_hours": 7.456705904404722} {"step": 14400, "l2_params": 296.0442042980026, "train/loss": 4.7113566398620605, "l2_grads": 1.234375, "lr": 0.0009954713279090599, "uptime": 27016.030778042, "examples_seen": 14745600.0, "progress": 0.12788291608571709, "epoch": 11.509506567059564, "img/sec/core": 548.1322303962608, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 7.482652603820555, "core_hours": 7.482652603820555} {"step": 14450, "l2_params": 296.35912662442803, "train/loss": 3.8772757053375244, "l2_grads": 1.4453125, "lr": 0.000995367955232576, "uptime": 27110.416656424, "examples_seen": 14796800.0, "progress": 0.12832695398879249, "epoch": 11.54947013152852, "img/sec/core": 542.4540289044379, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 7.50887090337111, "core_hours": 7.50887090337111} {"step": 14500, "l2_params": 296.63307659279377, "train/loss": 4.679425477981567, "l2_grads": 1.1328125, "lr": 0.0009952634215153488, "uptime": 27203.950520242, "examples_seen": 14848000.0, "progress": 0.1287709918918679, "epoch": 11.589433695997478, "img/sec/core": 547.3953273183057, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 7.5348525322094435, "core_hours": 7.5348525322094435} {"step": 14550, "l2_params": 296.93058196792816, "train/loss": 3.77439546585083, "l2_grads": 1.3359375, "lr": 0.0009951577270023867, "uptime": 27297.529579512, "examples_seen": 14899200.0, "progress": 0.1292150297949433, "epoch": 11.629397260466433, "img/sec/core": 547.1309542904773, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 7.560846715339999, "core_hours": 7.560846715339999} {"step": 14600, "l2_params": 297.11997211906044, "train/loss": 4.266339063644409, "l2_grads": 1.2578125, "lr": 0.0009950508719414124, "uptime": 27391.130529846, "examples_seen": 14950400.0, "progress": 0.12965906769801872, "epoch": 11.66936082493539, "img/sec/core": 547.0029932100201, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 7.586846979321666, "core_hours": 7.586846979321666} {"step": 14650, "l2_params": 297.42708533983586, "train/loss": 3.676560342311859, "l2_grads": 1.46875, "lr": 0.0009949428565828745, "uptime": 27484.704469874, "examples_seen": 15001600.0, "progress": 0.13010310560109412, "epoch": 11.709324389404347, "img/sec/core": 547.1608867242262, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 7.612839740440554, "core_hours": 7.612839740440554} {"step": 14700, "l2_params": 297.67000378328976, "train/loss": 4.21223247051239, "l2_grads": 1.359375, "lr": 0.0009948336811799378, "uptime": 27578.234621598, "examples_seen": 15052800.0, "progress": 0.13054714350416952, "epoch": 11.749287953873305, "img/sec/core": 547.4170527498646, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 7.638820338141666, "core_hours": 7.638820338141666} {"step": 14750, "l2_params": 297.9666114894419, "train/loss": 4.019024431705475, "l2_grads": 1.2734375, "lr": 0.0009947233459884877, "uptime": 27671.72592534, "examples_seen": 15104000.0, "progress": 0.13099118140724492, "epoch": 11.789251518342262, "img/sec/core": 547.6445182676212, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 7.664790144736666, "core_hours": 7.664790144736666} {"step": 14800, "l2_params": 298.30634143417694, "train/loss": 4.257505655288696, "l2_grads": 1.3046875, "lr": 0.000994611851267128, "uptime": 27765.279536272, "examples_seen": 15155200.0, "progress": 0.13143521931032032, "epoch": 11.829215082811219, "img/sec/core": 547.2797841786778, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 7.690777258884443, "core_hours": 7.690777258884443} {"step": 14850, "l2_params": 298.5384580544021, "train/loss": 5.0943403244018555, "l2_grads": 1.03125, "lr": 0.000994499197277177, "uptime": 27859.468210174, "examples_seen": 15206400.0, "progress": 0.13187925721339575, "epoch": 11.869178647280176, "img/sec/core": 543.5897744273503, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 7.716940779412777, "core_hours": 7.716940779412777} {"step": 14900, "l2_params": 298.7603922421047, "train/loss": 5.853678464889526, "l2_grads": 0.9296875, "lr": 0.0009943853842826744, "uptime": 27952.596985377, "examples_seen": 15257600.0, "progress": 0.13232329511647115, "epoch": 11.909142211749131, "img/sec/core": 549.7763702829255, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 7.742809883635832, "core_hours": 7.742809883635832} {"step": 14950, "l2_params": 299.05542784872046, "train/loss": 4.240916609764099, "l2_grads": 1.265625, "lr": 0.0009942704125503736, "uptime": 28045.814358647, "examples_seen": 15308800.0, "progress": 0.13276733301954655, "epoch": 11.949105776218088, "img/sec/core": 549.2538376049474, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 7.768703598433055, "core_hours": 7.768703598433055} {"step": 15000, "l2_params": 299.3136753800789, "train/loss": 4.821743607521057, "l2_grads": 1.296875, "lr": 0.0009941542823497457, "uptime": 28139.525219989, "examples_seen": 15360000.0, "progress": 0.13321137092262195, "epoch": 11.989069340687045, "img/sec/core": 546.3614277660421, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 7.794734393250277, "core_hours": 7.794734393250277, "val/acc@1": 0.4082828443877551, "val/loss": 2.727038163919838, "z/secs/eval/val": 31.74548770600086} {"step": 15050, "l2_params": 299.53834270423545, "train/loss": 5.423335075378418, "l2_grads": 1.1015625, "lr": 0.000994036993952975, "uptime": 28264.520954161, "examples_seen": 15411200.0, "progress": 0.13365540882569737, "epoch": 12.029032905156003, "img/sec/core": 409.6139787422374, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 7.8294554305202775, "core_hours": 7.8294554305202775} {"step": 15100, "l2_params": 299.8295544451047, "train/loss": 3.764861226081848, "l2_grads": 1.4140625, "lr": 0.000993918547634963, "uptime": 28357.675573645, "examples_seen": 15462400.0, "progress": 0.13409944672877278, "epoch": 12.06899646962496, "img/sec/core": 549.6238434938092, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 7.855331713710276, "core_hours": 7.855331713710276} {"step": 15150, "l2_params": 300.0835454958231, "train/loss": 3.744062304496765, "l2_grads": 1.3671875, "lr": 0.0009937989436733232, "uptime": 28450.936020441, "examples_seen": 15513600.0, "progress": 0.13454348463184818, "epoch": 12.108960034093917, "img/sec/core": 549.0001577195478, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 7.881237393375832, "core_hours": 7.881237393375832} {"step": 15200, "l2_params": 300.35762050481173, "train/loss": 4.537579774856567, "l2_grads": 1.25, "lr": 0.0009936781823483803, "uptime": 28545.323360027, "examples_seen": 15564800.0, "progress": 0.13498752253492358, "epoch": 12.148923598562872, "img/sec/core": 542.4456312104246, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 7.907456098816388, "core_hours": 7.907456098816388} {"step": 15250, "l2_params": 300.61813840272305, "train/loss": 3.652727484703064, "l2_grads": 1.3671875, "lr": 0.0009935562639431773, "uptime": 28638.548007959, "examples_seen": 15616000.0, "progress": 0.13543156043799898, "epoch": 12.18888716303183, "img/sec/core": 549.2109773087614, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 7.933351834353056, "core_hours": 7.933351834353056} {"step": 15300, "l2_params": 300.83826326538195, "train/loss": 5.912967681884766, "l2_grads": 1.1875, "lr": 0.0009934331887434637, "uptime": 28732.801469823997, "examples_seen": 15667200.0, "progress": 0.1358755983410744, "epoch": 12.228850727500786, "img/sec/core": 543.2161215822161, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 7.959533351537776, "core_hours": 7.959533351537776} {"step": 15350, "l2_params": 301.0288526324138, "train/loss": 4.32976770401001, "l2_grads": 1.234375, "lr": 0.000993308957037704, "uptime": 28826.028928531003, "examples_seen": 15718400.0, "progress": 0.1363196362441498, "epoch": 12.268814291969743, "img/sec/core": 549.1944187914708, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 7.985429867845278, "core_hours": 7.985429867845278} {"step": 15400, "l2_params": 301.34834364693296, "train/loss": 5.723307847976685, "l2_grads": 0.98046875, "lr": 0.000993183569117071, "uptime": 28921.066862047, "examples_seen": 15769600.0, "progress": 0.1367636741472252, "epoch": 12.3087778564387, "img/sec/core": 538.7322525419016, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 8.011829293821943, "core_hours": 8.011829293821943} {"step": 15450, "l2_params": 301.54131645156644, "train/loss": 4.395015120506287, "l2_grads": 1.1640625, "lr": 0.0009930570252754476, "uptime": 29015.962792347997, "examples_seen": 15820800.0, "progress": 0.1372077120503006, "epoch": 12.348741420907658, "img/sec/core": 539.5384168488584, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 8.038189274461109, "core_hours": 8.038189274461109} {"step": 15500, "l2_params": 301.8273205747162, "train/loss": 3.620955228805542, "l2_grads": 1.3828125, "lr": 0.0009929293258094272, "uptime": 29109.114990318998, "examples_seen": 15872000.0, "progress": 0.137651749953376, "epoch": 12.388704985376613, "img/sec/core": 549.6381310931462, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 8.06406488500861, "core_hours": 8.06406488500861} {"step": 15550, "l2_params": 301.99717458451704, "train/loss": 3.735977292060852, "l2_grads": 1.390625, "lr": 0.0009928004710183112, "uptime": 29203.334886874003, "examples_seen": 15923200.0, "progress": 0.13809578785645144, "epoch": 12.42866854984557, "img/sec/core": 543.4096392804856, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 8.090237078496111, "core_hours": 8.090237078496111} {"step": 15600, "l2_params": 302.2564069575284, "train/loss": 3.8277024030685425, "l2_grads": 1.3515625, "lr": 0.000992670461204108, "uptime": 29296.467876197003, "examples_seen": 15974400.0, "progress": 0.13853982575952684, "epoch": 12.468632114314527, "img/sec/core": 549.7514937744621, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 8.116107353308056, "core_hours": 8.116107353308056} {"step": 15650, "l2_params": 302.5051184355192, "train/loss": 5.83082902431488, "l2_grads": 0.9609375, "lr": 0.000992539296671535, "uptime": 29390.811562660998, "examples_seen": 16025600.0, "progress": 0.13898386366260224, "epoch": 12.508595678783484, "img/sec/core": 542.6966225189817, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 8.142313932881388, "core_hours": 8.142313932881388} {"step": 15700, "l2_params": 302.7867644185116, "train/loss": 3.680633246898651, "l2_grads": 1.328125, "lr": 0.0009924069777280152, "uptime": 29485.232451469998, "examples_seen": 16076800.0, "progress": 0.13942790156567764, "epoch": 12.548559243252441, "img/sec/core": 542.25289176816, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 8.168541957550554, "core_hours": 8.168541957550554} {"step": 15750, "l2_params": 302.99203269228053, "train/loss": 3.661282002925873, "l2_grads": 1.375, "lr": 0.0009922735046836758, "uptime": 29578.456683129003, "examples_seen": 16128000.0, "progress": 0.13987193946875306, "epoch": 12.588522807721398, "img/sec/core": 549.2134296936744, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 8.194437577455833, "core_hours": 8.194437577455833} {"step": 15800, "l2_params": 303.23045201834526, "train/loss": 5.47863233089447, "l2_grads": 1.125, "lr": 0.0009921388778513503, "uptime": 29671.751007458002, "examples_seen": 16179200.0, "progress": 0.14031597737182847, "epoch": 12.628486372190354, "img/sec/core": 548.8008018520502, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 8.220352667547223, "core_hours": 8.220352667547223} {"step": 15850, "l2_params": 303.54123323436227, "train/loss": 3.5303937792778015, "l2_grads": 1.46875, "lr": 0.0009920030975465765, "uptime": 29765.826426139003, "examples_seen": 16230400.0, "progress": 0.14076001527490387, "epoch": 12.66844993665931, "img/sec/core": 544.2441895859472, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 8.246484728291945, "core_hours": 8.246484728291945} {"step": 15900, "l2_params": 303.73319221115963, "train/loss": 3.5949536561965942, "l2_grads": 1.4609375, "lr": 0.0009918661640875956, "uptime": 29860.07096023, "examples_seen": 16281600.0, "progress": 0.14120405317797927, "epoch": 12.708413501128268, "img/sec/core": 543.2675803836402, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 8.272663765539443, "core_hours": 8.272663765539443} {"step": 15950, "l2_params": 303.8329386189782, "train/loss": 3.502232789993286, "l2_grads": 1.328125, "lr": 0.0009917280777953523, "uptime": 29953.236356341997, "examples_seen": 16332800.0, "progress": 0.14164809108105467, "epoch": 12.748377065597225, "img/sec/core": 549.5602674028426, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 8.29854304223722, "core_hours": 8.29854304223722} {"step": 16000, "l2_params": 304.20215350209554, "train/loss": 3.7795355319976807, "l2_grads": 1.3671875, "lr": 0.0009915888389934913, "uptime": 30047.746209347, "examples_seen": 16384000.0, "progress": 0.1420921289841301, "epoch": 12.788340630066182, "img/sec/core": 541.742457236605, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 8.324795779183054, "core_hours": 8.324795779183054} {"step": 16050, "l2_params": 304.3835759828789, "train/loss": 3.526919662952423, "l2_grads": 1.3125, "lr": 0.000991448448008361, "uptime": 30141.092571855002, "examples_seen": 16435200.0, "progress": 0.1425361668872055, "epoch": 12.82830419453514, "img/sec/core": 548.4948596214434, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 8.350725324324166, "core_hours": 8.350725324324166} {"step": 16100, "l2_params": 304.50266188286434, "train/loss": 3.5338127613067627, "l2_grads": 1.4375, "lr": 0.0009913069051690076, "uptime": 30235.423479164, "examples_seen": 16486400.0, "progress": 0.1429802047902809, "epoch": 12.868267759004096, "img/sec/core": 542.7701424760477, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 8.376928354132222, "core_hours": 8.376928354132222} {"step": 16150, "l2_params": 304.8054266979695, "train/loss": 5.663618445396423, "l2_grads": 0.94921875, "lr": 0.0009911642108071806, "uptime": 30330.043541563, "examples_seen": 16537600.0, "progress": 0.1434242426933563, "epoch": 12.908231323473052, "img/sec/core": 541.1114588373038, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 8.403211704798611, "core_hours": 8.403211704798611} {"step": 16200, "l2_params": 304.97044074231604, "train/loss": 3.6595309376716614, "l2_grads": 1.484375, "lr": 0.000991020365257324, "uptime": 30423.928279411997, "examples_seen": 16588800.0, "progress": 0.14386828059643172, "epoch": 12.948194887942009, "img/sec/core": 545.3495549228702, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 8.429290798645555, "core_hours": 8.429290798645555} {"step": 16250, "l2_params": 305.2035917578215, "train/loss": 5.672407150268555, "l2_grads": 1.140625, "lr": 0.0009908753688565829, "uptime": 30517.821110606998, "examples_seen": 16640000.0, "progress": 0.14431231849950713, "epoch": 12.988158452410966, "img/sec/core": 545.302547046066, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 8.455372140644165, "core_hours": 8.455372140644165} {"step": 16300, "l2_params": 305.41416631892054, "train/loss": 3.638067662715912, "l2_grads": 1.359375, "lr": 0.0009907292219447994, "uptime": 30612.258513582998, "examples_seen": 16691200.0, "progress": 0.14475635640258253, "epoch": 13.028122016879923, "img/sec/core": 542.1580685886895, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 8.481604752581942, "core_hours": 8.481604752581942} {"step": 16350, "l2_params": 305.67675063521966, "train/loss": 3.650536298751831, "l2_grads": 1.4140625, "lr": 0.0009905819248645124, "uptime": 30705.986351903997, "examples_seen": 16742400.0, "progress": 0.14520039430565793, "epoch": 13.06808558134888, "img/sec/core": 546.2624649962584, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 8.507640263226666, "core_hours": 8.507640263226666} {"step": 16400, "l2_params": 305.7820076957909, "train/loss": 3.5292214155197144, "l2_grads": 1.5234375, "lr": 0.0009904334779609547, "uptime": 30800.187861598, "examples_seen": 16793600.0, "progress": 0.14564443220873333, "epoch": 13.108049145817837, "img/sec/core": 543.5157054946901, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 8.533807349252777, "core_hours": 8.533807349252777} {"step": 16450, "l2_params": 306.0902277745281, "train/loss": 3.609117329120636, "l2_grads": 1.375, "lr": 0.0009902838815820574, "uptime": 30894.773393052, "examples_seen": 16844800.0, "progress": 0.14608847011180875, "epoch": 13.148012710286793, "img/sec/core": 541.3090058588826, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 8.56008110799, "core_hours": 8.56008110799} {"step": 16500, "l2_params": 306.23479554093785, "train/loss": 3.521499514579773, "l2_grads": 1.4765625, "lr": 0.0009901331360784409, "uptime": 30989.027111768, "examples_seen": 16896000.0, "progress": 0.14653250801488416, "epoch": 13.18797627475575, "img/sec/core": 543.2146412628465, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 8.58626269652222, "core_hours": 8.58626269652222} {"step": 16550, "l2_params": 306.41190793475823, "train/loss": 4.443980574607849, "l2_grads": 1.1328125, "lr": 0.0009899812418034237, "uptime": 31082.192543581998, "examples_seen": 16947200.0, "progress": 0.14697654591795956, "epoch": 13.227939839224707, "img/sec/core": 549.5600568053901, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 8.612141983137223, "core_hours": 8.612141983137223} {"step": 16600, "l2_params": 306.68341779431114, "train/loss": 3.545600116252899, "l2_grads": 1.34375, "lr": 0.0009898281991130135, "uptime": 31176.349980780997, "examples_seen": 16998400.0, "progress": 0.14742058382103496, "epoch": 13.267903403693664, "img/sec/core": 543.7701101803592, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 8.638296826803609, "core_hours": 8.638296826803609} {"step": 16650, "l2_params": 306.8016269208004, "train/loss": 3.4987664818763733, "l2_grads": 1.4296875, "lr": 0.0009896740083659115, "uptime": 31269.803820003002, "examples_seen": 17049600.0, "progress": 0.14786462172411036, "epoch": 13.307866968162621, "img/sec/core": 547.8640623674229, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 8.664256226587499, "core_hours": 8.664256226587499} {"step": 16700, "l2_params": 307.1641967254647, "train/loss": 3.613077461719513, "l2_grads": 1.46875, "lr": 0.0009895186699235097, "uptime": 31363.098389841998, "examples_seen": 17100800.0, "progress": 0.14830865962718578, "epoch": 13.347830532631578, "img/sec/core": 548.7993576513509, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 8.69017138487611, "core_hours": 8.69017138487611} {"step": 16750, "l2_params": 307.29504729778836, "train/loss": 3.621029496192932, "l2_grads": 1.4296875, "lr": 0.0009893621841498893, "uptime": 31458.745218223998, "examples_seen": 17152000.0, "progress": 0.14875269753026119, "epoch": 13.387794097100533, "img/sec/core": 535.3026427129884, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 8.716739948315555, "core_hours": 8.716739948315555} {"step": 16800, "l2_params": 307.48111286000153, "train/loss": 5.81423544883728, "l2_grads": 0.98046875, "lr": 0.0009892045514118205, "uptime": 31552.719770343003, "examples_seen": 17203200.0, "progress": 0.14919673543333659, "epoch": 13.42775766156949, "img/sec/core": 544.8283481592184, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 8.742843990570833, "core_hours": 8.742843990570833} {"step": 16850, "l2_params": 307.69633594869146, "train/loss": 3.5542191863059998, "l2_grads": 1.5546875, "lr": 0.0009890457720787625, "uptime": 31646.060528240003, "examples_seen": 17254400.0, "progress": 0.149640773336412, "epoch": 13.467721226038448, "img/sec/core": 548.5277937907721, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 8.768771978875556, "core_hours": 8.768771978875556} {"step": 16900, "l2_params": 307.84641152031884, "train/loss": 3.7111748456954956, "l2_grads": 1.2890625, "lr": 0.0009888858465228604, "uptime": 31740.207052216003, "examples_seen": 17305600.0, "progress": 0.15008481123948741, "epoch": 13.507684790507405, "img/sec/core": 543.8331426134436, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 8.794923791091112, "core_hours": 8.794923791091112} {"step": 16950, "l2_params": 308.1067866701211, "train/loss": 3.3956627249717712, "l2_grads": 1.34375, "lr": 0.0009887247751189483, "uptime": 31833.779265636997, "examples_seen": 17356800.0, "progress": 0.15052884914256282, "epoch": 13.547648354976362, "img/sec/core": 547.1709830101431, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 8.820916072596942, "core_hours": 8.820916072596942} {"step": 17000, "l2_params": 308.23728937703174, "train/loss": 5.6222875118255615, "l2_grads": 1.0234375, "lr": 0.0009885625582445436, "uptime": 31927.715809594, "examples_seen": 17408000.0, "progress": 0.15097288704563822, "epoch": 13.587611919445319, "img/sec/core": 545.0487940394692, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 8.847009557029445, "core_hours": 8.847009557029445} {"step": 17050, "l2_params": 308.432891619575, "train/loss": 5.843581676483154, "l2_grads": 0.93359375, "lr": 0.0009883991962798494, "uptime": 32021.24506069, "examples_seen": 17459200.0, "progress": 0.15141692494871362, "epoch": 13.627575483914274, "img/sec/core": 547.4223240325965, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 8.87298990455611, "core_hours": 8.87298990455611} {"step": 17100, "l2_params": 308.6800796967023, "train/loss": 3.544370710849762, "l2_grads": 1.3203125, "lr": 0.0009882346896077532, "uptime": 32114.542320842, "examples_seen": 17510400.0, "progress": 0.15186096285178902, "epoch": 13.667539048383231, "img/sec/core": 548.7835325130035, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 8.898905810153888, "core_hours": 8.898905810153888} {"step": 17150, "l2_params": 308.76474534627494, "train/loss": 5.254567503929138, "l2_grads": 1.125, "lr": 0.0009880690386138236, "uptime": 32207.910937594, "examples_seen": 17561600.0, "progress": 0.15230500075486444, "epoch": 13.707502612852188, "img/sec/core": 548.3641268456918, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 8.924841537029444, "core_hours": 8.924841537029444} {"step": 17200, "l2_params": 309.0374247284825, "train/loss": 3.4370498657226562, "l2_grads": 1.390625, "lr": 0.0009879022436863124, "uptime": 32302.120252605997, "examples_seen": 17612800.0, "progress": 0.15274903865793985, "epoch": 13.747466177321146, "img/sec/core": 543.4706747785967, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 8.951010791199444, "core_hours": 8.951010791199444} {"step": 17250, "l2_params": 309.23218294470905, "train/loss": 5.770762205123901, "l2_grads": 1.0625, "lr": 0.0009877343052161537, "uptime": 32397.091521134, "examples_seen": 17664000.0, "progress": 0.15319307656101525, "epoch": 13.787429741790103, "img/sec/core": 539.1104151136338, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 8.977391699123888, "core_hours": 8.977391699123888} {"step": 17300, "l2_params": 309.3296557679202, "train/loss": 5.844489216804504, "l2_grads": 1.015625, "lr": 0.0009875652235969612, "uptime": 32491.001358995, "examples_seen": 17715200.0, "progress": 0.15363711446409065, "epoch": 13.82739330625906, "img/sec/core": 545.2037951101938, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 9.003477765196388, "core_hours": 9.003477765196388} {"step": 17350, "l2_params": 309.65357249826377, "train/loss": 3.525345742702484, "l2_grads": 1.3671875, "lr": 0.000987394999225027, "uptime": 32585.267044452998, "examples_seen": 17766400.0, "progress": 0.15408115236716607, "epoch": 13.867356870728017, "img/sec/core": 543.1456818166681, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 9.029662677823609, "core_hours": 9.029662677823609} {"step": 17400, "l2_params": 309.7765717643323, "train/loss": 5.342049479484558, "l2_grads": 1.046875, "lr": 0.0009872236324993213, "uptime": 32679.392434835998, "examples_seen": 17817600.0, "progress": 0.15452519027024147, "epoch": 13.907320435196972, "img/sec/core": 543.9552472681924, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 9.055808619596664, "core_hours": 9.055808619596664} {"step": 17450, "l2_params": 309.9582680453733, "train/loss": 5.845421075820923, "l2_grads": 1.0234375, "lr": 0.0009870511238214935, "uptime": 32772.709417139995, "examples_seen": 17868800.0, "progress": 0.15496922817331688, "epoch": 13.94728399966593, "img/sec/core": 548.6675494199403, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 9.081730003569998, "core_hours": 9.081730003569998} {"step": 17500, "l2_params": 310.16520138216265, "train/loss": 3.633378267288208, "l2_grads": 1.4140625, "lr": 0.0009868774735958675, "uptime": 32867.332168746, "examples_seen": 17920000.0, "progress": 0.15541326607639228, "epoch": 13.987247564134886, "img/sec/core": 541.096080287228, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 9.108014101238332, "core_hours": 9.108014101238332, "val/acc@1": 0.44455516581632654, "val/loss": 2.5455575399861043, "z/secs/eval/val": 31.779365460002737} {"step": 17550, "l2_params": 310.35930380920996, "train/loss": 3.558207631111145, "l2_grads": 1.421875, "lr": 0.000986702682229445, "uptime": 32992.029772989, "examples_seen": 17971200.0, "progress": 0.15585730397946768, "epoch": 14.027211128603843, "img/sec/core": 410.5932933581263, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 9.142652324639164, "core_hours": 9.142652324639164} {"step": 17600, "l2_params": 310.4633618052821, "train/loss": 5.834508180618286, "l2_grads": 1.015625, "lr": 0.0009865267501319, "uptime": 33085.186096018006, "examples_seen": 18022400.0, "progress": 0.1563013418825431, "epoch": 14.0671746930728, "img/sec/core": 549.6137925501689, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 9.168529081036109, "core_hours": 9.168529081036109} {"step": 17650, "l2_params": 310.69556071066177, "train/loss": 3.7201985716819763, "l2_grads": 1.34375, "lr": 0.0009863496777155823, "uptime": 33179.610510344006, "examples_seen": 18073600.0, "progress": 0.1567453797856185, "epoch": 14.107138257541758, "img/sec/core": 542.2326457141902, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 9.194758085015556, "core_hours": 9.194758085015556} {"step": 17700, "l2_params": 310.86980890066746, "train/loss": 4.637186527252197, "l2_grads": 1.234375, "lr": 0.0009861714653955128, "uptime": 33272.751041711, "examples_seen": 18124800.0, "progress": 0.1571894176886939, "epoch": 14.147101822010713, "img/sec/core": 549.706977709408, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 9.22063045483972, "core_hours": 9.22063045483972} {"step": 17751, "l2_params": 311.0507723954604, "train/loss": 3.4458706378936768, "l2_grads": 1.40625, "lr": 0.000985992113589384, "uptime": 33367.080269938, "examples_seen": 18176000.0, "progress": 0.1576334555917693, "epoch": 14.18706538647967, "img/sec/core": 542.7798039096668, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 9.246833018236108, "core_hours": 9.246833018236108} {"step": 17800, "l2_params": 311.24435549600736, "train/loss": 3.46581369638443, "l2_grads": 1.5078125, "lr": 0.0009858116227175599, "uptime": 33460.285829777, "examples_seen": 18227200.0, "progress": 0.1580774934948447, "epoch": 14.227028950948627, "img/sec/core": 549.323453326617, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 9.272723451524719, "core_hours": 9.272723451524719} {"step": 17850, "l2_params": 311.45031988715715, "train/loss": 5.450862646102905, "l2_grads": 1.0546875, "lr": 0.0009856299932030743, "uptime": 33554.710879897, "examples_seen": 18278400.0, "progress": 0.15852153139792013, "epoch": 14.266992515417584, "img/sec/core": 542.2289946887221, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 9.29895263211361, "core_hours": 9.29895263211361} {"step": 17900, "l2_params": 311.60495103225253, "train/loss": 5.080316662788391, "l2_grads": 1.09375, "lr": 0.0009854472254716294, "uptime": 33647.88329128199, "examples_seen": 18329600.0, "progress": 0.15896556930099554, "epoch": 14.306956079886541, "img/sec/core": 549.5188891101623, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 9.32483385749833, "core_hours": 9.32483385749833} {"step": 17950, "l2_params": 311.77222129104126, "train/loss": 3.919737935066223, "l2_grads": 1.3828125, "lr": 0.0009852633199515948, "uptime": 33742.174297139005, "examples_seen": 18380800.0, "progress": 0.15940960720407094, "epoch": 14.346919644355498, "img/sec/core": 542.999828399818, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 9.351025803569721, "core_hours": 9.351025803569721} {"step": 18000, "l2_params": 311.9881542598012, "train/loss": 3.377547264099121, "l2_grads": 1.4140625, "lr": 0.0009850782770740069, "uptime": 33835.367364016, "examples_seen": 18432000.0, "progress": 0.15985364510714634, "epoch": 14.386883208824454, "img/sec/core": 549.397092678319, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 9.37691276659111, "core_hours": 9.37691276659111} {"step": 18050, "l2_params": 312.11999082384165, "train/loss": 5.676648378372192, "l2_grads": 1.0546875, "lr": 0.00098489209727257, "uptime": 33928.776980662995, "examples_seen": 18483200.0, "progress": 0.16029768301022176, "epoch": 14.426846773293411, "img/sec/core": 548.1234356574776, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 9.402859882326387, "core_hours": 9.402859882326387} {"step": 18100, "l2_params": 312.26140422779196, "train/loss": 3.461441993713379, "l2_grads": 1.4375, "lr": 0.0009847047809836505, "uptime": 34023.404950229, "examples_seen": 18534400.0, "progress": 0.16074172091329716, "epoch": 14.466810337762368, "img/sec/core": 541.0662432558149, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 9.429145429428052, "core_hours": 9.429145429428052} {"step": 18150, "l2_params": 312.42849181852796, "train/loss": 4.477432489395142, "l2_grads": 1.1875, "lr": 0.0009845163286462783, "uptime": 34117.553947060005, "examples_seen": 18585600.0, "progress": 0.16118575881637257, "epoch": 14.506773902231325, "img/sec/core": 543.8188586534019, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 9.455297928547775, "core_hours": 9.455297928547775} {"step": 18200, "l2_params": 312.5892122658746, "train/loss": 3.4731927514076233, "l2_grads": 1.453125, "lr": 0.000984326740702148, "uptime": 34210.839541987996, "examples_seen": 18636800.0, "progress": 0.16162979671944797, "epoch": 14.546737466700282, "img/sec/core": 548.8521570722497, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 9.481210593805553, "core_hours": 9.481210593805553} {"step": 18250, "l2_params": 312.78181979916127, "train/loss": 3.376075565814972, "l2_grads": 1.5078125, "lr": 0.0009841360175956153, "uptime": 34305.04463862399, "examples_seen": 18688000.0, "progress": 0.16207383462252337, "epoch": 14.58670103116924, "img/sec/core": 543.4950106556764, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 9.507378676204441, "core_hours": 9.507378676204441} {"step": 18300, "l2_params": 312.9356057711794, "train/loss": 4.659180402755737, "l2_grads": 1.1875, "lr": 0.0009839441597736943, "uptime": 34399.876957479006, "examples_seen": 18739200.0, "progress": 0.1625178725255988, "epoch": 14.626664595638195, "img/sec/core": 539.9003274219463, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 9.5337209869975, "core_hours": 9.5337209869975} {"step": 18350, "l2_params": 313.15996093500286, "train/loss": 3.395874798297882, "l2_grads": 1.453125, "lr": 0.0009837511676860629, "uptime": 34494.634711520004, "examples_seen": 18790400.0, "progress": 0.1629619104286742, "epoch": 14.666628160107152, "img/sec/core": 540.3251746326483, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 9.56004258534222, "core_hours": 9.56004258534222} {"step": 18400, "l2_params": 313.21152434796363, "train/loss": 4.49511981010437, "l2_grads": 1.1796875, "lr": 0.0009835570417850513, "uptime": 34587.755345977, "examples_seen": 18841600.0, "progress": 0.1634059483317496, "epoch": 14.706591724576109, "img/sec/core": 549.8244325605559, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 9.585909428246943, "core_hours": 9.585909428246943} {"step": 18450, "l2_params": 313.35864069036376, "train/loss": 3.3527831435203552, "l2_grads": 1.421875, "lr": 0.0009833617825256529, "uptime": 34680.981942942, "examples_seen": 18892800.0, "progress": 0.163849986234825, "epoch": 14.746555289045066, "img/sec/core": 549.1994952816319, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 9.611805705181665, "core_hours": 9.611805705181665} {"step": 18500, "l2_params": 313.6944531880306, "train/loss": 5.351852059364319, "l2_grads": 1.203125, "lr": 0.0009831653903655162, "uptime": 34775.350060649, "examples_seen": 18944000.0, "progress": 0.16429402413790042, "epoch": 14.786518853514023, "img/sec/core": 542.5561221743061, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 9.638019071211387, "core_hours": 9.638019071211387} {"step": 18550, "l2_params": 313.79060992164824, "train/loss": 3.437958538532257, "l2_grads": 1.3984375, "lr": 0.0009829678657649428, "uptime": 34868.632393612, "examples_seen": 18995200.0, "progress": 0.16473806204097582, "epoch": 14.82648241798298, "img/sec/core": 548.8713497368223, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 9.663930830367775, "core_hours": 9.663930830367775} {"step": 18600, "l2_params": 313.88026584840037, "train/loss": 5.6498188972473145, "l2_grads": 1.0546875, "lr": 0.0009827692091868908, "uptime": 34962.882561941005, "examples_seen": 19046400.0, "progress": 0.16518209994405122, "epoch": 14.866445982451937, "img/sec/core": 543.23510406129, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 9.690111432681388, "core_hours": 9.690111432681388} {"step": 18650, "l2_params": 314.052988040036, "train/loss": 4.63096559047699, "l2_grads": 1.125, "lr": 0.0009825694210969683, "uptime": 35056.442885507, "examples_seen": 19097600.0, "progress": 0.16562613784712663, "epoch": 14.906409546920893, "img/sec/core": 547.2405187214329, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 9.71610041144972, "core_hours": 9.71610041144972} {"step": 18700, "l2_params": 314.2318246906852, "train/loss": 3.3646782636642456, "l2_grads": 1.40625, "lr": 0.0009823685019634397, "uptime": 35150.265375979, "examples_seen": 19148800.0, "progress": 0.16607017575020203, "epoch": 14.94637311138985, "img/sec/core": 545.7113720006977, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 9.74216221435861, "core_hours": 9.74216221435861} {"step": 18750, "l2_params": 314.3723331770585, "train/loss": 3.5345045924186707, "l2_grads": 1.4765625, "lr": 0.0009821664522572176, "uptime": 35244.114081009, "examples_seen": 19200000.0, "progress": 0.16651421365327745, "epoch": 14.986336675858807, "img/sec/core": 545.5589396106819, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 9.768231299089164, "core_hours": 9.768231299089164} {"step": 18800, "l2_params": 314.58245671097507, "train/loss": 3.3735339641571045, "l2_grads": 1.390625, "lr": 0.000981963272451864, "uptime": 35337.558167478, "examples_seen": 19251200.0, "progress": 0.16695825155635285, "epoch": 15.026300240327764, "img/sec/core": 547.9212429026561, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 9.794187989774999, "core_hours": 9.794187989774999} {"step": 18850, "l2_params": 314.71681374143725, "train/loss": 3.4982117414474487, "l2_grads": 1.3671875, "lr": 0.000981758963023592, "uptime": 35431.098762049995, "examples_seen": 19302400.0, "progress": 0.16740228945942826, "epoch": 15.066263804796721, "img/sec/core": 547.3559392504359, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 9.82017148826722, "core_hours": 9.82017148826722} {"step": 18900, "l2_params": 314.8824231831423, "train/loss": 3.6728046536445618, "l2_grads": 1.3125, "lr": 0.0009815535244512609, "uptime": 35525.835478362, "examples_seen": 19353600.0, "progress": 0.16784632736250366, "epoch": 15.106227369265678, "img/sec/core": 540.4451620571399, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 9.84648724279833, "core_hours": 9.84648724279833} {"step": 18950, "l2_params": 315.06738490559445, "train/loss": 3.7020536065101624, "l2_grads": 1.34375, "lr": 0.0009813469572163755, "uptime": 35619.017632681, "examples_seen": 19404800.0, "progress": 0.16829036526557906, "epoch": 15.146190933734633, "img/sec/core": 549.461432547705, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 9.87237117455361, "core_hours": 9.87237117455361} {"step": 19000, "l2_params": 315.18217853181756, "train/loss": 4.556788325309753, "l2_grads": 1.140625, "lr": 0.0009811392618030873, "uptime": 35712.300664696, "examples_seen": 19456000.0, "progress": 0.16873440316865448, "epoch": 15.18615449820359, "img/sec/core": 548.8672365598674, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 9.89828312789111, "core_hours": 9.89828312789111} {"step": 19050, "l2_params": 315.34776654859553, "train/loss": 5.814199447631836, "l2_grads": 1.15625, "lr": 0.0009809304386981918, "uptime": 35807.486026331, "examples_seen": 19507200.0, "progress": 0.16917844107172988, "epoch": 15.226118062672548, "img/sec/core": 537.8978355551532, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 9.924723506123055, "core_hours": 9.924723506123055} {"step": 19100, "l2_params": 315.55089631319777, "train/loss": 3.4259961247444153, "l2_grads": 1.4609375, "lr": 0.0009807204883911281, "uptime": 35901.078003666, "examples_seen": 19558400.0, "progress": 0.16962247897480529, "epoch": 15.266081627141505, "img/sec/core": 547.0554363515432, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 9.950721277604996, "core_hours": 9.950721277604996} {"step": 19151, "l2_params": 315.6655991833961, "train/loss": 3.9423552751541138, "l2_grads": 1.34375, "lr": 0.0009805094113739755, "uptime": 35994.872053927, "examples_seen": 19609600.0, "progress": 0.17006651687788069, "epoch": 15.306045191610462, "img/sec/core": 545.8768424812254, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 9.976775180455274, "core_hours": 9.976775180455274} {"step": 19200, "l2_params": 315.7418471829479, "train/loss": 3.923916757106781, "l2_grads": 1.3828125, "lr": 0.0009802972081414554, "uptime": 36089.595892875004, "examples_seen": 19660800.0, "progress": 0.17051055478095611, "epoch": 15.346008756079419, "img/sec/core": 540.5186336261623, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 10.003087357940833, "core_hours": 10.003087357940833} {"step": 19250, "l2_params": 315.97032161363666, "train/loss": 3.5411665439605713, "l2_grads": 1.3828125, "lr": 0.000980083879190929, "uptime": 36183.765967663, "examples_seen": 19712000.0, "progress": 0.17095459268403151, "epoch": 15.385972320548374, "img/sec/core": 543.697136433868, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 10.02924571204861, "core_hours": 10.02924571204861} {"step": 19301, "l2_params": 316.0785278094472, "train/loss": 3.372646450996399, "l2_grads": 1.453125, "lr": 0.000979869425022396, "uptime": 36277.068729896, "examples_seen": 19763200.0, "progress": 0.17139863058710691, "epoch": 15.425935885017331, "img/sec/core": 548.7511706474717, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 10.05516314600222, "core_hours": 10.05516314600222} {"step": 19350, "l2_params": 316.224744236101, "train/loss": 5.61153244972229, "l2_grads": 0.94140625, "lr": 0.0009796538461384913, "uptime": 36370.479852274, "examples_seen": 19814400.0, "progress": 0.17184266849018232, "epoch": 15.465899449486288, "img/sec/core": 548.1146002380063, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 10.081110679996108, "core_hours": 10.081110679996108} {"step": 19400, "l2_params": 316.33911324765467, "train/loss": 3.6869648694992065, "l2_grads": 1.3671875, "lr": 0.0009794371430444893, "uptime": 36464.554658969995, "examples_seen": 19865600.0, "progress": 0.17228670639325772, "epoch": 15.505863013955246, "img/sec/core": 544.2477300586019, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 10.107242570744997, "core_hours": 10.107242570744997} {"step": 19450, "l2_params": 316.52600511500236, "train/loss": 3.446450650691986, "l2_grads": 1.4765625, "lr": 0.0009792193162482972, "uptime": 36559.530946426006, "examples_seen": 19916800.0, "progress": 0.17273074429633314, "epoch": 15.545826578424203, "img/sec/core": 539.0819263568033, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 10.13362487281611, "core_hours": 10.13362487281611} {"step": 19500, "l2_params": 316.6748628325273, "train/loss": 3.4951465129852295, "l2_grads": 1.3671875, "lr": 0.0009790003662604556, "uptime": 36654.697196921, "examples_seen": 19968000.0, "progress": 0.17317478219940854, "epoch": 15.58579014289316, "img/sec/core": 538.00585537086, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 10.160059942398055, "core_hours": 10.160059942398055} {"step": 19550, "l2_params": 316.79524699026814, "train/loss": 5.649278998374939, "l2_grads": 1.078125, "lr": 0.0009787802935941373, "uptime": 36747.853744677006, "examples_seen": 20019200.0, "progress": 0.17361882010248395, "epoch": 15.625753707362115, "img/sec/core": 549.6124666846346, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 10.185936761219164, "core_hours": 10.185936761219164} {"step": 19600, "l2_params": 316.9349471771573, "train/loss": 3.266789734363556, "l2_grads": 1.4453125, "lr": 0.0009785590987651492, "uptime": 36842.23507442699, "examples_seen": 20070400.0, "progress": 0.17406285800555935, "epoch": 15.665717271831072, "img/sec/core": 542.4801720385055, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 10.21215379726083, "core_hours": 10.21215379726083} {"step": 19650, "l2_params": 317.0742424028046, "train/loss": 5.6455979347229, "l2_grads": 1.09375, "lr": 0.0009783367822919261, "uptime": 36935.815281922, "examples_seen": 20121600.0, "progress": 0.17450689590863477, "epoch": 15.70568083630003, "img/sec/core": 547.1242410178805, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 10.238148299342777, "core_hours": 10.238148299342777} {"step": 19700, "l2_params": 317.2514421386647, "train/loss": 4.03640604019165, "l2_grads": 1.203125, "lr": 0.0009781133446955328, "uptime": 37030.20273484, "examples_seen": 20172800.0, "progress": 0.17495093381171017, "epoch": 15.745644400768986, "img/sec/core": 542.4449798903127, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 10.264367036264442, "core_hours": 10.264367036264442} {"step": 19750, "l2_params": 317.3213002891352, "train/loss": 5.130093932151794, "l2_grads": 1.1171875, "lr": 0.0009778887864996602, "uptime": 37124.347331034995, "examples_seen": 20224000.0, "progress": 0.17539497171478557, "epoch": 15.785607965237944, "img/sec/core": 543.8442785813187, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 10.290518312985276, "core_hours": 10.290518312985276} {"step": 19800, "l2_params": 317.45367218599785, "train/loss": 3.3891602754592896, "l2_grads": 1.40625, "lr": 0.0009776631082306275, "uptime": 37218.60469819, "examples_seen": 20275200.0, "progress": 0.17583900961786098, "epoch": 15.8255715297069, "img/sec/core": 543.1936149437108, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 10.316700914972776, "core_hours": 10.316700914972776} {"step": 19850, "l2_params": 317.64974323144037, "train/loss": 3.303731918334961, "l2_grads": 1.4140625, "lr": 0.0009774363104173775, "uptime": 37313.139049877995, "examples_seen": 20326400.0, "progress": 0.17628304752093638, "epoch": 15.865535094175858, "img/sec/core": 541.6020640727376, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 10.34296045710833, "core_hours": 10.34296045710833} {"step": 19900, "l2_params": 317.82010960653906, "train/loss": 4.758210778236389, "l2_grads": 1.1875, "lr": 0.0009772083935914765, "uptime": 37407.301053317, "examples_seen": 20377600.0, "progress": 0.1767270854240118, "epoch": 15.905498658644813, "img/sec/core": 543.7437408940483, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 10.36911656917472, "core_hours": 10.36911656917472} {"step": 19951, "l2_params": 317.9462614897563, "train/loss": 3.3394309282302856, "l2_grads": 1.4453125, "lr": 0.000976979358287116, "uptime": 37500.632484767004, "examples_seen": 20428800.0, "progress": 0.1771711233270872, "epoch": 15.94546222311377, "img/sec/core": 548.5826072155335, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 10.39504196679972, "core_hours": 10.39504196679972} {"step": 20000, "l2_params": 318.0160468509215, "train/loss": 3.5025235414505005, "l2_grads": 1.46875, "lr": 0.0009767492050411083, "uptime": 37596.247983812995, "examples_seen": 20480000.0, "progress": 0.1776151612301626, "epoch": 15.985425787582727, "img/sec/core": 535.4780397618277, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 10.421601827645832, "core_hours": 10.421601827645832, "val/acc@1": 0.4800502232142857, "val/loss": 2.3362899209771837, "z/secs/eval/val": 31.697127227002056} {"step": 20050, "l2_params": 318.1483691072846, "train/loss": 5.16718316078186, "l2_grads": 1.0859375, "lr": 0.0009765179343928833, "uptime": 37721.024408059995, "examples_seen": 20531200.0, "progress": 0.178059199133238, "epoch": 16.025389352051683, "img/sec/core": 410.33392573141396, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 10.456261945492221, "core_hours": 10.456261945492221} {"step": 20100, "l2_params": 318.2998567830733, "train/loss": 5.47935676574707, "l2_grads": 1.03125, "lr": 0.0009762855468844938, "uptime": 37814.233910241994, "examples_seen": 20582400.0, "progress": 0.17850323703631343, "epoch": 16.06535291652064, "img/sec/core": 549.3002194135538, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 10.482153473876108, "core_hours": 10.482153473876108} {"step": 20150, "l2_params": 318.4886980431959, "train/loss": 4.204646587371826, "l2_grads": 1.15625, "lr": 0.0009760520430606079, "uptime": 37908.66776676499, "examples_seen": 20633600.0, "progress": 0.17894727493938883, "epoch": 16.105316480989597, "img/sec/core": 542.1784292747842, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 10.508385100688054, "core_hours": 10.508385100688054} {"step": 20200, "l2_params": 318.5361660196531, "train/loss": 5.155698299407959, "l2_grads": 1.203125, "lr": 0.0009758174234685112, "uptime": 38002.150012332, "examples_seen": 20684800.0, "progress": 0.17939131284246423, "epoch": 16.145280045458556, "img/sec/core": 547.6975835299573, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 10.53435239112333, "core_hours": 10.53435239112333} {"step": 20250, "l2_params": 318.64980962158916, "train/loss": 3.3567128777503967, "l2_grads": 1.3671875, "lr": 0.0009755816886581035, "uptime": 38096.64705907401, "examples_seen": 20736000.0, "progress": 0.17983535074553963, "epoch": 16.18524360992751, "img/sec/core": 541.815874307534, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 10.560601570773887, "core_hours": 10.560601570773887} {"step": 20300, "l2_params": 318.84468416015267, "train/loss": 3.2834802865982056, "l2_grads": 1.4921875, "lr": 0.0009753448391818979, "uptime": 38191.014993239995, "examples_seen": 20787200.0, "progress": 0.18027938864861504, "epoch": 16.22520717439647, "img/sec/core": 542.5571774193764, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 10.586814885819997, "core_hours": 10.586814885819997} {"step": 20350, "l2_params": 318.98935406657773, "train/loss": 3.294914424419403, "l2_grads": 1.5234375, "lr": 0.0009751068755950216, "uptime": 38284.21148850799, "examples_seen": 20838400.0, "progress": 0.18072342655169046, "epoch": 16.265170738865425, "img/sec/core": 549.3768821753165, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 10.612702801172219, "core_hours": 10.612702801172219} {"step": 20400, "l2_params": 319.17169562644887, "train/loss": 5.482381820678711, "l2_grads": 1.1484375, "lr": 0.0009748677984552128, "uptime": 38378.842092144, "examples_seen": 20889600.0, "progress": 0.18116746445476586, "epoch": 16.30513430333438, "img/sec/core": 541.0511825216774, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 10.638989079959998, "core_hours": 10.638989079959998} {"step": 20450, "l2_params": 319.24412221732837, "train/loss": 3.391166865825653, "l2_grads": 1.421875, "lr": 0.000974627608322818, "uptime": 38473.251602526, "examples_seen": 20940800.0, "progress": 0.18161150235784126, "epoch": 16.34509786780334, "img/sec/core": 542.3182451940957, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 10.665213943954999, "core_hours": 10.665213943954999} {"step": 20500, "l2_params": 319.3791921202366, "train/loss": 3.226256847381592, "l2_grads": 1.484375, "lr": 0.0009743863057607944, "uptime": 38567.321590834006, "examples_seen": 20992000.0, "progress": 0.18205554026091667, "epoch": 16.385061432272295, "img/sec/core": 544.2756071401041, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 10.691344496262777, "core_hours": 10.691344496262777} {"step": 20550, "l2_params": 319.45500159940366, "train/loss": 3.2690482139587402, "l2_grads": 1.546875, "lr": 0.0009741438913347054, "uptime": 38661.896130488996, "examples_seen": 21043200.0, "progress": 0.18249957816399207, "epoch": 16.425024996741254, "img/sec/core": 541.3719187719522, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 10.717615201722499, "core_hours": 10.717615201722499} {"step": 20600, "l2_params": 319.54931489276817, "train/loss": 3.2709702849388123, "l2_grads": 1.453125, "lr": 0.0009739003656127207, "uptime": 38755.136257779, "examples_seen": 21094400.0, "progress": 0.1829436160670675, "epoch": 16.46498856121021, "img/sec/core": 549.1197994695345, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 10.743515237080832, "core_hours": 10.743515237080832} {"step": 20650, "l2_params": 319.71850564451614, "train/loss": 4.653696060180664, "l2_grads": 1.2890625, "lr": 0.0009736557291656145, "uptime": 38849.668659171, "examples_seen": 21145600.0, "progress": 0.1833876539701429, "epoch": 16.504952125679164, "img/sec/core": 541.6132378536503, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 10.769774237467498, "core_hours": 10.769774237467498} {"step": 20700, "l2_params": 319.81284199708114, "train/loss": 3.3412429094314575, "l2_grads": 1.4453125, "lr": 0.0009734099825667643, "uptime": 38942.996007087, "examples_seen": 21196800.0, "progress": 0.1838316918732183, "epoch": 16.544915690148123, "img/sec/core": 548.6066104233893, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 10.795698500777497, "core_hours": 10.795698500777497} {"step": 20750, "l2_params": 319.9634378526709, "train/loss": 3.350365459918976, "l2_grads": 1.375, "lr": 0.0009731631263921505, "uptime": 39038.29671876501, "examples_seen": 21248000.0, "progress": 0.1842757297762937, "epoch": 16.58487925461708, "img/sec/core": 537.2467749557848, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 10.822170920688054, "core_hours": 10.822170920688054} {"step": 20800, "l2_params": 320.00748129682455, "train/loss": 3.62092262506485, "l2_grads": 1.3984375, "lr": 0.0009729151612203525, "uptime": 39131.554164261004, "examples_seen": 21299200.0, "progress": 0.18471976767936912, "epoch": 16.624842819086037, "img/sec/core": 549.0178261659263, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 10.848075766659166, "core_hours": 10.848075766659166} {"step": 20850, "l2_params": 320.170143671201, "train/loss": 3.209819197654724, "l2_grads": 1.4453125, "lr": 0.0009726660876325496, "uptime": 39224.91035414999, "examples_seen": 21350400.0, "progress": 0.18516380558244452, "epoch": 16.664806383554993, "img/sec/core": 548.437120890199, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 10.874008041628331, "core_hours": 10.874008041628331} {"step": 20900, "l2_params": 320.2833477587658, "train/loss": 3.1148858070373535, "l2_grads": 1.4375, "lr": 0.0009724159062125193, "uptime": 39319.550348175995, "examples_seen": 21401600.0, "progress": 0.18560784348551992, "epoch": 16.70476994802395, "img/sec/core": 540.9974982239872, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 10.900296928857776, "core_hours": 10.900296928857776} {"step": 20951, "l2_params": 320.3963091576977, "train/loss": 5.6634544134140015, "l2_grads": 1.109375, "lr": 0.0009721646175466357, "uptime": 39413.653258876, "examples_seen": 21452800.0, "progress": 0.18605188138859532, "epoch": 16.744733512492907, "img/sec/core": 544.0851894924466, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 10.926436626274443, "core_hours": 10.926436626274443} {"step": 21000, "l2_params": 320.5211500309886, "train/loss": 5.120823979377747, "l2_grads": 1.109375, "lr": 0.0009719122222238677, "uptime": 39508.905129542996, "examples_seen": 21504000.0, "progress": 0.18649591929167073, "epoch": 16.784697076961862, "img/sec/core": 537.5222517045784, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 10.952895479237498, "core_hours": 10.952895479237498} {"step": 21050, "l2_params": 320.6525755685583, "train/loss": 3.2217625975608826, "l2_grads": 1.390625, "lr": 0.0009716587208357784, "uptime": 39602.335363884995, "examples_seen": 21555200.0, "progress": 0.18693995719474615, "epoch": 16.82466064143082, "img/sec/core": 548.0024786471575, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 10.978848322110276, "core_hours": 10.978848322110276} {"step": 21100, "l2_params": 320.7344233357249, "train/loss": 3.246973991394043, "l2_grads": 1.5234375, "lr": 0.000971404113976522, "uptime": 39697.014865061996, "examples_seen": 21606400.0, "progress": 0.18738399509782155, "epoch": 16.864624205899776, "img/sec/core": 540.7717548520128, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 11.00514818354833, "core_hours": 11.00514818354833} {"step": 21150, "l2_params": 320.924645251323, "train/loss": 3.331363618373871, "l2_grads": 1.421875, "lr": 0.0009711484022428453, "uptime": 39790.386372351, "examples_seen": 21657600.0, "progress": 0.18782803300089695, "epoch": 16.904587770368735, "img/sec/core": 548.3471509304138, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 11.03108471335083, "core_hours": 11.03108471335083} {"step": 21200, "l2_params": 320.99407059846914, "train/loss": 3.2788676619529724, "l2_grads": 1.4921875, "lr": 0.0009708915862340844, "uptime": 39885.21179682799, "examples_seen": 21708800.0, "progress": 0.18827207090397236, "epoch": 16.94455133483769, "img/sec/core": 539.9395814191037, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 11.057425109038887, "core_hours": 11.057425109038887} {"step": 21250, "l2_params": 321.13136640974125, "train/loss": 3.223505914211273, "l2_grads": 1.4921875, "lr": 0.0009706336665521626, "uptime": 39978.532658715005, "examples_seen": 21760000.0, "progress": 0.18871610880704778, "epoch": 16.98451489930665, "img/sec/core": 548.6447399295796, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 11.083347570674166, "core_hours": 11.083347570674166} {"step": 21300, "l2_params": 321.2190357766994, "train/loss": 4.420870780944824, "l2_grads": 1.2109375, "lr": 0.000970374643801591, "uptime": 40071.921917578, "examples_seen": 21811200.0, "progress": 0.18916014671012318, "epoch": 17.024478463775605, "img/sec/core": 548.2429202603583, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 11.109289031469443, "core_hours": 11.109289031469443} {"step": 21350, "l2_params": 321.33733005597094, "train/loss": 3.128492295742035, "l2_grads": 1.4453125, "lr": 0.0009701145185894661, "uptime": 40166.338461573, "examples_seen": 21862400.0, "progress": 0.18960418461319858, "epoch": 17.06444202824456, "img/sec/core": 542.2778448945429, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 11.13551584924583, "core_hours": 11.13551584924583} {"step": 21400, "l2_params": 321.4623948287925, "train/loss": 5.190064907073975, "l2_grads": 1.1171875, "lr": 0.0009698532915254676, "uptime": 40259.80782319, "examples_seen": 21913600.0, "progress": 0.19004822251627398, "epoch": 17.10440559271352, "img/sec/core": 547.773078945363, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 11.161479560806107, "core_hours": 11.161479560806107} {"step": 21450, "l2_params": 321.5184949238924, "train/loss": 3.2641876935958862, "l2_grads": 1.46875, "lr": 0.0009695909632218582, "uptime": 40354.891831832996, "examples_seen": 21964800.0, "progress": 0.19049226041934939, "epoch": 17.144369157182474, "img/sec/core": 538.4711975305158, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 11.187891785429166, "core_hours": 11.187891785429166} {"step": 21500, "l2_params": 321.6995016097126, "train/loss": 3.133400559425354, "l2_grads": 1.4140625, "lr": 0.0009693275342934815, "uptime": 40450.06493302999, "examples_seen": 22016000.0, "progress": 0.1909362983224248, "epoch": 17.184332721651433, "img/sec/core": 537.9671289056995, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 11.214328757983886, "core_hours": 11.214328757983886} {"step": 21550, "l2_params": 321.8615880094074, "train/loss": 5.512892246246338, "l2_grads": 0.984375, "lr": 0.0009690630053577604, "uptime": 40543.342598281, "examples_seen": 22067200.0, "progress": 0.1913803362255002, "epoch": 17.22429628612039, "img/sec/core": 548.8988158336331, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 11.240239220553608, "core_hours": 11.240239220553608} {"step": 21600, "l2_params": 321.93025769615457, "train/loss": 3.1392341256141663, "l2_grads": 1.4921875, "lr": 0.0009687973770346977, "uptime": 40637.634864181004, "examples_seen": 22118400.0, "progress": 0.19182437412857561, "epoch": 17.264259850589344, "img/sec/core": 542.9925722041454, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 11.266431516636942, "core_hours": 11.266431516636942} {"step": 21650, "l2_params": 322.02373535628163, "train/loss": 3.257896363735199, "l2_grads": 1.4921875, "lr": 0.0009685306499468692, "uptime": 40731.554850579996, "examples_seen": 22169600.0, "progress": 0.19226841203165101, "epoch": 17.304223415058303, "img/sec/core": 545.1448830335997, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 11.292520401747776, "core_hours": 11.292520401747776} {"step": 21700, "l2_params": 322.15138315995944, "train/loss": 5.295005559921265, "l2_grads": 1.1171875, "lr": 0.0009682628247194309, "uptime": 40825.78530989699, "examples_seen": 22220800.0, "progress": 0.19271244993472642, "epoch": 17.344186979527258, "img/sec/core": 543.3487257847257, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 11.31869552933583, "core_hours": 11.31869552933583} {"step": 21750, "l2_params": 322.2758850639464, "train/loss": 3.129788815975189, "l2_grads": 1.484375, "lr": 0.0009679939019801087, "uptime": 40920.197869712996, "examples_seen": 22272000.0, "progress": 0.19315648783780184, "epoch": 17.384150543996217, "img/sec/core": 542.3007288413949, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 11.34492124039583, "core_hours": 11.34492124039583} {"step": 21800, "l2_params": 322.375455905552, "train/loss": 3.136981427669525, "l2_grads": 1.46875, "lr": 0.0009677238823592026, "uptime": 41013.510198514996, "examples_seen": 22323200.0, "progress": 0.19360052574087724, "epoch": 17.424114108465172, "img/sec/core": 548.6949115656706, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 11.37084133172972, "core_hours": 11.37084133172972} {"step": 21850, "l2_params": 322.4380633354257, "train/loss": 2.9858816266059875, "l2_grads": 1.484375, "lr": 0.0009674527664895842, "uptime": 41108.195240677, "examples_seen": 22374400.0, "progress": 0.19404456364395264, "epoch": 17.46407767293413, "img/sec/core": 540.7401087956636, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 11.397142732330275, "core_hours": 11.397142732330275} {"step": 21900, "l2_params": 322.58082502200125, "train/loss": 5.3385947942733765, "l2_grads": 1.1328125, "lr": 0.0009671805550066915, "uptime": 41201.82152528, "examples_seen": 22425600.0, "progress": 0.19448860154702804, "epoch": 17.504041237403086, "img/sec/core": 546.854980063571, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 11.423150033608886, "core_hours": 11.423150033608886} {"step": 21950, "l2_params": 322.6680430653538, "train/loss": 3.3149490356445312, "l2_grads": 1.5234375, "lr": 0.0009669072485485337, "uptime": 41296.931268486005, "examples_seen": 22476800.0, "progress": 0.19493263945010347, "epoch": 17.544004801872042, "img/sec/core": 538.3254993034964, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 11.449569406721666, "core_hours": 11.449569406721666} {"step": 22000, "l2_params": 322.81726763178267, "train/loss": 3.2594716548919678, "l2_grads": 1.5234375, "lr": 0.0009666328477556844, "uptime": 41392.523106103006, "examples_seen": 22528000.0, "progress": 0.19537667735317887, "epoch": 17.583968366341, "img/sec/core": 535.6105842963103, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 11.476122694948609, "core_hours": 11.476122694948609} {"step": 22050, "l2_params": 322.89837313774126, "train/loss": 3.3989591002464294, "l2_grads": 1.4609375, "lr": 0.000966357353271283, "uptime": 41485.956286282, "examples_seen": 22579200.0, "progress": 0.19582071525625427, "epoch": 17.623931930809956, "img/sec/core": 547.9852007810601, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 11.502076356109443, "core_hours": 11.502076356109443} {"step": 22100, "l2_params": 322.9978442991145, "train/loss": 5.399383783340454, "l2_grads": 1.3828125, "lr": 0.000966080765741032, "uptime": 41580.50956686, "examples_seen": 22630400.0, "progress": 0.19626475315932967, "epoch": 17.663895495278915, "img/sec/core": 541.4936392160643, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 11.528341156269997, "core_hours": 11.528341156269997} {"step": 22150, "l2_params": 323.0848590879415, "train/loss": 3.1190225481987, "l2_grads": 1.4453125, "lr": 0.0009658030858131953, "uptime": 41674.345098968, "examples_seen": 22681600.0, "progress": 0.19670879106240508, "epoch": 17.70385905974787, "img/sec/core": 545.6355268606616, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 11.554406581855554, "core_hours": 11.554406581855554} {"step": 22200, "l2_params": 323.1656164027974, "train/loss": 5.009225487709045, "l2_grads": 1.109375, "lr": 0.0009655243141385982, "uptime": 41768.288676619995, "examples_seen": 22732800.0, "progress": 0.1971528289654805, "epoch": 17.743822624216826, "img/sec/core": 545.0079854278549, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 11.58050202009222, "core_hours": 11.58050202009222} {"step": 22250, "l2_params": 323.2681606823312, "train/loss": 5.386575222015381, "l2_grads": 1.2421875, "lr": 0.0009652444513706237, "uptime": 41862.68695511999, "examples_seen": 22784000.0, "progress": 0.1975968668685559, "epoch": 17.783786188685784, "img/sec/core": 542.3827723722903, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 11.606723764119998, "core_hours": 11.606723764119998} {"step": 22300, "l2_params": 323.46047925616045, "train/loss": 3.156839072704315, "l2_grads": 1.4375, "lr": 0.000964963498165213, "uptime": 41956.739520313, "examples_seen": 22835200.0, "progress": 0.1980409047716313, "epoch": 17.82374975315474, "img/sec/core": 544.3764334862664, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 11.63284947667361, "core_hours": 11.63284947667361} {"step": 22350, "l2_params": 323.49149911551, "train/loss": 3.569038212299347, "l2_grads": 1.5390625, "lr": 0.0009646814551808627, "uptime": 42051.136356510004, "examples_seen": 22886400.0, "progress": 0.1984849426747067, "epoch": 17.8637133176237, "img/sec/core": 542.3910595175769, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 11.659070820061665, "core_hours": 11.659070820061665} {"step": 22400, "l2_params": 323.5660780056177, "train/loss": 3.58547842502594, "l2_grads": 1.4453125, "lr": 0.0009643983230786233, "uptime": 42145.675472917006, "examples_seen": 22937600.0, "progress": 0.19892898057778213, "epoch": 17.903676882092654, "img/sec/core": 541.5747676292822, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 11.685331685730278, "core_hours": 11.685331685730278} {"step": 22450, "l2_params": 323.6839384217071, "train/loss": 4.912771224975586, "l2_grads": 1.109375, "lr": 0.0009641141025220983, "uptime": 42238.94568569701, "examples_seen": 22988800.0, "progress": 0.19937301848085753, "epoch": 17.943640446561613, "img/sec/core": 548.9426739142027, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 11.711240078169165, "core_hours": 11.711240078169165} {"step": 22500, "l2_params": 323.72125837670905, "train/loss": 3.2350139021873474, "l2_grads": 1.4765625, "lr": 0.0009638287941774426, "uptime": 42332.991320007, "examples_seen": 23040000.0, "progress": 0.19981705638393293, "epoch": 17.983604011030568, "img/sec/core": 544.4165524072506, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 11.737363865477498, "core_hours": 11.737363865477498, "val/acc@1": 0.5075534119897959, "val/loss": 2.164734316419582, "z/secs/eval/val": 31.805368171997543} {"step": 22550, "l2_params": 323.85759553776103, "train/loss": 3.132388651371002, "l2_grads": 1.4765625, "lr": 0.0009635423987133605, "uptime": 42457.853280804, "examples_seen": 23091200.0, "progress": 0.20026109428700833, "epoch": 18.023567575499523, "img/sec/core": 410.0528269233209, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 11.772047743476664, "core_hours": 11.772047743476664} {"step": 22600, "l2_params": 323.9938451865251, "train/loss": 5.436702132225037, "l2_grads": 1.203125, "lr": 0.0009632549168011038, "uptime": 42551.113990711005, "examples_seen": 23142400.0, "progress": 0.20070513219008373, "epoch": 18.063531139968482, "img/sec/core": 548.9986088574312, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 11.79795349622861, "core_hours": 11.79795349622861} {"step": 22650, "l2_params": 324.0741876508564, "train/loss": 3.1801717877388, "l2_grads": 1.484375, "lr": 0.0009629663491144714, "uptime": 42644.431311715, "examples_seen": 23193600.0, "progress": 0.20114917009315916, "epoch": 18.103494704437438, "img/sec/core": 548.6655580029683, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 11.823874974285275, "core_hours": 11.823874974285275} {"step": 22700, "l2_params": 324.17626378252925, "train/loss": 3.0391637682914734, "l2_grads": 1.359375, "lr": 0.0009626766963298065, "uptime": 42738.557448185995, "examples_seen": 23244800.0, "progress": 0.20159320799623456, "epoch": 18.143458268906397, "img/sec/core": 543.9509356232224, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 11.850021123304998, "core_hours": 11.850021123304998} {"step": 22750, "l2_params": 324.25072432696663, "train/loss": 3.120224893093109, "l2_grads": 1.4375, "lr": 0.0009623859591259959, "uptime": 42832.288488673, "examples_seen": 23296000.0, "progress": 0.20203724589930996, "epoch": 18.183421833375352, "img/sec/core": 546.2438028424632, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 11.876057523440275, "core_hours": 11.876057523440275} {"step": 22800, "l2_params": 324.3496979534589, "train/loss": 3.4523626565933228, "l2_grads": 1.3984375, "lr": 0.0009620941381844675, "uptime": 42927.459272625, "examples_seen": 23347200.0, "progress": 0.20248128380238536, "epoch": 18.22338539784431, "img/sec/core": 537.9802274805454, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 11.902493852315832, "core_hours": 11.902493852315832} {"step": 22850, "l2_params": 324.55053505530924, "train/loss": 5.518513083457947, "l2_grads": 1.046875, "lr": 0.0009618012341891903, "uptime": 43020.629344363, "examples_seen": 23398400.0, "progress": 0.20292532170546076, "epoch": 18.263348962313266, "img/sec/core": 549.5326883935122, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 11.92837442779861, "core_hours": 11.92837442779861} {"step": 22900, "l2_params": 324.5998317640507, "train/loss": 3.1722733974456787, "l2_grads": 1.5234375, "lr": 0.00096150724782667, "uptime": 43113.962901388004, "examples_seen": 23449600.0, "progress": 0.2033693596085362, "epoch": 18.30331252678222, "img/sec/core": 548.570113815406, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 11.954300415861109, "core_hours": 11.954300415861109} {"step": 22950, "l2_params": 324.6312376061298, "train/loss": 3.8707098364830017, "l2_grads": 1.328125, "lr": 0.0009612121797859512, "uptime": 43208.426280678, "examples_seen": 23500800.0, "progress": 0.2038133975116116, "epoch": 18.34327609125118, "img/sec/core": 542.0089815209573, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 11.980540243441665, "core_hours": 11.980540243441665} {"step": 23000, "l2_params": 324.77949400564455, "train/loss": 4.372118592262268, "l2_grads": 1.234375, "lr": 0.0009609160307586124, "uptime": 43301.72319161, "examples_seen": 23552000.0, "progress": 0.204257435414687, "epoch": 18.383239655720136, "img/sec/core": 548.7855866665867, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 12.006456052033888, "core_hours": 12.006456052033888} {"step": 23050, "l2_params": 324.816561813164, "train/loss": 4.771344542503357, "l2_grads": 1.1640625, "lr": 0.0009606188014387664, "uptime": 43396.159780167, "examples_seen": 23603200.0, "progress": 0.2047014733177624, "epoch": 18.423203220189095, "img/sec/core": 542.162744147587, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 12.032688437744165, "core_hours": 12.032688437744165} {"step": 23100, "l2_params": 324.9279818042377, "train/loss": 3.583170235157013, "l2_grads": 1.390625, "lr": 0.0009603204925230576, "uptime": 43491.472885789, "examples_seen": 23654400.0, "progress": 0.20514551122083782, "epoch": 18.46316678465805, "img/sec/core": 537.1769146108439, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 12.059164300416942, "core_hours": 12.059164300416942} {"step": 23150, "l2_params": 325.00209434421345, "train/loss": 4.671717047691345, "l2_grads": 1.2265625, "lr": 0.000960021104710661, "uptime": 43584.739158971, "examples_seen": 23705600.0, "progress": 0.20558954912391322, "epoch": 18.503130349127005, "img/sec/core": 548.9658614329659, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 12.085071598523054, "core_hours": 12.085071598523054} {"step": 23200, "l2_params": 325.1254490457299, "train/loss": 3.8292757868766785, "l2_grads": 1.375, "lr": 0.0009597206387032788, "uptime": 43679.249587877, "examples_seen": 23756800.0, "progress": 0.20603358702698862, "epoch": 18.543093913595964, "img/sec/core": 541.7391561191781, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 12.111324495441387, "core_hours": 12.111324495441387} {"step": 23250, "l2_params": 325.21797077594744, "train/loss": 3.253351330757141, "l2_grads": 1.484375, "lr": 0.0009594190952051431, "uptime": 43773.13530455899, "examples_seen": 23808000.0, "progress": 0.20647762493006402, "epoch": 18.58305747806492, "img/sec/core": 545.3438692215815, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 12.137403861186387, "core_hours": 12.137403861186387} {"step": 23300, "l2_params": 325.32307559659057, "train/loss": 3.177216112613678, "l2_grads": 1.453125, "lr": 0.0009591164749230098, "uptime": 43867.741966386995, "examples_seen": 23859200.0, "progress": 0.20692166283313942, "epoch": 18.62302104253388, "img/sec/core": 541.1881046292839, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 12.163683489471943, "core_hours": 12.163683489471943} {"step": 23350, "l2_params": 325.39085421660593, "train/loss": 3.7725818157196045, "l2_grads": 1.3125, "lr": 0.000958812778566158, "uptime": 43961.152243767996, "examples_seen": 23910400.0, "progress": 0.20736570073621485, "epoch": 18.662984607002834, "img/sec/core": 548.1195585274406, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 12.189630788744442, "core_hours": 12.189630788744442} {"step": 23400, "l2_params": 325.5016471012474, "train/loss": 3.333429992198944, "l2_grads": 1.6015625, "lr": 0.0009585080068463899, "uptime": 44054.60096127, "examples_seen": 23961600.0, "progress": 0.20780973863929025, "epoch": 18.702948171471792, "img/sec/core": 547.8940895995282, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 12.21558876582833, "core_hours": 12.21558876582833} {"step": 23450, "l2_params": 325.5879687436638, "train/loss": 3.491653084754944, "l2_grads": 1.296875, "lr": 0.0009582021604780281, "uptime": 44149.45784627, "examples_seen": 24012800.0, "progress": 0.20825377654236565, "epoch": 18.742911735940748, "img/sec/core": 539.7605034152178, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 12.241937900550552, "core_hours": 12.241937900550552} {"step": 23500, "l2_params": 325.67743249887997, "train/loss": 4.775983929634094, "l2_grads": 1.2421875, "lr": 0.0009578952401779134, "uptime": 44242.791128230994, "examples_seen": 24064000.0, "progress": 0.20869781444544105, "epoch": 18.782875300409703, "img/sec/core": 548.5717305151022, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 12.267863812206388, "core_hours": 12.267863812206388} {"step": 23550, "l2_params": 325.6839333066071, "train/loss": 3.20270437002182, "l2_grads": 1.5078125, "lr": 0.0009575872466654046, "uptime": 44336.972485719, "examples_seen": 24115200.0, "progress": 0.20914185234851648, "epoch": 18.822838864878662, "img/sec/core": 543.6320028252269, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 12.294025300397497, "core_hours": 12.294025300397497} {"step": 23600, "l2_params": 325.8380391151024, "train/loss": 4.890454292297363, "l2_grads": 1.2421875, "lr": 0.0009572781806623737, "uptime": 44430.95021092, "examples_seen": 24166400.0, "progress": 0.20958589025159188, "epoch": 18.862802429347617, "img/sec/core": 544.8099524700324, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 12.320130224064444, "core_hours": 12.320130224064444} {"step": 23650, "l2_params": 325.9182176103577, "train/loss": 3.2161659002304077, "l2_grads": 1.40625, "lr": 0.0009569680428932088, "uptime": 44524.260490898, "examples_seen": 24217600.0, "progress": 0.21002992815466728, "epoch": 18.902765993816576, "img/sec/core": 548.706959319703, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 12.346049746280555, "core_hours": 12.346049746280555} {"step": 23700, "l2_params": 325.97983306103464, "train/loss": 3.049364745616913, "l2_grads": 1.4765625, "lr": 0.0009566568340848092, "uptime": 44618.07990357099, "examples_seen": 24268800.0, "progress": 0.21047396605774268, "epoch": 18.94272955828553, "img/sec/core": 545.7292743715707, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 12.372110694245274, "core_hours": 12.372110694245274} {"step": 23750, "l2_params": 326.01700702139374, "train/loss": 2.914819598197937, "l2_grads": 1.5703125, "lr": 0.0009563445549665844, "uptime": 44711.446950196, "examples_seen": 24320000.0, "progress": 0.21091800396081808, "epoch": 18.98269312275449, "img/sec/core": 548.3733485288201, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 12.398045984974443, "core_hours": 12.398045984974443} {"step": 23800, "l2_params": 326.1768012352542, "train/loss": 3.0322022438049316, "l2_grads": 1.4140625, "lr": 0.0009560312062704532, "uptime": 44805.917349708005, "examples_seen": 24371200.0, "progress": 0.2113620418638935, "epoch": 19.022656687223446, "img/sec/core": 541.9687041071151, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 12.424287762616666, "core_hours": 12.424287762616666} {"step": 23850, "l2_params": 326.28121857341097, "train/loss": 3.3000404834747314, "l2_grads": 1.421875, "lr": 0.0009557167887308391, "uptime": 44899.294716644, "examples_seen": 24422400.0, "progress": 0.2118060797669689, "epoch": 19.0626202516924, "img/sec/core": 548.3127408710412, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 12.450225920098887, "core_hours": 12.450225920098887} {"step": 23900, "l2_params": 326.3611565309014, "train/loss": 5.471139669418335, "l2_grads": 1.15625, "lr": 0.0009554013030846728, "uptime": 44994.352247874005, "examples_seen": 24473600.0, "progress": 0.2122501176700443, "epoch": 19.10258381616136, "img/sec/core": 538.6211837978176, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 12.476630789884998, "core_hours": 12.476630789884998} {"step": 23950, "l2_params": 326.4169472277749, "train/loss": 3.0977379083633423, "l2_grads": 1.484375, "lr": 0.0009550847500713886, "uptime": 45087.592675376, "examples_seen": 24524800.0, "progress": 0.21269415557311971, "epoch": 19.142547380630315, "img/sec/core": 549.1180314343886, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 12.502530908635554, "core_hours": 12.502530908635554} {"step": 24000, "l2_params": 326.5149546728297, "train/loss": 4.746737003326416, "l2_grads": 1.2734375, "lr": 0.0009547671304329212, "uptime": 45182.022798013, "examples_seen": 24576000.0, "progress": 0.21313819347619511, "epoch": 19.182510945099274, "img/sec/core": 542.1998676928769, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 12.528761498256943, "core_hours": 12.528761498256943} {"step": 24050, "l2_params": 326.5151894557319, "train/loss": 3.3304486870765686, "l2_grads": 1.546875, "lr": 0.0009544484449137056, "uptime": 45275.45632095401, "examples_seen": 24627200.0, "progress": 0.21358223137927054, "epoch": 19.22247450956823, "img/sec/core": 547.983190490715, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 12.554715254629444, "core_hours": 12.554715254629444} {"step": 24100, "l2_params": 326.63191696416857, "train/loss": 3.018537759780884, "l2_grads": 1.453125, "lr": 0.0009541286942606756, "uptime": 45369.846279562, "examples_seen": 24678400.0, "progress": 0.21402626928234594, "epoch": 19.262438074037185, "img/sec/core": 542.4305800645216, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 12.580934687576107, "core_hours": 12.580934687576107} {"step": 24150, "l2_params": 326.7394765663846, "train/loss": 3.1293901801109314, "l2_grads": 1.6796875, "lr": 0.000953807879223261, "uptime": 45464.367763607996, "examples_seen": 24729600.0, "progress": 0.21447030718542134, "epoch": 19.302401638506144, "img/sec/core": 541.6757948392058, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 12.607190655366663, "core_hours": 12.607190655366663} {"step": 24200, "l2_params": 326.82529796609225, "train/loss": 3.0709208250045776, "l2_grads": 1.6796875, "lr": 0.000953486000553386, "uptime": 45557.810887117, "examples_seen": 24780800.0, "progress": 0.21491434508849674, "epoch": 19.3423652029751, "img/sec/core": 547.926889398853, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 12.63314707856361, "core_hours": 12.63314707856361} {"step": 24250, "l2_params": 326.9358003922559, "train/loss": 5.4850322008132935, "l2_grads": 1.28125, "lr": 0.0009531630590054684, "uptime": 45652.334043204, "examples_seen": 24832000.0, "progress": 0.21535838299157217, "epoch": 19.382328767444058, "img/sec/core": 541.6662130163554, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 12.659403510809998, "core_hours": 12.659403510809998} {"step": 24300, "l2_params": 326.9606036331059, "train/loss": 3.195912182331085, "l2_grads": 1.4921875, "lr": 0.0009528390553364168, "uptime": 45747.052647143006, "examples_seen": 24883200.0, "progress": 0.21580242089464757, "epoch": 19.422292331913013, "img/sec/core": 540.5485075875224, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 12.685714234126387, "core_hours": 12.685714234126387} {"step": 24350, "l2_params": 327.03420925560295, "train/loss": 3.8682308197021484, "l2_grads": 1.46875, "lr": 0.0009525139903056294, "uptime": 45841.824556027, "examples_seen": 24934400.0, "progress": 0.21624645879772297, "epoch": 19.462255896381972, "img/sec/core": 540.2444733140399, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 12.712039764371942, "core_hours": 12.712039764371942} {"step": 24400, "l2_params": 327.0774826971432, "train/loss": 4.557730436325073, "l2_grads": 1.3359375, "lr": 0.000952187864674992, "uptime": 45935.33854686, "examples_seen": 24985600.0, "progress": 0.21669049670079837, "epoch": 19.502219460850927, "img/sec/core": 547.511656212313, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 12.738015872936666, "core_hours": 12.738015872936666} {"step": 24450, "l2_params": 327.19395289720745, "train/loss": 2.9573726058006287, "l2_grads": 1.5546875, "lr": 0.0009518606792088751, "uptime": 46029.799255025006, "examples_seen": 25036800.0, "progress": 0.21713453460387377, "epoch": 19.542183025319883, "img/sec/core": 542.0243082506266, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 12.764254958538055, "core_hours": 12.764254958538055} {"step": 24500, "l2_params": 327.2491808502926, "train/loss": 3.0463441014289856, "l2_grads": 1.53125, "lr": 0.0009515324346741358, "uptime": 46124.282223190006, "examples_seen": 25088000.0, "progress": 0.2175785725069492, "epoch": 19.58214658978884, "img/sec/core": 541.8966083981045, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 12.790500227472778, "core_hours": 12.790500227472778} {"step": 24550, "l2_params": 327.42045044130566, "train/loss": 3.0606319904327393, "l2_grads": 1.4375, "lr": 0.0009512031318401106, "uptime": 46218.618359611995, "examples_seen": 25139200.0, "progress": 0.2180226104100246, "epoch": 19.622110154257797, "img/sec/core": 542.7400563763358, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 12.816704709812221, "core_hours": 12.816704709812221} {"step": 24600, "l2_params": 327.5060799769601, "train/loss": 3.0945587158203125, "l2_grads": 1.5390625, "lr": 0.000950872771478618, "uptime": 46311.875193584, "examples_seen": 25190400.0, "progress": 0.2184666483131, "epoch": 19.662073718726756, "img/sec/core": 549.0214263050315, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 12.842609385915553, "core_hours": 12.842609385915553} {"step": 24650, "l2_params": 327.6103150920122, "train/loss": 3.047233521938324, "l2_grads": 1.46875, "lr": 0.0009505413543639546, "uptime": 46407.462942091996, "examples_seen": 25241600.0, "progress": 0.2189106862161754, "epoch": 19.70203728319571, "img/sec/core": 535.6334969613381, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 12.869161538278886, "core_hours": 12.869161538278886} {"step": 24700, "l2_params": 327.61068770006955, "train/loss": 4.664072394371033, "l2_grads": 1.2890625, "lr": 0.0009502088812728944, "uptime": 46500.687068950996, "examples_seen": 25292800.0, "progress": 0.21935472411925083, "epoch": 19.742000847664666, "img/sec/core": 549.2140471043391, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 12.895057129073054, "core_hours": 12.895057129073054} {"step": 24750, "l2_params": 327.6657664330949, "train/loss": 3.198036015033722, "l2_grads": 1.6875, "lr": 0.0009498753529846866, "uptime": 46595.383803021, "examples_seen": 25344000.0, "progress": 0.21979876202232623, "epoch": 19.781964412133625, "img/sec/core": 540.6733453146675, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 12.921361777425831, "core_hours": 12.921361777425831} {"step": 24800, "l2_params": 327.66625223169154, "train/loss": 3.101788341999054, "l2_grads": 1.5390625, "lr": 0.0009495407702810517, "uptime": 46688.726376456994, "examples_seen": 25395200.0, "progress": 0.22024279992540163, "epoch": 19.82192797660258, "img/sec/core": 548.5171247727135, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 12.947290270046942, "core_hours": 12.947290270046942} {"step": 24850, "l2_params": 327.7761672549005, "train/loss": 2.980332672595978, "l2_grads": 1.5078125, "lr": 0.0009492051339461843, "uptime": 46783.468302066, "examples_seen": 25446400.0, "progress": 0.22068683782847703, "epoch": 19.86189154107154, "img/sec/core": 540.4154461806337, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 12.973607471604998, "core_hours": 12.973607471604998} {"step": 24900, "l2_params": 327.88032395363024, "train/loss": 3.5626622438430786, "l2_grads": 1.4140625, "lr": 0.0009488684447667458, "uptime": 46876.795347417006, "examples_seen": 25497600.0, "progress": 0.22113087573155243, "epoch": 19.901855105540495, "img/sec/core": 548.608388998449, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 12.999531650869166, "core_hours": 12.999531650869166} {"step": 24950, "l2_params": 327.94179707018895, "train/loss": 3.2122238278388977, "l2_grads": 1.4765625, "lr": 0.000948530703531867, "uptime": 46971.933090969, "examples_seen": 25548800.0, "progress": 0.22157491363462786, "epoch": 19.941818670009454, "img/sec/core": 538.1670627075243, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 13.025958801855833, "core_hours": 13.025958801855833} {"step": 25000, "l2_params": 328.00581019768157, "train/loss": 3.0395094752311707, "l2_grads": 1.4453125, "lr": 0.0009481919110331444, "uptime": 47065.279147451, "examples_seen": 25600000.0, "progress": 0.22201895153770326, "epoch": 19.98178223447841, "img/sec/core": 548.4966578087214, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 13.05188826198972, "core_hours": 13.05188826198972, "val/acc@1": 0.5249720982142857, "val/loss": 2.07406330473569, "z/secs/eval/val": 31.816826572998252} {"step": 25050, "l2_params": 328.11576475098695, "train/loss": 5.485339879989624, "l2_grads": 1.2578125, "lr": 0.000947852068064637, "uptime": 47190.391014092995, "examples_seen": 25651200.0, "progress": 0.22246298944077866, "epoch": 20.021745798947364, "img/sec/core": 409.2337631449894, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 13.086641558279164, "core_hours": 13.086641558279164} {"step": 25100, "l2_params": 328.2013095790067, "train/loss": 3.03182452917099, "l2_grads": 1.5390625, "lr": 0.000947511175422868, "uptime": 47283.751580351, "examples_seen": 25702400.0, "progress": 0.22290702734385406, "epoch": 20.061709363416323, "img/sec/core": 548.4114123570031, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 13.112575048906388, "core_hours": 13.112575048906388} {"step": 25150, "l2_params": 328.27466229706187, "train/loss": 3.415267586708069, "l2_grads": 1.3359375, "lr": 0.0009471692339068186, "uptime": 47378.41221617701, "examples_seen": 25753600.0, "progress": 0.22335106524692946, "epoch": 20.10167292788528, "img/sec/core": 540.8795277279911, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 13.138869669969164, "core_hours": 13.138869669969164} {"step": 25200, "l2_params": 328.2931563166905, "train/loss": 3.1775516867637634, "l2_grads": 1.609375, "lr": 0.0009468262443179307, "uptime": 47472.526950671, "examples_seen": 25804800.0, "progress": 0.2237951031500049, "epoch": 20.141636492354237, "img/sec/core": 544.0168351456814, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 13.165012651773054, "core_hours": 13.165012651773054} {"step": 25250, "l2_params": 328.39096958693915, "train/loss": 4.767263770103455, "l2_grads": 1.3984375, "lr": 0.0009464822074601006, "uptime": 47566.498625466, "examples_seen": 25856000.0, "progress": 0.2242391410530803, "epoch": 20.181600056823193, "img/sec/core": 544.8450302891048, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 13.191115894771665, "core_hours": 13.191115894771665} {"step": 25300, "l2_params": 328.4644018478258, "train/loss": 3.0375990867614746, "l2_grads": 1.5234375, "lr": 0.0009461371241396807, "uptime": 47660.986504235, "examples_seen": 25907200.0, "progress": 0.2246831789561557, "epoch": 20.22156362129215, "img/sec/core": 541.8684456359731, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 13.217362527763054, "core_hours": 13.217362527763054} {"step": 25350, "l2_params": 328.513404050162, "train/loss": 3.1018818020820618, "l2_grads": 1.578125, "lr": 0.000945790995165475, "uptime": 47754.319103959, "examples_seen": 25958400.0, "progress": 0.2251272168592311, "epoch": 20.261527185761107, "img/sec/core": 548.5757404316331, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 13.243288249908609, "core_hours": 13.243288249908609} {"step": 25400, "l2_params": 328.571542877746, "train/loss": 2.9297956228256226, "l2_grads": 1.5625, "lr": 0.0009454438213487387, "uptime": 47848.735399525, "examples_seen": 26009600.0, "progress": 0.22557125476230652, "epoch": 20.301490750230062, "img/sec/core": 542.2792717408603, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 13.269514998676943, "core_hours": 13.269514998676943} {"step": 25450, "l2_params": 328.6536426039958, "train/loss": 3.051647186279297, "l2_grads": 1.5703125, "lr": 0.0009450956035031757, "uptime": 47942.278810389995, "examples_seen": 26060800.0, "progress": 0.22601529266538192, "epoch": 20.34145431469902, "img/sec/core": 547.3394601132354, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 13.295499279472775, "core_hours": 13.295499279472775} {"step": 25500, "l2_params": 328.74518324655725, "train/loss": 2.9081966876983643, "l2_grads": 1.59375, "lr": 0.0009447463424449376, "uptime": 48036.616043236994, "examples_seen": 26112000.0, "progress": 0.22645933056845732, "epoch": 20.381417879167977, "img/sec/core": 542.7337484346028, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 13.32170406637472, "core_hours": 13.32170406637472} {"step": 25550, "l2_params": 328.80638032463344, "train/loss": 3.1525155305862427, "l2_grads": 1.4921875, "lr": 0.0009443960389926206, "uptime": 48130.192426327994, "examples_seen": 26163200.0, "progress": 0.22690336847153272, "epoch": 20.421381443636935, "img/sec/core": 547.1466016185905, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 13.34769750612222, "core_hours": 13.34769750612222} {"step": 25600, "l2_params": 328.8765411166856, "train/loss": 2.937541663646698, "l2_grads": 1.6328125, "lr": 0.0009440446939672631, "uptime": 48225.283261417004, "examples_seen": 26214400.0, "progress": 0.22734740637460812, "epoch": 20.46134500810589, "img/sec/core": 538.4325413913792, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 13.374111626980275, "core_hours": 13.374111626980275} {"step": 25650, "l2_params": 328.94388739523265, "train/loss": 4.284030318260193, "l2_grads": 1.3828125, "lr": 0.000943692308192347, "uptime": 48318.524949700004, "examples_seen": 26265600.0, "progress": 0.22779144427768355, "epoch": 20.501308572574846, "img/sec/core": 549.110606455361, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 13.400012095947776, "core_hours": 13.400012095947776} {"step": 25700, "l2_params": 329.0747504842175, "train/loss": 3.0474813580513, "l2_grads": 1.59375, "lr": 0.0009433388824937919, "uptime": 48411.82529838401, "examples_seen": 26316800.0, "progress": 0.22823548218075895, "epoch": 20.541272137043805, "img/sec/core": 548.7653660696218, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 13.42592885947111, "core_hours": 13.42592885947111} {"step": 25750, "l2_params": 329.1539966575296, "train/loss": 3.0828505754470825, "l2_grads": 1.6015625, "lr": 0.0009429844176999541, "uptime": 48507.146871068006, "examples_seen": 26368000.0, "progress": 0.22867952008383435, "epoch": 20.58123570151276, "img/sec/core": 537.1291991764905, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 13.452407074105555, "core_hours": 13.452407074105555} {"step": 25801, "l2_params": 329.1968609239576, "train/loss": 3.0738348960876465, "l2_grads": 1.6328125, "lr": 0.000942628914641627, "uptime": 48600.42799562799, "examples_seen": 26419200.0, "progress": 0.22912355798690975, "epoch": 20.62119926598172, "img/sec/core": 548.8784600476165, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 13.478318497594442, "core_hours": 13.478318497594442} {"step": 25850, "l2_params": 329.23367609733134, "train/loss": 4.672877073287964, "l2_grads": 1.3125, "lr": 0.0009422723741520368, "uptime": 48694.872375019, "examples_seen": 26470400.0, "progress": 0.22956759588998518, "epoch": 20.661162830450674, "img/sec/core": 542.1180204703356, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 13.504553047425276, "core_hours": 13.504553047425276} {"step": 25900, "l2_params": 329.270281028747, "train/loss": 2.8967264890670776, "l2_grads": 1.4140625, "lr": 0.0009419147970668408, "uptime": 48788.189404189994, "examples_seen": 26521600.0, "progress": 0.23001163379306058, "epoch": 20.701126394919633, "img/sec/core": 548.6672738603716, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 13.53047444441722, "core_hours": 13.53047444441722} {"step": 25950, "l2_params": 329.3433793526712, "train/loss": 5.438694357872009, "l2_grads": 1.1953125, "lr": 0.0009415561842241264, "uptime": 48882.725483402, "examples_seen": 26572800.0, "progress": 0.23045567169613598, "epoch": 20.74108995938859, "img/sec/core": 541.5921669988026, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 13.556734466420554, "core_hours": 13.556734466420554} {"step": 26000, "l2_params": 329.4104449026131, "train/loss": 2.947916090488434, "l2_grads": 1.53125, "lr": 0.0009411965364644084, "uptime": 48977.199470417996, "examples_seen": 26624000.0, "progress": 0.23089970959921138, "epoch": 20.781053523857544, "img/sec/core": 541.9481236811805, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 13.582977240591665, "core_hours": 13.582977240591665} {"step": 26050, "l2_params": 329.4713583554153, "train/loss": 3.1458851099014282, "l2_grads": 1.6328125, "lr": 0.000940835854630628, "uptime": 49070.670303127, "examples_seen": 26675200.0, "progress": 0.23134374750228678, "epoch": 20.821017088326503, "img/sec/core": 547.7644578111424, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 13.608941360788608, "core_hours": 13.608941360788608} {"step": 26100, "l2_params": 329.57475264061867, "train/loss": 3.597045421600342, "l2_grads": 1.6328125, "lr": 0.0009404741395681484, "uptime": 49164.949504863995, "examples_seen": 26726400.0, "progress": 0.2317877854053622, "epoch": 20.860980652795458, "img/sec/core": 543.0678140744787, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 13.635130027937775, "core_hours": 13.635130027937775} {"step": 26150, "l2_params": 329.65394971469703, "train/loss": 3.407767176628113, "l2_grads": 1.5390625, "lr": 0.0009401113921247558, "uptime": 49259.009689567, "examples_seen": 26777600.0, "progress": 0.2322318233084376, "epoch": 20.900944217264417, "img/sec/core": 544.3323353198178, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 13.661257857021944, "core_hours": 13.661257857021944} {"step": 26200, "l2_params": 329.660281755609, "train/loss": 5.199564337730408, "l2_grads": 1.1953125, "lr": 0.0009397476131506551, "uptime": 49352.663089562004, "examples_seen": 26828800.0, "progress": 0.232675861211513, "epoch": 20.940907781733372, "img/sec/core": 546.6966495902457, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 13.687272690353888, "core_hours": 13.687272690353888} {"step": 26250, "l2_params": 329.696815626683, "train/loss": 3.0965209007263184, "l2_grads": 1.5234375, "lr": 0.0009393828034984707, "uptime": 49446.396970423, "examples_seen": 26880000.0, "progress": 0.2331198991145884, "epoch": 20.98087134620233, "img/sec/core": 546.2272502717077, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 13.713309879481944, "core_hours": 13.713309879481944} {"step": 26300, "l2_params": 329.75748664738455, "train/loss": 5.554034113883972, "l2_grads": 1.2265625, "lr": 0.0009390169640232402, "uptime": 49541.222179047996, "examples_seen": 26931200.0, "progress": 0.23356393701766381, "epoch": 21.020834910671287, "img/sec/core": 539.9408104914177, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 13.739650215211109, "core_hours": 13.739650215211109} {"step": 26350, "l2_params": 329.7638300265055, "train/loss": 3.681181848049164, "l2_grads": 1.3984375, "lr": 0.0009386500955824175, "uptime": 49635.2588062, "examples_seen": 26982400.0, "progress": 0.23400797492073924, "epoch": 21.060798475140242, "img/sec/core": 544.4686985342311, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 13.76577150053111, "core_hours": 13.76577150053111} {"step": 26400, "l2_params": 329.86127973314404, "train/loss": 4.637747406959534, "l2_grads": 1.3828125, "lr": 0.000938282199035866, "uptime": 49730.003966747, "examples_seen": 27033600.0, "progress": 0.23445201282381464, "epoch": 21.1007620396092, "img/sec/core": 540.3969944681505, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 13.792089600683054, "core_hours": 13.792089600683054} {"step": 26450, "l2_params": 330.0190261442323, "train/loss": 3.4136067628860474, "l2_grads": 1.4453125, "lr": 0.0009379132752458597, "uptime": 49824.652747235, "examples_seen": 27084800.0, "progress": 0.23489605072689004, "epoch": 21.140725604078156, "img/sec/core": 540.9472761932783, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 13.818380928596387, "core_hours": 13.818380928596387} {"step": 26500, "l2_params": 330.067921809758, "train/loss": 2.977169930934906, "l2_grads": 1.5390625, "lr": 0.000937543325077081, "uptime": 49918.915996626994, "examples_seen": 27136000.0, "progress": 0.23534008862996544, "epoch": 21.180689168547115, "img/sec/core": 543.1597184506535, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 13.84456516453861, "core_hours": 13.84456516453861} {"step": 26550, "l2_params": 330.12863407929717, "train/loss": 5.2515764236450195, "l2_grads": 1.2421875, "lr": 0.0009371723493966155, "uptime": 50013.051273459, "examples_seen": 27187200.0, "progress": 0.23578412653304087, "epoch": 21.22065273301607, "img/sec/core": 543.8981189950207, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 13.870713852547498, "core_hours": 13.870713852547498} {"step": 26600, "l2_params": 330.2619876230839, "train/loss": 5.498393177986145, "l2_grads": 1.34375, "lr": 0.000936800349073955, "uptime": 50107.630881516, "examples_seen": 27238400.0, "progress": 0.23622816443611627, "epoch": 21.260616297485026, "img/sec/core": 541.3429073330852, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 13.896985965896665, "core_hours": 13.896985965896665} {"step": 26650, "l2_params": 330.28647455419286, "train/loss": 4.642292261123657, "l2_grads": 1.265625, "lr": 0.0009364273249809921, "uptime": 50202.02481246099, "examples_seen": 27289600.0, "progress": 0.23667220233919167, "epoch": 21.300579861953985, "img/sec/core": 542.407753204309, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 13.923206502270274, "core_hours": 13.923206502270274} {"step": 26700, "l2_params": 330.3020590237253, "train/loss": 2.912128984928131, "l2_grads": 1.5703125, "lr": 0.0009360532779920185, "uptime": 50295.808398630004, "examples_seen": 27340800.0, "progress": 0.23711624024226707, "epoch": 21.34054342642294, "img/sec/core": 545.9377497863486, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 13.94925749842833, "core_hours": 13.94925749842833} {"step": 26750, "l2_params": 330.3536501685542, "train/loss": 5.311055779457092, "l2_grads": 1.359375, "lr": 0.0009356782089837228, "uptime": 50391.019527701006, "examples_seen": 27392000.0, "progress": 0.23756027814534247, "epoch": 21.3805069908919, "img/sec/core": 537.7522617321199, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 13.975705034281388, "core_hours": 13.975705034281388} {"step": 26800, "l2_params": 330.4052258685537, "train/loss": 5.392000317573547, "l2_grads": 1.3203125, "lr": 0.000935302118835191, "uptime": 50486.704027026004, "examples_seen": 27443200.0, "progress": 0.2380043160484179, "epoch": 21.420470555360854, "img/sec/core": 535.091894310867, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 14.002284061871666, "core_hours": 14.002284061871666} {"step": 26850, "l2_params": 330.41176665923234, "train/loss": 3.1117276549339294, "l2_grads": 1.5703125, "lr": 0.0009349250084279001, "uptime": 50581.14169186501, "examples_seen": 27494400.0, "progress": 0.2384483539514933, "epoch": 21.460434119829813, "img/sec/core": 542.156565256943, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 14.028516746549165, "core_hours": 14.028516746549165} {"step": 26900, "l2_params": 330.4782800044316, "train/loss": 4.447545289993286, "l2_grads": 1.265625, "lr": 0.0009345468786457198, "uptime": 50676.695197855996, "examples_seen": 27545600.0, "progress": 0.2388923918545687, "epoch": 21.50039768429877, "img/sec/core": 535.8254463716326, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 14.05505938710222, "core_hours": 14.05505938710222} {"step": 26950, "l2_params": 330.61171996013695, "train/loss": 4.9872413873672485, "l2_grads": 1.2265625, "lr": 0.0009341677303749086, "uptime": 50771.053616777004, "examples_seen": 27596800.0, "progress": 0.2393364297576441, "epoch": 21.540361248767724, "img/sec/core": 542.6118897018141, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 14.081270059024721, "core_hours": 14.081270059024721} {"step": 27000, "l2_params": 330.6843637632418, "train/loss": 2.833685040473938, "l2_grads": 1.515625, "lr": 0.0009337875645041122, "uptime": 50865.04851988499, "examples_seen": 27648000.0, "progress": 0.23978046766071953, "epoch": 21.580324813236683, "img/sec/core": 544.7103864895047, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 14.107379754332497, "core_hours": 14.107379754332497} {"step": 27050, "l2_params": 330.7389453934931, "train/loss": 2.937008798122406, "l2_grads": 1.5546875, "lr": 0.0009334063819243609, "uptime": 50960.007068609004, "examples_seen": 27699200.0, "progress": 0.24022450556379493, "epoch": 21.620288377705638, "img/sec/core": 539.1826295577913, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 14.133757128978054, "core_hours": 14.133757128978054} {"step": 27100, "l2_params": 330.77540441221214, "train/loss": 3.125913679599762, "l2_grads": 1.453125, "lr": 0.0009330241835290697, "uptime": 51053.423822896, "examples_seen": 27750400.0, "progress": 0.24066854346687033, "epoch": 21.660251942174597, "img/sec/core": 548.0815555066449, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 14.159706227391109, "core_hours": 14.159706227391109} {"step": 27150, "l2_params": 330.78763279151246, "train/loss": 5.406050205230713, "l2_grads": 1.2109375, "lr": 0.0009326409702140319, "uptime": 51148.27006651201, "examples_seen": 27801600.0, "progress": 0.24111258136994573, "epoch": 21.700215506643552, "img/sec/core": 539.8210624691573, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 14.186052406173332, "core_hours": 14.186052406173332} {"step": 27200, "l2_params": 330.9149366717979, "train/loss": 5.327722549438477, "l2_grads": 1.1640625, "lr": 0.000932256742877421, "uptime": 51243.152674939, "examples_seen": 27852800.0, "progress": 0.24155661927302113, "epoch": 21.74017907111251, "img/sec/core": 539.6141700656722, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 14.212408686291942, "core_hours": 14.212408686291942} {"step": 27250, "l2_params": 330.91518456396045, "train/loss": 5.100048661231995, "l2_grads": 1.34375, "lr": 0.000931871502419787, "uptime": 51337.509689030005, "examples_seen": 27904000.0, "progress": 0.24200065717609656, "epoch": 21.780142635581466, "img/sec/core": 542.6199683536063, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 14.238618967983887, "core_hours": 14.238618967983887} {"step": 27300, "l2_params": 331.02728951893073, "train/loss": 3.9145056009292603, "l2_grads": 1.40625, "lr": 0.0009314852497440542, "uptime": 51431.408379924, "examples_seen": 27955200.0, "progress": 0.24244469507917196, "epoch": 21.82010620005042, "img/sec/core": 545.2685177240561, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 14.264701937676666, "core_hours": 14.264701937676666} {"step": 27350, "l2_params": 331.0517139431353, "train/loss": 3.358723819255829, "l2_grads": 1.515625, "lr": 0.0009310979857555206, "uptime": 51525.453451356996, "examples_seen": 28006400.0, "progress": 0.24288873298224736, "epoch": 21.86006976451938, "img/sec/core": 544.4198108401262, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 14.290825568630277, "core_hours": 14.290825568630277} {"step": 27400, "l2_params": 331.1002742396365, "train/loss": 3.7318462133407593, "l2_grads": 1.4765625, "lr": 0.000930709711361852, "uptime": 51620.868377909006, "examples_seen": 28057600.0, "progress": 0.24333277088532276, "epoch": 21.900033328988336, "img/sec/core": 536.6036725091975, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 14.317329714894722, "core_hours": 14.317329714894722} {"step": 27450, "l2_params": 331.173136719111, "train/loss": 2.948315978050232, "l2_grads": 1.546875, "lr": 0.000930320427473085, "uptime": 51715.273874927996, "examples_seen": 28108800.0, "progress": 0.24377680878839816, "epoch": 21.939996893457295, "img/sec/core": 542.3413002073067, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 14.343553464066666, "core_hours": 14.343553464066666} {"step": 27500, "l2_params": 331.2036420981244, "train/loss": 4.2180140018463135, "l2_grads": 1.328125, "lr": 0.0009299301350016202, "uptime": 51809.110848511, "examples_seen": 28160000.0, "progress": 0.2442208466914736, "epoch": 21.97996045792625, "img/sec/core": 545.6271450902437, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 14.36961929006194, "core_hours": 14.36961929006194, "val/acc@1": 0.5446229272959183, "val/loss": 1.9976830962969332, "z/secs/eval/val": 31.767556471000717} {"step": 27550, "l2_params": 331.2578463103742, "train/loss": 3.256359338760376, "l2_grads": 1.421875, "lr": 0.0009295388348622241, "uptime": 51933.874299064, "examples_seen": 28211200.0, "progress": 0.244664884594549, "epoch": 22.019924022395205, "img/sec/core": 410.37659485259155, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 14.404275804104442, "core_hours": 14.404275804104442} {"step": 27600, "l2_params": 331.31246610309205, "train/loss": 2.8400657176971436, "l2_grads": 1.6328125, "lr": 0.0009291465279720226, "uptime": 52028.437957568996, "examples_seen": 28262400.0, "progress": 0.2451089224976244, "epoch": 22.059887586864164, "img/sec/core": 541.4342127773325, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 14.430543487022499, "core_hours": 14.430543487022499} {"step": 27650, "l2_params": 331.354915578636, "train/loss": 2.8800345063209534, "l2_grads": 1.640625, "lr": 0.0009287532152505033, "uptime": 52122.540020884, "examples_seen": 28313600.0, "progress": 0.2455529604006998, "epoch": 22.09985115133312, "img/sec/core": 544.0900889560045, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 14.456682949054443, "core_hours": 14.456682949054443} {"step": 27700, "l2_params": 331.3670636309152, "train/loss": 3.5407009720802307, "l2_grads": 1.3515625, "lr": 0.0009283588976195102, "uptime": 52216.731047384994, "examples_seen": 28364800.0, "progress": 0.24599699830377522, "epoch": 22.13981471580208, "img/sec/core": 543.5761972448178, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 14.482847123082498, "core_hours": 14.482847123082498} {"step": 27750, "l2_params": 331.4519475801696, "train/loss": 3.4517678022384644, "l2_grads": 1.3984375, "lr": 0.000927963576003242, "uptime": 52312.49393045899, "examples_seen": 28416000.0, "progress": 0.24644103620685062, "epoch": 22.179778280271034, "img/sec/core": 534.6539113743668, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 14.509447923936387, "core_hours": 14.509447923936387} {"step": 27800, "l2_params": 331.530354532677, "train/loss": 5.463787913322449, "l2_grads": 1.1953125, "lr": 0.0009275672513282529, "uptime": 52406.421975209, "examples_seen": 28467200.0, "progress": 0.24688507410992602, "epoch": 22.219741844739993, "img/sec/core": 545.098113521593, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 14.535539047478055, "core_hours": 14.535539047478055} {"step": 27850, "l2_params": 331.6029016383904, "train/loss": 2.8477694392204285, "l2_grads": 1.5859375, "lr": 0.0009271699245234455, "uptime": 52501.075471567994, "examples_seen": 28518400.0, "progress": 0.24732911201300142, "epoch": 22.259705409208948, "img/sec/core": 540.9203248637795, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 14.561831685355553, "core_hours": 14.561831685355553} {"step": 27900, "l2_params": 331.65735124192935, "train/loss": 2.8616190552711487, "l2_grads": 1.640625, "lr": 0.0009267715965200722, "uptime": 52595.55537350899, "examples_seen": 28569600.0, "progress": 0.24777314991607682, "epoch": 22.299668973677903, "img/sec/core": 541.9141949572917, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 14.588076102561386, "core_hours": 14.588076102561386} {"step": 27950, "l2_params": 331.73600402607417, "train/loss": 4.8251789808273315, "l2_grads": 1.2421875, "lr": 0.000926372268251733, "uptime": 52690.253347592006, "examples_seen": 28620800.0, "progress": 0.24821718781915225, "epoch": 22.339632538146862, "img/sec/core": 540.6662655224404, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 14.614381095362223, "core_hours": 14.614381095362223} {"step": 28000, "l2_params": 331.79663034191594, "train/loss": 5.409395337104797, "l2_grads": 1.546875, "lr": 0.0009259719406543708, "uptime": 52784.28821219799, "examples_seen": 28672000.0, "progress": 0.24866122572222765, "epoch": 22.379596102615817, "img/sec/core": 544.478903803691, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 14.640501891086108, "core_hours": 14.640501891086108} {"step": 28050, "l2_params": 331.79669803680235, "train/loss": 2.93552166223526, "l2_grads": 1.6796875, "lr": 0.0009255706146662708, "uptime": 52878.89351735001, "examples_seen": 28723200.0, "progress": 0.24910526362530305, "epoch": 22.419559667084776, "img/sec/core": 541.1958654721809, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 14.666781142517221, "core_hours": 14.666781142517221} {"step": 28100, "l2_params": 331.80311132884214, "train/loss": 2.780928671360016, "l2_grads": 1.5859375, "lr": 0.0009251682912280589, "uptime": 52973.11355257699, "examples_seen": 28774400.0, "progress": 0.24954930152837845, "epoch": 22.45952323155373, "img/sec/core": 543.4088394962873, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 14.692953374524718, "core_hours": 14.692953374524718} {"step": 28150, "l2_params": 331.88749240847795, "train/loss": 2.851654529571533, "l2_grads": 1.6171875, "lr": 0.0009247649712826991, "uptime": 53066.923573686, "examples_seen": 28825600.0, "progress": 0.24999333943145388, "epoch": 22.499486796022687, "img/sec/core": 545.7839087415441, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 14.719011713721667, "core_hours": 14.719011713721667} {"step": 28200, "l2_params": 331.97194617448474, "train/loss": 3.25130158662796, "l2_grads": 1.5, "lr": 0.0009243606557754892, "uptime": 53161.595940436004, "examples_seen": 28876800.0, "progress": 0.25043737733452925, "epoch": 22.539450360491646, "img/sec/core": 540.8125069399034, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 14.745309593374442, "core_hours": 14.745309593374442} {"step": 28250, "l2_params": 332.068593488228, "train/loss": 4.66940712928772, "l2_grads": 1.3046875, "lr": 0.0009239553456540635, "uptime": 53256.552396129, "examples_seen": 28928000.0, "progress": 0.25088141523760465, "epoch": 22.5794139249606, "img/sec/core": 539.1945142259071, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 14.771686386622497, "core_hours": 14.771686386622497} {"step": 28300, "l2_params": 332.0686420121787, "train/loss": 3.3180335760116577, "l2_grads": 1.4765625, "lr": 0.0009235490418683851, "uptime": 53349.704982147, "examples_seen": 28979200.0, "progress": 0.2513254531406801, "epoch": 22.61937748942956, "img/sec/core": 549.6358414580576, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 14.797562104960832, "core_hours": 14.797562104960832} {"step": 28350, "l2_params": 332.0746427527627, "train/loss": 2.9313390254974365, "l2_grads": 1.796875, "lr": 0.0009231417453707457, "uptime": 53444.076761249, "examples_seen": 29030400.0, "progress": 0.2517694910437555, "epoch": 22.659341053898515, "img/sec/core": 542.5350723192782, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 14.82377648804472, "core_hours": 14.82377648804472} {"step": 28400, "l2_params": 332.1111756743704, "train/loss": 4.366518974304199, "l2_grads": 1.40625, "lr": 0.0009227334571157655, "uptime": 53538.73953305899, "examples_seen": 29081600.0, "progress": 0.2522135289468309, "epoch": 22.699304618367474, "img/sec/core": 540.8673232468341, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 14.850071702436386, "core_hours": 14.850071702436386} {"step": 28450, "l2_params": 332.1475325791801, "train/loss": 3.209397315979004, "l2_grads": 1.6328125, "lr": 0.0009223241780603879, "uptime": 53632.634620649, "examples_seen": 29132800.0, "progress": 0.2526575668499063, "epoch": 22.73926818283643, "img/sec/core": 545.2894428680464, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 14.876153671211389, "core_hours": 14.876153671211389} {"step": 28500, "l2_params": 332.2199125767449, "train/loss": 4.907149314880371, "l2_grads": 1.40625, "lr": 0.0009219139091638795, "uptime": 53726.63582521099, "examples_seen": 29184000.0, "progress": 0.2531016047529817, "epoch": 22.779231747305385, "img/sec/core": 544.6738713463282, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 14.902265116923052, "core_hours": 14.902265116923052} {"step": 28550, "l2_params": 332.2920490462795, "train/loss": 3.3113178610801697, "l2_grads": 1.4609375, "lr": 0.0009215026513878257, "uptime": 53820.594449353, "examples_seen": 29235200.0, "progress": 0.2535456426560571, "epoch": 22.819195311774344, "img/sec/core": 544.9207081046565, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 14.928364734740276, "core_hours": 14.928364734740276} {"step": 28600, "l2_params": 332.358734088635, "train/loss": 2.916654050350189, "l2_grads": 1.5, "lr": 0.0009210904056961307, "uptime": 53915.555021324006, "examples_seen": 29286400.0, "progress": 0.2539896805591325, "epoch": 22.8591588762433, "img/sec/core": 539.1711416358685, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 14.954742671398888, "core_hours": 14.954742671398888} {"step": 28650, "l2_params": 332.3772124080184, "train/loss": 2.9733678102493286, "l2_grads": 1.5234375, "lr": 0.0009206771730550133, "uptime": 54010.11410149399, "examples_seen": 29337600.0, "progress": 0.2544337184622079, "epoch": 22.899122440712258, "img/sec/core": 541.4604277871007, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 14.98100908255722, "core_hours": 14.98100908255722} {"step": 28700, "l2_params": 332.3953635873626, "train/loss": 4.7747578620910645, "l2_grads": 1.328125, "lr": 0.0009202629544330066, "uptime": 54104.570774647, "examples_seen": 29388800.0, "progress": 0.2548777563652833, "epoch": 22.939086005181213, "img/sec/core": 542.0474625129666, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 15.007247047321943, "core_hours": 15.007247047321943} {"step": 28750, "l2_params": 332.4072958759517, "train/loss": 2.815446972846985, "l2_grads": 1.6640625, "lr": 0.0009198477508009541, "uptime": 54199.558115302, "examples_seen": 29440000.0, "progress": 0.25532179426835877, "epoch": 22.979049569650172, "img/sec/core": 539.0191961048778, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 15.033632419726109, "core_hours": 15.033632419726109} {"step": 28800, "l2_params": 332.47962666671395, "train/loss": 2.8121220469474792, "l2_grads": 1.578125, "lr": 0.0009194315631320064, "uptime": 54293.986817198995, "examples_seen": 29491200.0, "progress": 0.25576583217143417, "epoch": 23.019013134119128, "img/sec/core": 542.2080254354019, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 15.059862614697497, "core_hours": 15.059862614697497} {"step": 28850, "l2_params": 332.54318034937205, "train/loss": 5.225890040397644, "l2_grads": 1.4609375, "lr": 0.0009190143924016231, "uptime": 54387.909107693995, "examples_seen": 29542400.0, "progress": 0.25620987007450957, "epoch": 23.058976698588083, "img/sec/core": 545.1315095720067, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 15.085952139834998, "core_hours": 15.085952139834998} {"step": 28900, "l2_params": 332.57942983359254, "train/loss": 2.8779857754707336, "l2_grads": 1.6015625, "lr": 0.0009185962395875661, "uptime": 54482.484028333, "examples_seen": 29593600.0, "progress": 0.25665390797758497, "epoch": 23.09894026305704, "img/sec/core": 541.3697379185012, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 15.11222295112361, "core_hours": 15.11222295112361} {"step": 28950, "l2_params": 332.60946711900357, "train/loss": 5.125243067741394, "l2_grads": 1.25, "lr": 0.0009181771056699002, "uptime": 54576.964049179005, "examples_seen": 29644800.0, "progress": 0.2570979458806604, "epoch": 23.138903827525997, "img/sec/core": 541.9135129474053, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 15.13846740135861, "core_hours": 15.13846740135861} {"step": 29000, "l2_params": 332.712057906777, "train/loss": 2.839268684387207, "l2_grads": 1.609375, "lr": 0.0009177569916309891, "uptime": 54672.362568265, "examples_seen": 29696000.0, "progress": 0.2575419837837358, "epoch": 23.178867391994956, "img/sec/core": 536.6959622700845, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 15.164966989993609, "core_hours": 15.164966989993609} {"step": 29050, "l2_params": 332.7211978636355, "train/loss": 3.631060302257538, "l2_grads": 1.4609375, "lr": 0.0009173358984554937, "uptime": 54765.774771376, "examples_seen": 29747200.0, "progress": 0.2579860216868112, "epoch": 23.21883095646391, "img/sec/core": 548.1082588230893, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 15.19091482419111, "core_hours": 15.19091482419111} {"step": 29100, "l2_params": 332.7394197932896, "train/loss": 2.7771106958389282, "l2_grads": 1.6171875, "lr": 0.0009169138271303703, "uptime": 54860.309019759006, "examples_seen": 29798400.0, "progress": 0.2584300595898866, "epoch": 23.258794520932867, "img/sec/core": 541.6026559238586, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 15.217174337630833, "core_hours": 15.217174337630833} {"step": 29150, "l2_params": 332.8325111354809, "train/loss": 2.896610200405121, "l2_grads": 1.640625, "lr": 0.0009164907786448665, "uptime": 54954.676150939005, "examples_seen": 29849600.0, "progress": 0.258874097492962, "epoch": 23.298758085401825, "img/sec/core": 542.5617941308338, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 15.243387429625276, "core_hours": 15.243387429625276} {"step": 29200, "l2_params": 332.90481407509714, "train/loss": 2.8826907873153687, "l2_grads": 1.6015625, "lr": 0.0009160667539905218, "uptime": 55049.630905161, "examples_seen": 29900800.0, "progress": 0.25931813539603743, "epoch": 23.33872164987078, "img/sec/core": 539.2041759204519, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 15.269763750242499, "core_hours": 15.269763750242499} {"step": 29250, "l2_params": 332.9861958709775, "train/loss": 2.713820219039917, "l2_grads": 1.609375, "lr": 0.0009156417541611634, "uptime": 55144.223588370005, "examples_seen": 29952000.0, "progress": 0.25976217329911283, "epoch": 23.37868521433974, "img/sec/core": 541.268079761228, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 15.296039495578333, "core_hours": 15.296039495578333} {"step": 29300, "l2_params": 333.0586179169517, "train/loss": 2.9780408143997192, "l2_grads": 1.5625, "lr": 0.0009152157801529028, "uptime": 55238.732182258, "examples_seen": 30003200.0, "progress": 0.26020621120218823, "epoch": 23.418648778808695, "img/sec/core": 541.7496747510165, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 15.322291882769443, "core_hours": 15.322291882769443} {"step": 29350, "l2_params": 333.05874106529615, "train/loss": 2.840332806110382, "l2_grads": 1.703125, "lr": 0.0009147888329641353, "uptime": 55333.629363739994, "examples_seen": 30054400.0, "progress": 0.26065024910526363, "epoch": 23.458612343277654, "img/sec/core": 539.5313032528123, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 15.348652210958885, "core_hours": 15.348652210958885} {"step": 29400, "l2_params": 333.13096265770616, "train/loss": 4.2575448751449585, "l2_grads": 1.3046875, "lr": 0.0009143609135955377, "uptime": 55428.449911431, "examples_seen": 30105600.0, "progress": 0.26109428700833903, "epoch": 23.49857590774661, "img/sec/core": 539.9673514526571, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 15.374991251984165, "core_hours": 15.374991251984165} {"step": 29450, "l2_params": 333.1308805766136, "train/loss": 2.9204058051109314, "l2_grads": 1.7890625, "lr": 0.0009139320230500652, "uptime": 55523.04274258501, "examples_seen": 30156800.0, "progress": 0.26153832491141443, "epoch": 23.538539472215565, "img/sec/core": 541.2672332075812, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 15.401267038415831, "core_hours": 15.401267038415831} {"step": 29500, "l2_params": 333.14312509321724, "train/loss": 2.9001948833465576, "l2_grads": 1.6484375, "lr": 0.0009135021623329497, "uptime": 55617.588759802005, "examples_seen": 30208000.0, "progress": 0.26198236281448983, "epoch": 23.578503036684523, "img/sec/core": 541.5352386815781, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 15.42752982097611, "core_hours": 15.42752982097611} {"step": 29550, "l2_params": 333.23659598887093, "train/loss": 3.5593379735946655, "l2_grads": 1.390625, "lr": 0.0009130713324516961, "uptime": 55711.318884287, "examples_seen": 30259200.0, "progress": 0.26242640071756523, "epoch": 23.61846660115348, "img/sec/core": 546.2491411520151, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 15.453565966666387, "core_hours": 15.453565966666387} {"step": 29600, "l2_params": 333.29365600444976, "train/loss": 2.8961108326911926, "l2_grads": 1.5625, "lr": 0.0009126395344160805, "uptime": 55805.15654398099, "examples_seen": 30310400.0, "progress": 0.26287043862064063, "epoch": 23.658430165622438, "img/sec/core": 545.6231556388003, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 15.479631983248053, "core_hours": 15.479631983248053} {"step": 29650, "l2_params": 333.3568977673366, "train/loss": 3.5303152203559875, "l2_grads": 1.5859375, "lr": 0.0009122067692381491, "uptime": 55899.85876105999, "examples_seen": 30361600.0, "progress": 0.2633144765237161, "epoch": 23.698393730091393, "img/sec/core": 540.6420417516623, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 15.505938154658885, "core_hours": 15.505938154658885} {"step": 29700, "l2_params": 333.3990854746193, "train/loss": 2.8325895071029663, "l2_grads": 1.640625, "lr": 0.0009117730379322153, "uptime": 55993.442528237996, "examples_seen": 30412800.0, "progress": 0.2637585144267915, "epoch": 23.738357294560352, "img/sec/core": 547.1034298353698, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 15.531933645541665, "core_hours": 15.531933645541665} {"step": 29750, "l2_params": 333.40814362335993, "train/loss": 5.097580075263977, "l2_grads": 1.359375, "lr": 0.0009113383415148558, "uptime": 56088.370301888994, "examples_seen": 30464000.0, "progress": 0.2642025523298669, "epoch": 23.778320859029307, "img/sec/core": 539.3574296626514, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 15.55830247155583, "core_hours": 15.55830247155583} {"step": 29800, "l2_params": 333.4141451520916, "train/loss": 3.2382481694221497, "l2_grads": 1.53125, "lr": 0.0009109026810049097, "uptime": 56183.905740129994, "examples_seen": 30515200.0, "progress": 0.2646465902329423, "epoch": 23.818284423498262, "img/sec/core": 535.9267821731383, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 15.584840093289442, "core_hours": 15.584840093289442} {"step": 29850, "l2_params": 333.51028961825153, "train/loss": 2.905417323112488, "l2_grads": 1.5078125, "lr": 0.000910466057423475, "uptime": 56278.1164903, "examples_seen": 30566400.0, "progress": 0.2650906281360177, "epoch": 23.85824798796722, "img/sec/core": 543.4623958264931, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 15.611009746114442, "core_hours": 15.611009746114442} {"step": 29900, "l2_params": 333.5735664268828, "train/loss": 3.1088554859161377, "l2_grads": 1.5625, "lr": 0.0009100284717939087, "uptime": 56373.691329821, "examples_seen": 30617600.0, "progress": 0.2655346660390931, "epoch": 23.898211552436177, "img/sec/core": 535.7058432596015, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 15.637558312648054, "core_hours": 15.637558312648054} {"step": 29950, "l2_params": 333.5796147473643, "train/loss": 2.9559887647628784, "l2_grads": 1.6796875, "lr": 0.0009095899251418212, "uptime": 56467.511704895005, "examples_seen": 30668800.0, "progress": 0.2659787039421685, "epoch": 23.938175116905136, "img/sec/core": 545.7236763295472, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 15.663619527946388, "core_hours": 15.663619527946388} {"step": 30000, "l2_params": 333.62783783684404, "train/loss": 4.156064391136169, "l2_grads": 1.390625, "lr": 0.0009091504184950754, "uptime": 56562.401066720995, "examples_seen": 30720000.0, "progress": 0.2664227418452439, "epoch": 23.97813868137409, "img/sec/core": 539.5757650250373, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 15.689977684009165, "core_hours": 15.689977684009165, "val/acc@1": 0.5635762117346939, "val/loss": 1.8838995226791926, "z/secs/eval/val": 31.671478449999995} {"step": 30050, "l2_params": 333.687870211913, "train/loss": 4.739919900894165, "l2_grads": 1.46875, "lr": 0.0009087099528837858, "uptime": 56687.18019042, "examples_seen": 30771200.0, "progress": 0.2668667797483193, "epoch": 24.018102245843046, "img/sec/core": 410.3250486315902, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 15.72463855170333, "core_hours": 15.72463855170333} {"step": 30100, "l2_params": 333.6998879747714, "train/loss": 2.8319886326789856, "l2_grads": 1.6171875, "lr": 0.0009082685293403128, "uptime": 56782.080393771, "examples_seen": 30822400.0, "progress": 0.26731081765139475, "epoch": 24.058065810312005, "img/sec/core": 539.5141231745545, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 15.75099971930083, "core_hours": 15.75099971930083} {"step": 30150, "l2_params": 333.7718698944123, "train/loss": 5.001183748245239, "l2_grads": 1.5, "lr": 0.000907826148899262, "uptime": 56875.625971573, "examples_seen": 30873600.0, "progress": 0.26775485555447015, "epoch": 24.09802937478096, "img/sec/core": 547.3267812655821, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 15.77698460202361, "core_hours": 15.77698460202361} {"step": 30200, "l2_params": 333.7960891046546, "train/loss": 5.281230449676514, "l2_grads": 1.34375, "lr": 0.0009073828125974818, "uptime": 56970.482730145, "examples_seen": 30924800.0, "progress": 0.26819889345754555, "epoch": 24.13799293924992, "img/sec/core": 539.7612228245875, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 15.803333701626944, "core_hours": 15.803333701626944} {"step": 30250, "l2_params": 333.77215077476507, "train/loss": 2.7661863565444946, "l2_grads": 1.609375, "lr": 0.0009069385214740631, "uptime": 57065.159550148994, "examples_seen": 30976000.0, "progress": 0.26864293136062095, "epoch": 24.177956503718875, "img/sec/core": 540.7870690823742, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 15.829632818294721, "core_hours": 15.829632818294721} {"step": 30300, "l2_params": 333.86838227015073, "train/loss": 2.9299726486206055, "l2_grads": 1.578125, "lr": 0.0009064932765703317, "uptime": 57160.266291338005, "examples_seen": 31027200.0, "progress": 0.26908696926369635, "epoch": 24.217920068187833, "img/sec/core": 538.3424913934479, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 15.856051357513886, "core_hours": 15.856051357513886} {"step": 30350, "l2_params": 333.89251258591815, "train/loss": 2.918467879295349, "l2_grads": 1.796875, "lr": 0.0009060470789298505, "uptime": 57254.704644722995, "examples_seen": 31078400.0, "progress": 0.26953100716677175, "epoch": 24.25788363265679, "img/sec/core": 542.1526124166149, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 15.882284233454165, "core_hours": 15.882284233454165} {"step": 30400, "l2_params": 333.9285921982423, "train/loss": 3.3357405066490173, "l2_grads": 1.4453125, "lr": 0.0009055999295984157, "uptime": 57350.353879199, "examples_seen": 31129600.0, "progress": 0.26997504506984715, "epoch": 24.297847197125744, "img/sec/core": 535.2891769650759, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 15.908853465253054, "core_hours": 15.908853465253054} {"step": 30450, "l2_params": 333.982533986154, "train/loss": 3.4732001423835754, "l2_grads": 1.578125, "lr": 0.0009051518296240534, "uptime": 57445.512495817005, "examples_seen": 31180800.0, "progress": 0.27041908297292255, "epoch": 24.337810761594703, "img/sec/core": 538.0490156297192, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 15.93528641431361, "core_hours": 15.93528641431361} {"step": 30500, "l2_params": 334.06048292188046, "train/loss": 2.797013521194458, "l2_grads": 1.546875, "lr": 0.000904702780057017, "uptime": 57540.799580716994, "examples_seen": 31232000.0, "progress": 0.27086312087599795, "epoch": 24.37777432606366, "img/sec/core": 537.3236053315595, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 15.961755049008053, "core_hours": 15.961755049008053} {"step": 30550, "l2_params": 334.1086380673957, "train/loss": 3.656630039215088, "l2_grads": 1.421875, "lr": 0.0009042527819497874, "uptime": 57635.502750709, "examples_seen": 31283200.0, "progress": 0.27130715877907335, "epoch": 24.417737890532617, "img/sec/core": 540.6366017560206, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 15.988061485116942, "core_hours": 15.988061485116942} {"step": 30600, "l2_params": 334.1087535214956, "train/loss": 2.8373261094093323, "l2_grads": 1.703125, "lr": 0.0009038018363570673, "uptime": 57729.897541647995, "examples_seen": 31334400.0, "progress": 0.2717511966821488, "epoch": 24.457701455001573, "img/sec/core": 542.4028115395489, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 16.014282260377776, "core_hours": 16.014282260377776} {"step": 30650, "l2_params": 334.16234914474956, "train/loss": 2.8284703493118286, "l2_grads": 1.6484375, "lr": 0.0009033499443357809, "uptime": 57824.51603208399, "examples_seen": 31385600.0, "progress": 0.2721952345852242, "epoch": 24.497665019470528, "img/sec/core": 541.1204486995363, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 16.040565174387776, "core_hours": 16.040565174387776} {"step": 30700, "l2_params": 334.23469164879117, "train/loss": 2.8657193183898926, "l2_grads": 1.59375, "lr": 0.0009028971069450698, "uptime": 57919.391614349006, "examples_seen": 31436800.0, "progress": 0.2726392724882996, "epoch": 24.537628583939487, "img/sec/core": 539.6541320504225, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 16.066919502794722, "core_hours": 16.066919502794722} {"step": 30750, "l2_params": 334.3004239265933, "train/loss": 2.792861223220825, "l2_grads": 1.828125, "lr": 0.0009024433252462924, "uptime": 58013.399027823005, "examples_seen": 31488000.0, "progress": 0.273083310391375, "epoch": 24.577592148408442, "img/sec/core": 544.6378972458506, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 16.093032673204167, "core_hours": 16.093032673204167} {"step": 30800, "l2_params": 334.32450115166927, "train/loss": 2.831694483757019, "l2_grads": 1.6796875, "lr": 0.0009019886003030189, "uptime": 58107.39747064799, "examples_seen": 31539200.0, "progress": 0.2735273482944504, "epoch": 24.6175557128774, "img/sec/core": 544.6898742282701, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 16.119143351766663, "core_hours": 16.119143351766663} {"step": 30850, "l2_params": 334.3547336148017, "train/loss": 2.6220422983169556, "l2_grads": 1.6953125, "lr": 0.0009015329331810322, "uptime": 58202.445019770996, "examples_seen": 31590400.0, "progress": 0.2739713861975258, "epoch": 24.657519277346356, "img/sec/core": 538.6777510037759, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 16.145545448745274, "core_hours": 16.145545448745274} {"step": 30900, "l2_params": 334.37281833400425, "train/loss": 2.9132912158966064, "l2_grads": 1.609375, "lr": 0.0009010763249483218, "uptime": 58296.728024127995, "examples_seen": 31641600.0, "progress": 0.2744154241006012, "epoch": 24.697482841815315, "img/sec/core": 543.0459110756907, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 16.171735172177776, "core_hours": 16.171735172177776} {"step": 30950, "l2_params": 334.4325446979181, "train/loss": 2.7289111018180847, "l2_grads": 1.6328125, "lr": 0.0009006187766750842, "uptime": 58391.447782510004, "examples_seen": 31692800.0, "progress": 0.2748594620036766, "epoch": 24.73744640628427, "img/sec/core": 540.5419193903781, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 16.198046216172777, "core_hours": 16.198046216172777} {"step": 31001, "l2_params": 334.43881108414286, "train/loss": 3.0891324281692505, "l2_grads": 1.578125, "lr": 0.0009001602894337176, "uptime": 58487.001314103996, "examples_seen": 31744000.0, "progress": 0.275303499906752, "epoch": 24.777409970753226, "img/sec/core": 535.8253028003744, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 16.224588863837777, "core_hours": 16.224588863837777} {"step": 31050, "l2_params": 334.51076828939676, "train/loss": 4.362314462661743, "l2_grads": 1.2890625, "lr": 0.000899700864298823, "uptime": 58581.567309355, "examples_seen": 31795200.0, "progress": 0.27574753780982747, "epoch": 24.817373535222185, "img/sec/core": 541.4208338219426, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 16.250857195851943, "core_hours": 16.250857195851943} {"step": 31100, "l2_params": 334.54661921724374, "train/loss": 3.3159183859825134, "l2_grads": 1.4296875, "lr": 0.0008992405023471972, "uptime": 58675.55518959199, "examples_seen": 31846400.0, "progress": 0.27619157571290287, "epoch": 24.85733709969114, "img/sec/core": 544.7510878093831, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 16.27696494036222, "core_hours": 16.27696494036222} {"step": 31150, "l2_params": 334.58262683481865, "train/loss": 2.952472448348999, "l2_grads": 1.671875, "lr": 0.000898779204657835, "uptime": 58770.042265044, "examples_seen": 31897600.0, "progress": 0.27663561361597827, "epoch": 24.8973006641601, "img/sec/core": 541.8730525320263, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 16.30321135021, "core_hours": 16.30321135021} {"step": 31200, "l2_params": 334.58265602230114, "train/loss": 2.8867727518081665, "l2_grads": 1.6484375, "lr": 0.0008983169723119233, "uptime": 58864.530035802, "examples_seen": 31948800.0, "progress": 0.27707965151905367, "epoch": 24.937264228629054, "img/sec/core": 541.8690650574389, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 16.329457953198332, "core_hours": 16.329457953198332} {"step": 31250, "l2_params": 334.58276547533796, "train/loss": 5.149297475814819, "l2_grads": 1.4453125, "lr": 0.00089785380639284, "uptime": 58959.28620335, "examples_seen": 32000000.0, "progress": 0.27752368942212907, "epoch": 24.977227793098013, "img/sec/core": 540.3342212427747, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 16.355779110850555, "core_hours": 16.355779110850555} {"step": 31300, "l2_params": 334.62489056077777, "train/loss": 2.8001259565353394, "l2_grads": 1.6015625, "lr": 0.0008973897079861508, "uptime": 59053.883493406, "examples_seen": 32051200.0, "progress": 0.27796772732520447, "epoch": 25.01719135756697, "img/sec/core": 541.2417202405054, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 16.38205613586611, "core_hours": 16.38205613586611} {"step": 31350, "l2_params": 334.6488350098316, "train/loss": 2.806091070175171, "l2_grads": 1.7578125, "lr": 0.0008969246781796072, "uptime": 59148.321473332995, "examples_seen": 32102400.0, "progress": 0.2784117652282799, "epoch": 25.057154922035924, "img/sec/core": 542.1547563764044, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 16.408288908068055, "core_hours": 16.408288908068055} {"step": 31400, "l2_params": 334.7027993118484, "train/loss": 4.416810750961304, "l2_grads": 1.34375, "lr": 0.0008964587180631436, "uptime": 59242.812364219004, "examples_seen": 32153600.0, "progress": 0.2788558031313553, "epoch": 25.097118486504883, "img/sec/core": 541.8511723185061, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 16.43453637775861, "core_hours": 16.43453637775861} {"step": 31450, "l2_params": 334.7268796860733, "train/loss": 3.5924564003944397, "l2_grads": 1.4375, "lr": 0.0008959918287288739, "uptime": 59338.926361555, "examples_seen": 32204800.0, "progress": 0.2792998410344307, "epoch": 25.137082050973838, "img/sec/core": 532.7007659562241, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 16.461234710351942, "core_hours": 16.461234710351942} {"step": 31500, "l2_params": 334.7747931212489, "train/loss": 2.8510640263557434, "l2_grads": 1.6015625, "lr": 0.000895524011271092, "uptime": 59433.355078784996, "examples_seen": 32256000.0, "progress": 0.27974387893750613, "epoch": 25.177045615442797, "img/sec/core": 542.2079373935649, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 16.4874649095825, "core_hours": 16.4874649095825} {"step": 31550, "l2_params": 334.79869184705603, "train/loss": 2.8488420248031616, "l2_grads": 1.6796875, "lr": 0.0008950552667862644, "uptime": 59528.782824010006, "examples_seen": 32307200.0, "progress": 0.28018791684058153, "epoch": 25.217009179911752, "img/sec/core": 536.5315913027077, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 16.51397261658944, "core_hours": 16.51397261658944} {"step": 31600, "l2_params": 334.8466752088745, "train/loss": 2.673866629600525, "l2_grads": 1.6953125, "lr": 0.000894585596373033, "uptime": 59623.39602635401, "examples_seen": 32358400.0, "progress": 0.28063195474365693, "epoch": 25.256972744380707, "img/sec/core": 541.1506928371784, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 16.540254061684998, "core_hours": 16.540254061684998} {"step": 31650, "l2_params": 334.8584457811054, "train/loss": 5.318825840950012, "l2_grads": 1.3515625, "lr": 0.0008941150011322088, "uptime": 59718.037543112005, "examples_seen": 32409600.0, "progress": 0.28107599264673233, "epoch": 25.296936308849666, "img/sec/core": 540.9887938601022, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 16.566543371895555, "core_hours": 16.566543371895555} {"step": 31700, "l2_params": 334.9632573717041, "train/loss": 2.737419545650482, "l2_grads": 1.5859375, "lr": 0.0008936434821667703, "uptime": 59813.760449476, "examples_seen": 32460800.0, "progress": 0.28152003054980773, "epoch": 25.33689987331862, "img/sec/core": 534.8771986227235, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 16.593133068107775, "core_hours": 16.593133068107775} {"step": 31750, "l2_params": 334.96313929669935, "train/loss": 5.329114079475403, "l2_grads": 1.484375, "lr": 0.0008931710405818614, "uptime": 59907.967278694996, "examples_seen": 32512000.0, "progress": 0.28196406845288313, "epoch": 25.37686343778758, "img/sec/core": 543.4850150935019, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 16.61930163177972, "core_hours": 16.61930163177972} {"step": 31800, "l2_params": 334.9871601433964, "train/loss": 2.6134799122810364, "l2_grads": 1.6953125, "lr": 0.0008926976774847883, "uptime": 60003.761350625995, "examples_seen": 32563200.0, "progress": 0.28240810635595853, "epoch": 25.416827002256536, "img/sec/core": 534.4798375089391, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 16.645911096204998, "core_hours": 16.645911096204998} {"step": 31850, "l2_params": 335.0111326275218, "train/loss": 2.7863855957984924, "l2_grads": 1.8984375, "lr": 0.0008922233939850159, "uptime": 60098.702548304005, "examples_seen": 32614400.0, "progress": 0.28285214425903393, "epoch": 25.456790566725495, "img/sec/core": 539.281168262138, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 16.672283651115556, "core_hours": 16.672283651115556} {"step": 31900, "l2_params": 335.0474881803138, "train/loss": 2.8544947504997253, "l2_grads": 1.6328125, "lr": 0.000891748191194167, "uptime": 60193.985026883995, "examples_seen": 32665600.0, "progress": 0.28329618216210933, "epoch": 25.49675413119445, "img/sec/core": 537.3495816128861, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 16.698751006276662, "core_hours": 16.698751006276662} {"step": 31950, "l2_params": 335.0832714835597, "train/loss": 5.250809907913208, "l2_grads": 1.484375, "lr": 0.0008912720702260207, "uptime": 60288.96621594, "examples_seen": 32716800.0, "progress": 0.2837402200651848, "epoch": 25.536717695663405, "img/sec/core": 539.0541064906258, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 16.725134669903333, "core_hours": 16.725134669903333} {"step": 32000, "l2_params": 335.0952246307197, "train/loss": 4.847177028656006, "l2_grads": 1.2734375, "lr": 0.0008907950321965062, "uptime": 60383.349971132004, "examples_seen": 32768000.0, "progress": 0.2841842579682602, "epoch": 25.576681260132364, "img/sec/core": 542.4662315654447, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 16.751352379678888, "core_hours": 16.751352379678888} {"step": 32050, "l2_params": 335.20895273275073, "train/loss": 5.336175084114075, "l2_grads": 1.4140625, "lr": 0.0008903170782237021, "uptime": 60478.058783894, "examples_seen": 32819200.0, "progress": 0.2846282958713356, "epoch": 25.61664482460132, "img/sec/core": 540.6043905192156, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 16.777660383223886, "core_hours": 16.777660383223886} {"step": 32100, "l2_params": 335.2567739691288, "train/loss": 2.749865710735321, "l2_grads": 1.640625, "lr": 0.0008898382094278355, "uptime": 60572.344425585005, "examples_seen": 32870400.0, "progress": 0.285072333774411, "epoch": 25.65660838907028, "img/sec/core": 543.0307211335162, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 16.803850839249165, "core_hours": 16.803850839249165} {"step": 32150, "l2_params": 335.28075630264703, "train/loss": 2.7491270303726196, "l2_grads": 1.578125, "lr": 0.0008893584269312756, "uptime": 60666.955937872, "examples_seen": 32921600.0, "progress": 0.2855163716774864, "epoch": 25.696571953539234, "img/sec/core": 541.1603594781271, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 16.830131814884442, "core_hours": 16.830131814884442} {"step": 32200, "l2_params": 335.28091067416887, "train/loss": 3.575689733028412, "l2_grads": 1.5546875, "lr": 0.0008888777318585339, "uptime": 60761.510101067004, "examples_seen": 32972800.0, "progress": 0.2859604095805618, "epoch": 25.736535518008193, "img/sec/core": 541.4885846370165, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 16.856396860216385, "core_hours": 16.856396860216385} {"step": 32250, "l2_params": 335.28686994311306, "train/loss": 4.354565382003784, "l2_grads": 1.375, "lr": 0.0008883961253362617, "uptime": 60856.201624981, "examples_seen": 33024000.0, "progress": 0.2864044474836372, "epoch": 25.776499082477148, "img/sec/core": 540.7030944659899, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 16.88270006130361, "core_hours": 16.88270006130361} {"step": 32300, "l2_params": 335.34675238614955, "train/loss": 3.0977229475975037, "l2_grads": 1.5078125, "lr": 0.0008879136084932451, "uptime": 60950.954384804005, "examples_seen": 33075200.0, "progress": 0.2868484853867126, "epoch": 25.816462646946103, "img/sec/core": 540.3536540322641, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 16.909020272365556, "core_hours": 16.909020272365556} {"step": 32350, "l2_params": 335.4243449884601, "train/loss": 4.597370505332947, "l2_grads": 1.296875, "lr": 0.0008874301824604047, "uptime": 61045.748808175005, "examples_seen": 33126400.0, "progress": 0.287292523289788, "epoch": 25.856426211415062, "img/sec/core": 540.1161606270515, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 16.935352056635274, "core_hours": 16.935352056635274} {"step": 32400, "l2_params": 335.4484492576691, "train/loss": 2.8984803557395935, "l2_grads": 1.6875, "lr": 0.0008869458483707925, "uptime": 61140.457463828, "examples_seen": 33177600.0, "progress": 0.28773656119286345, "epoch": 25.896389775884018, "img/sec/core": 540.6052873096559, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 16.961660016538886, "core_hours": 16.961660016538886} {"step": 32450, "l2_params": 335.4546020537839, "train/loss": 2.78726589679718, "l2_grads": 1.6171875, "lr": 0.0008864606073595869, "uptime": 61235.126056844994, "examples_seen": 33228800.0, "progress": 0.28818059909593885, "epoch": 25.936353340352976, "img/sec/core": 540.8340651139335, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 16.987956847932498, "core_hours": 16.987956847932498} {"step": 32500, "l2_params": 335.51431775987595, "train/loss": 2.679034411907196, "l2_grads": 1.6484375, "lr": 0.000885974460564094, "uptime": 61330.37838191101, "examples_seen": 33280000.0, "progress": 0.28862463699901425, "epoch": 25.976316904821932, "img/sec/core": 537.5196874671457, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 17.0144158271175, "core_hours": 17.0144158271175, "val/acc@1": 0.5753348214285714, "val/loss": 1.810582921821244, "z/secs/eval/val": 31.74794992299576} {"step": 32550, "l2_params": 335.5681312388365, "train/loss": 2.6717347502708435, "l2_grads": 1.6875, "lr": 0.0008854874091237414, "uptime": 61455.129190155, "examples_seen": 33331200.0, "progress": 0.28906867490208965, "epoch": 26.016280469290887, "img/sec/core": 410.41818262100935, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 17.049068829407496, "core_hours": 17.049068829407496} {"step": 32600, "l2_params": 335.59192545364897, "train/loss": 4.9882766008377075, "l2_grads": 1.890625, "lr": 0.0008849994541800784, "uptime": 61550.089708222, "examples_seen": 33382400.0, "progress": 0.28951271280516505, "epoch": 26.056244033759846, "img/sec/core": 539.171447694433, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 17.075446751092777, "core_hours": 17.075446751092777} {"step": 32650, "l2_params": 335.59809307879715, "train/loss": 2.6120097041130066, "l2_grads": 1.6328125, "lr": 0.0008845105968767709, "uptime": 61645.51773090601, "examples_seen": 33433600.0, "progress": 0.28995675070824045, "epoch": 26.0962075982288, "img/sec/core": 536.5300313257093, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 17.101954535171668, "core_hours": 17.101954535171668} {"step": 32700, "l2_params": 335.598162916791, "train/loss": 2.7067596316337585, "l2_grads": 1.5859375, "lr": 0.0008840208383595995, "uptime": 61740.297775657, "examples_seen": 33484800.0, "progress": 0.29040078861131585, "epoch": 26.13617116269776, "img/sec/core": 540.1980990250885, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 17.128282325380276, "core_hours": 17.128282325380276} {"step": 32750, "l2_params": 335.6696432133832, "train/loss": 3.0247220396995544, "l2_grads": 1.6953125, "lr": 0.0008835301797764589, "uptime": 61834.971981069, "examples_seen": 33536000.0, "progress": 0.29084482651439125, "epoch": 26.176134727166716, "img/sec/core": 540.8020038530168, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 17.154580715772497, "core_hours": 17.154580715772497} {"step": 32800, "l2_params": 335.6935756874303, "train/loss": 3.189127564430237, "l2_grads": 1.6015625, "lr": 0.0008830386222773504, "uptime": 61929.642305188, "examples_seen": 33587200.0, "progress": 0.29128886441746665, "epoch": 26.216098291635674, "img/sec/core": 540.8241756481524, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 17.180878028027774, "core_hours": 17.180878028027774} {"step": 32850, "l2_params": 335.70598854084733, "train/loss": 2.789216637611389, "l2_grads": 1.609375, "lr": 0.0008825461670143845, "uptime": 62024.89015104101, "examples_seen": 33638400.0, "progress": 0.2917329023205421, "epoch": 26.25606185610463, "img/sec/core": 537.5449653634582, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 17.207335762986943, "core_hours": 17.207335762986943} {"step": 32900, "l2_params": 335.7296028218803, "train/loss": 5.347182750701904, "l2_grads": 1.65625, "lr": 0.0008820528151417752, "uptime": 62119.65869023801, "examples_seen": 33689600.0, "progress": 0.2921769402236175, "epoch": 26.296025420573585, "img/sec/core": 540.2636827984404, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 17.233660357208333, "core_hours": 17.233660357208333} {"step": 32950, "l2_params": 335.75372880468507, "train/loss": 4.648711323738098, "l2_grads": 1.3671875, "lr": 0.000881558567815838, "uptime": 62214.591321900996, "examples_seen": 33740800.0, "progress": 0.2926209781266929, "epoch": 26.335988985042544, "img/sec/core": 539.3298289860995, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 17.260030532670275, "core_hours": 17.260030532670275} {"step": 33000, "l2_params": 335.75367645045975, "train/loss": 4.545159339904785, "l2_grads": 1.3203125, "lr": 0.0008810634261949867, "uptime": 62308.91140431301, "examples_seen": 33792000.0, "progress": 0.2930650160297683, "epoch": 26.3759525495115, "img/sec/core": 542.8324349457778, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 17.2862305555625, "core_hours": 17.2862305555625} {"step": 33050, "l2_params": 335.8072974424841, "train/loss": 2.689807653427124, "l2_grads": 1.703125, "lr": 0.0008805673914397323, "uptime": 62404.171444754, "examples_seen": 33843200.0, "progress": 0.2935090539328437, "epoch": 26.415916113980458, "img/sec/core": 537.4761522562728, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 17.312691677907218, "core_hours": 17.312691677907218} {"step": 33100, "l2_params": 335.8131208699825, "train/loss": 2.7121562361717224, "l2_grads": 1.609375, "lr": 0.0008800704647126781, "uptime": 62499.602048185, "examples_seen": 33894400.0, "progress": 0.2939530918359191, "epoch": 26.455879678449413, "img/sec/core": 536.5155218474536, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 17.339200178860274, "core_hours": 17.339200178860274} {"step": 33150, "l2_params": 335.84922386671525, "train/loss": 2.8299570083618164, "l2_grads": 1.59375, "lr": 0.0008795726471785187, "uptime": 62594.53099134301, "examples_seen": 33945600.0, "progress": 0.2943971297389945, "epoch": 26.49584324291837, "img/sec/core": 539.3507848789243, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 17.3655693297375, "core_hours": 17.3655693297375} {"step": 33200, "l2_params": 335.8790763150482, "train/loss": 2.9062135219573975, "l2_grads": 1.6875, "lr": 0.0008790739400040357, "uptime": 62689.552583219, "examples_seen": 33996800.0, "progress": 0.2948411676420699, "epoch": 26.535806807387328, "img/sec/core": 538.8249027317703, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 17.391964216369722, "core_hours": 17.391964216369722} {"step": 33250, "l2_params": 335.92662482397105, "train/loss": 3.124774217605591, "l2_grads": 1.5859375, "lr": 0.0008785743443580957, "uptime": 62784.92190657501, "examples_seen": 34048000.0, "progress": 0.2952852055451453, "epoch": 26.575770371856283, "img/sec/core": 536.8602628003916, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 17.41845569507972, "core_hours": 17.41845569507972} {"step": 33300, "l2_params": 335.9329738067179, "train/loss": 3.544905126094818, "l2_grads": 1.453125, "lr": 0.0008780738614116489, "uptime": 62880.49030521601, "examples_seen": 34099200.0, "progress": 0.2957292434482207, "epoch": 26.615733936325242, "img/sec/core": 535.7419474227161, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 17.44500247248, "core_hours": 17.44500247248} {"step": 33350, "l2_params": 335.93292438744373, "train/loss": 2.852914273738861, "l2_grads": 1.6171875, "lr": 0.0008775724923377239, "uptime": 62975.334507133, "examples_seen": 34150400.0, "progress": 0.29617328135129617, "epoch": 26.655697500794197, "img/sec/core": 539.8326831281911, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 17.47134808412361, "core_hours": 17.47134808412361} {"step": 33400, "l2_params": 335.9775819111671, "train/loss": 2.790065348148346, "l2_grads": 1.7734375, "lr": 0.0008770702383114287, "uptime": 63070.44085189, "examples_seen": 34201600.0, "progress": 0.29661731925437157, "epoch": 26.695661065263156, "img/sec/core": 538.3447353677095, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 17.497766513222775, "core_hours": 17.497766513222775} {"step": 33450, "l2_params": 336.01349867090534, "train/loss": 2.5692005157470703, "l2_grads": 1.6484375, "lr": 0.0008765671005099422, "uptime": 63166.734525684005, "examples_seen": 34252800.0, "progress": 0.29706135715744697, "epoch": 26.73562462973211, "img/sec/core": 531.70678802358, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 17.524514755943333, "core_hours": 17.524514755943333} {"step": 33500, "l2_params": 336.03752725932634, "train/loss": 2.703332841396332, "l2_grads": 1.671875, "lr": 0.0008760630801125159, "uptime": 63260.989010460005, "examples_seen": 34304000.0, "progress": 0.29750539506052237, "epoch": 26.775588194201067, "img/sec/core": 543.2102262473671, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 17.550696557269998, "core_hours": 17.550696557269998} {"step": 33550, "l2_params": 336.10919740186375, "train/loss": 3.3487257957458496, "l2_grads": 1.625, "lr": 0.0008755581783004698, "uptime": 63356.16675573701, "examples_seen": 34355200.0, "progress": 0.29794943296359777, "epoch": 26.815551758670026, "img/sec/core": 537.9408794670256, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 17.577134819846943, "core_hours": 17.577134819846943} {"step": 33600, "l2_params": 336.1330230424965, "train/loss": 2.5366216897964478, "l2_grads": 1.7109375, "lr": 0.0008750523962571909, "uptime": 63451.276771652, "examples_seen": 34406400.0, "progress": 0.29839347086667317, "epoch": 26.85551532313898, "img/sec/core": 538.3239557625658, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 17.60355426871222, "core_hours": 17.60355426871222} {"step": 33650, "l2_params": 336.1390863192832, "train/loss": 2.6970945596694946, "l2_grads": 1.6875, "lr": 0.0008745457351681281, "uptime": 63546.46792228501, "examples_seen": 34457600.0, "progress": 0.29883750876974857, "epoch": 26.89547888760794, "img/sec/core": 537.8651235910858, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 17.629996254999167, "core_hours": 17.629996254999167} {"step": 33700, "l2_params": 336.13919671813414, "train/loss": 4.402178049087524, "l2_grads": 1.40625, "lr": 0.0008740381962207908, "uptime": 63641.650735046, "examples_seen": 34508800.0, "progress": 0.299281546672824, "epoch": 26.935442452076895, "img/sec/core": 537.9122397713293, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 17.656435925210552, "core_hours": 17.656435925210552} {"step": 33750, "l2_params": 336.1927446026126, "train/loss": 3.139077663421631, "l2_grads": 1.4765625, "lr": 0.0008735297806047466, "uptime": 63736.904437492005, "examples_seen": 34560000.0, "progress": 0.2997255845758994, "epoch": 26.975406016545854, "img/sec/core": 537.511914867811, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 17.68289528700111, "core_hours": 17.68289528700111} {"step": 33800, "l2_params": 336.24036928587265, "train/loss": 2.588611125946045, "l2_grads": 1.7109375, "lr": 0.0008730204895116172, "uptime": 63832.109213145, "examples_seen": 34611200.0, "progress": 0.30016962247897483, "epoch": 27.01536958101481, "img/sec/core": 537.7881482186973, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 17.70934105801583, "core_hours": 17.70934105801583} {"step": 33850, "l2_params": 336.2881600093884, "train/loss": 5.127264022827148, "l2_grads": 1.390625, "lr": 0.000872510324135076, "uptime": 63927.307401631, "examples_seen": 34662400.0, "progress": 0.30061366038205023, "epoch": 27.055333145483765, "img/sec/core": 537.8253600648053, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 17.73578499926194, "core_hours": 17.73578499926194} {"step": 33900, "l2_params": 336.3743874251204, "train/loss": 2.9496272802352905, "l2_grads": 1.671875, "lr": 0.0008719992856708454, "uptime": 64023.840960627, "examples_seen": 34713600.0, "progress": 0.30105769828512563, "epoch": 27.095296709952724, "img/sec/core": 530.3855004674676, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 17.76259987676083, "core_hours": 17.76259987676083} {"step": 33950, "l2_params": 336.4192156697875, "train/loss": 3.7934746742248535, "l2_grads": 1.578125, "lr": 0.000871487375316695, "uptime": 64120.451023443005, "examples_seen": 34764800.0, "progress": 0.30150173618820103, "epoch": 27.13526027442168, "img/sec/core": 529.965497460763, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 17.789436005320834, "core_hours": 17.789436005320834} {"step": 34000, "l2_params": 336.43415467173884, "train/loss": 2.6248812675476074, "l2_grads": 1.6875, "lr": 0.0008709745942724376, "uptime": 64215.07870876501, "examples_seen": 34816000.0, "progress": 0.30194577409127643, "epoch": 27.175223838890638, "img/sec/core": 541.067868518329, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 17.815721473465832, "core_hours": 17.815721473465832} {"step": 34050, "l2_params": 336.5232915880415, "train/loss": 2.7167059183120728, "l2_grads": 1.671875, "lr": 0.0008704609437399269, "uptime": 64311.608967748005, "examples_seen": 34867200.0, "progress": 0.30238981199435183, "epoch": 27.215187403359593, "img/sec/core": 530.4036323886727, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 17.842535434294444, "core_hours": 17.842535434294444} {"step": 34100, "l2_params": 336.5413424756496, "train/loss": 2.6597037315368652, "l2_grads": 1.6484375, "lr": 0.0008699464249230544, "uptime": 64406.54444779201, "examples_seen": 34918400.0, "progress": 0.30283384989742723, "epoch": 27.25515096782855, "img/sec/core": 539.3136472925344, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 17.868906400973334, "core_hours": 17.868906400973334} {"step": 34150, "l2_params": 336.5414425863849, "train/loss": 2.8174372911453247, "l2_grads": 1.796875, "lr": 0.0008694310390277452, "uptime": 64502.363563331004, "examples_seen": 34969600.0, "progress": 0.30327788780050263, "epoch": 27.295114532297507, "img/sec/core": 534.3401440515687, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 17.895522821956387, "core_hours": 17.895522821956387} {"step": 34200, "l2_params": 336.58291633758313, "train/loss": 2.605795204639435, "l2_grads": 1.6484375, "lr": 0.0008689147872619597, "uptime": 64597.78479205101, "examples_seen": 35020800.0, "progress": 0.30372192570357803, "epoch": 27.335078096766463, "img/sec/core": 536.5682321093956, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 17.922028718823057, "core_hours": 17.922028718823057} {"step": 34250, "l2_params": 336.597913352768, "train/loss": 2.733199179172516, "l2_grads": 1.6484375, "lr": 0.0008683976708356841, "uptime": 64693.88706596401, "examples_seen": 35072000.0, "progress": 0.3041659636066535, "epoch": 27.37504166123542, "img/sec/core": 532.7657496049617, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 17.94872379491, "core_hours": 17.94872379491} {"step": 34300, "l2_params": 336.61293435951774, "train/loss": 2.6141759157180786, "l2_grads": 1.7421875, "lr": 0.0008678796909609348, "uptime": 64788.175939066, "examples_seen": 35123200.0, "progress": 0.3046100015097289, "epoch": 27.415005225704377, "img/sec/core": 543.0121107144538, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 17.974915148549442, "core_hours": 17.974915148549442} {"step": 34350, "l2_params": 336.61009702900327, "train/loss": 4.408644199371338, "l2_grads": 1.484375, "lr": 0.0008673608488517499, "uptime": 64884.018158605, "examples_seen": 35174400.0, "progress": 0.3050540394128043, "epoch": 27.454968790173336, "img/sec/core": 534.2113344856866, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 18.001537987310275, "core_hours": 18.001537987310275} {"step": 34400, "l2_params": 336.6102304827127, "train/loss": 2.5715590119361877, "l2_grads": 1.9453125, "lr": 0.0008668411457241881, "uptime": 64978.778681639, "examples_seen": 35225600.0, "progress": 0.3054980773158797, "epoch": 27.49493235464229, "img/sec/core": 540.309385814921, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 18.02786035481972, "core_hours": 18.02786035481972} {"step": 34450, "l2_params": 336.61923268360647, "train/loss": 2.798732042312622, "l2_grads": 1.765625, "lr": 0.0008663205827963272, "uptime": 65074.816038476, "examples_seen": 35276800.0, "progress": 0.3059421152189551, "epoch": 27.534895919111246, "img/sec/core": 533.1258760786253, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 18.054537398385552, "core_hours": 18.054537398385552} {"step": 34500, "l2_params": 336.6551070945048, "train/loss": 2.864436388015747, "l2_grads": 1.828125, "lr": 0.0008657991612882597, "uptime": 65170.072248337005, "examples_seen": 35328000.0, "progress": 0.3063861531220305, "epoch": 27.574859483580205, "img/sec/core": 537.4977660218526, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 18.080997456680276, "core_hours": 18.080997456680276} {"step": 34550, "l2_params": 336.6552622862147, "train/loss": 3.1604140400886536, "l2_grads": 1.6953125, "lr": 0.0008652768824220903, "uptime": 65264.779010771, "examples_seen": 35379200.0, "progress": 0.3068301910251059, "epoch": 27.61482304804916, "img/sec/core": 540.6160941852677, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 18.10730489068972, "core_hours": 18.10730489068972} {"step": 34600, "l2_params": 336.67911889744886, "train/loss": 3.2575881481170654, "l2_grads": 1.5625, "lr": 0.0008647537474219342, "uptime": 65359.014697623, "examples_seen": 35430400.0, "progress": 0.3072742289281813, "epoch": 27.65478661251812, "img/sec/core": 543.3185846080913, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 18.133481470370832, "core_hours": 18.133481470370832} {"step": 34650, "l2_params": 336.75046544372066, "train/loss": 2.956891894340515, "l2_grads": 1.78125, "lr": 0.0008642297575139114, "uptime": 65453.739453013, "examples_seen": 35481600.0, "progress": 0.3077182668312567, "epoch": 27.694750176987075, "img/sec/core": 540.5134042226119, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 18.159793902423605, "core_hours": 18.159793902423605} {"step": 34700, "l2_params": 336.7742906629936, "train/loss": 2.734802484512329, "l2_grads": 1.78125, "lr": 0.0008637049139261466, "uptime": 65548.969748337, "examples_seen": 35532800.0, "progress": 0.30816230473433215, "epoch": 27.734713741456034, "img/sec/core": 537.6440325613141, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 18.18624676223583, "core_hours": 18.18624676223583} {"step": 34750, "l2_params": 336.77730784321705, "train/loss": 4.537001729011536, "l2_grads": 1.5703125, "lr": 0.0008631792178887662, "uptime": 65643.334281004, "examples_seen": 35584000.0, "progress": 0.30860634263740755, "epoch": 27.77467730592499, "img/sec/core": 542.5767346368732, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 18.21245913242111, "core_hours": 18.21245913242111} {"step": 34800, "l2_params": 336.7950711068602, "train/loss": 2.710032820701599, "l2_grads": 1.671875, "lr": 0.0008626526706338938, "uptime": 65737.80552044901, "examples_seen": 35635200.0, "progress": 0.30905038054048295, "epoch": 27.814640870393944, "img/sec/core": 541.9638855252465, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 18.23870114337806, "core_hours": 18.23870114337806} {"step": 34850, "l2_params": 336.8190671330455, "train/loss": 3.3982707262039185, "l2_grads": 1.59375, "lr": 0.0008621252733956471, "uptime": 65833.507922569, "examples_seen": 35686400.0, "progress": 0.30949441844355835, "epoch": 27.854604434862903, "img/sec/core": 534.9917960868537, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 18.265285143966942, "core_hours": 18.265285143966942} {"step": 34901, "l2_params": 336.8248527726428, "train/loss": 4.986044764518738, "l2_grads": 1.5, "lr": 0.000861597027410137, "uptime": 65928.163702688, "examples_seen": 35737600.0, "progress": 0.30993845634663375, "epoch": 27.89456799933186, "img/sec/core": 540.9072740790738, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 18.291578416222226, "core_hours": 18.291578416222226} {"step": 34950, "l2_params": 336.9023397417084, "train/loss": 2.665165662765503, "l2_grads": 1.7265625, "lr": 0.0008610679339154646, "uptime": 66023.397927856, "examples_seen": 35788800.0, "progress": 0.31038249424970915, "epoch": 27.934531563800817, "img/sec/core": 537.6218466594584, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 18.31803236765778, "core_hours": 18.31803236765778} {"step": 35000, "l2_params": 336.90229046462787, "train/loss": 3.570364773273468, "l2_grads": 1.4921875, "lr": 0.0008605379941517158, "uptime": 66118.497449131, "examples_seen": 35840000.0, "progress": 0.31082653215278455, "epoch": 27.974495128269773, "img/sec/core": 538.3833621196195, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 18.344448901345277, "core_hours": 18.344448901345277, "val/acc@1": 0.5856784119897959, "val/loss": 1.7729346381158244, "z/secs/eval/val": 31.752287566007} {"step": 35050, "l2_params": 336.9022919139539, "train/loss": 2.604325532913208, "l2_grads": 1.859375, "lr": 0.0008600072093609602, "uptime": 66244.320321051, "examples_seen": 35891200.0, "progress": 0.31127057005585995, "epoch": 28.014458692738728, "img/sec/core": 406.9212474545532, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 18.37939969910083, "core_hours": 18.37939969910083} {"step": 35100, "l2_params": 336.94993368822617, "train/loss": 4.998532056808472, "l2_grads": 1.421875, "lr": 0.0008594755807872491, "uptime": 66339.84267375, "examples_seen": 35942400.0, "progress": 0.31171460795893535, "epoch": 28.054422257207687, "img/sec/core": 536.000198417803, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 18.405933685961664, "core_hours": 18.405933685961664} {"step": 35150, "l2_params": 337.0688507653147, "train/loss": 3.1975119709968567, "l2_grads": 1.5625, "lr": 0.0008589431096766096, "uptime": 66434.750153079, "examples_seen": 35993600.0, "progress": 0.3121586458620108, "epoch": 28.094385821676642, "img/sec/core": 539.4727619149008, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 18.432296874664168, "core_hours": 18.432296874664168} {"step": 35200, "l2_params": 337.07493197451663, "train/loss": 2.6278752088546753, "l2_grads": 1.8046875, "lr": 0.0008584097972770451, "uptime": 66529.578031557, "examples_seen": 36044800.0, "progress": 0.3126026837650862, "epoch": 28.1343493861456, "img/sec/core": 539.9256086054861, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 18.458637952019167, "core_hours": 18.458637952019167} {"step": 35250, "l2_params": 337.0751695421587, "train/loss": 2.677825093269348, "l2_grads": 1.6640625, "lr": 0.0008578756448385308, "uptime": 66624.468182087, "examples_seen": 36096000.0, "progress": 0.3130467216681616, "epoch": 28.174312950614556, "img/sec/core": 539.571280201646, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 18.48499632716639, "core_hours": 18.48499632716639} {"step": 35300, "l2_params": 337.075324540469, "train/loss": 2.6050431728363037, "l2_grads": 1.8203125, "lr": 0.0008573406536130098, "uptime": 66719.760291194, "examples_seen": 36147200.0, "progress": 0.313490759571237, "epoch": 28.214276515083515, "img/sec/core": 537.2952753360545, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 18.51146635747389, "core_hours": 18.51146635747389} {"step": 35350, "l2_params": 337.0752477656139, "train/loss": 2.5608890056610107, "l2_grads": 1.75, "lr": 0.0008568048248543921, "uptime": 66815.140587517, "examples_seen": 36198400.0, "progress": 0.3139347974743124, "epoch": 28.25424007955247, "img/sec/core": 536.7985000446583, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 18.53796088423028, "core_hours": 18.53796088423028} {"step": 35400, "l2_params": 337.0931285917143, "train/loss": 2.6000850796699524, "l2_grads": 1.75, "lr": 0.0008562681598185502, "uptime": 66911.580917752, "examples_seen": 36249600.0, "progress": 0.3143788353773878, "epoch": 28.294203644021426, "img/sec/core": 530.8982235465263, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 18.564749864851112, "core_hours": 18.564749864851112} {"step": 35450, "l2_params": 337.1109085277982, "train/loss": 3.146098017692566, "l2_grads": 1.6484375, "lr": 0.0008557306597633163, "uptime": 67006.09218689101, "examples_seen": 36300800.0, "progress": 0.3148228732804632, "epoch": 28.334167208490385, "img/sec/core": 541.7343398985973, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 18.591002995167504, "core_hours": 18.591002995167504} {"step": 35500, "l2_params": 337.1110997203852, "train/loss": 2.7066810727119446, "l2_grads": 1.8515625, "lr": 0.0008551923259484803, "uptime": 67101.67064969901, "examples_seen": 36352000.0, "progress": 0.3152669111835386, "epoch": 28.37413077295934, "img/sec/core": 535.685535169692, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 18.617552568169724, "core_hours": 18.617552568169724} {"step": 35550, "l2_params": 337.1469029661811, "train/loss": 2.6584076285362244, "l2_grads": 1.671875, "lr": 0.0008546531596357863, "uptime": 67196.424369759, "examples_seen": 36403200.0, "progress": 0.315710949086614, "epoch": 28.4140943374283, "img/sec/core": 540.348178072418, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 18.643873045964163, "core_hours": 18.643873045964163} {"step": 35600, "l2_params": 337.1469565523319, "train/loss": 2.7428696155548096, "l2_grads": 1.7734375, "lr": 0.0008541131620889297, "uptime": 67291.604420594, "examples_seen": 36454400.0, "progress": 0.3161549869896894, "epoch": 28.454057901897254, "img/sec/core": 537.9278488594077, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 18.67031194897389, "core_hours": 18.67031194897389} {"step": 35650, "l2_params": 337.1827053065037, "train/loss": 3.8474008440971375, "l2_grads": 1.453125, "lr": 0.0008535723345735527, "uptime": 67386.80776598101, "examples_seen": 36505600.0, "progress": 0.31659902489276487, "epoch": 28.49402146636621, "img/sec/core": 537.7962275576298, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 18.696757322692502, "core_hours": 18.696757322692502} {"step": 35700, "l2_params": 337.23013516365944, "train/loss": 5.158587574958801, "l2_grads": 1.4921875, "lr": 0.0008530306783572445, "uptime": 67482.684681438, "examples_seen": 36556800.0, "progress": 0.31704306279584027, "epoch": 28.53398503083517, "img/sec/core": 534.0180142003901, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 18.723389799208334, "core_hours": 18.723389799208334} {"step": 35750, "l2_params": 337.2361946419193, "train/loss": 2.6559524536132812, "l2_grads": 1.7890625, "lr": 0.000852488194709536, "uptime": 67577.351936998, "examples_seen": 36608000.0, "progress": 0.31748710069891567, "epoch": 28.573948595304124, "img/sec/core": 540.8417060061984, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 18.74968625908611, "core_hours": 18.74968625908611} {"step": 35800, "l2_params": 337.2836242156777, "train/loss": 4.400918364524841, "l2_grads": 1.59375, "lr": 0.0008519448849018982, "uptime": 67672.62886464801, "examples_seen": 36659200.0, "progress": 0.31793113860199107, "epoch": 28.613912159773083, "img/sec/core": 537.3808881419981, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 18.776152072322226, "core_hours": 18.776152072322226} {"step": 35850, "l2_params": 337.3074016429598, "train/loss": 2.6917667984962463, "l2_grads": 1.65625, "lr": 0.0008514007502077368, "uptime": 67767.358641567, "examples_seen": 36710400.0, "progress": 0.31837517650506647, "epoch": 28.653875724242038, "img/sec/core": 540.484752157547, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 18.802465899244165, "core_hours": 18.802465899244165} {"step": 35900, "l2_params": 337.34306826008003, "train/loss": 4.346687316894531, "l2_grads": 1.5546875, "lr": 0.0008508557919023919, "uptime": 67862.96574063701, "examples_seen": 36761600.0, "progress": 0.31881921440814187, "epoch": 28.693839288710997, "img/sec/core": 535.5250865054265, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 18.829023426763612, "core_hours": 18.829023426763612} {"step": 35950, "l2_params": 337.34917636904794, "train/loss": 5.168338656425476, "l2_grads": 1.53125, "lr": 0.0008503100112631335, "uptime": 67958.664419345, "examples_seen": 36812800.0, "progress": 0.31926325231121727, "epoch": 28.733802853179952, "img/sec/core": 535.0126113676696, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 18.85560639307139, "core_hours": 18.85560639307139} {"step": 36000, "l2_params": 337.3609898906511, "train/loss": 5.2739750146865845, "l2_grads": 1.734375, "lr": 0.00084976340956916, "uptime": 68054.452847274, "examples_seen": 36864000.0, "progress": 0.31970729021429267, "epoch": 28.773766417648908, "img/sec/core": 534.5113298857952, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 18.882214289718334, "core_hours": 18.882214289718334} {"step": 36050, "l2_params": 337.4322154151853, "train/loss": 5.004815459251404, "l2_grads": 1.4375, "lr": 0.0008492159881015932, "uptime": 68150.193113364, "examples_seen": 36915200.0, "progress": 0.3201513281173681, "epoch": 28.813729982117867, "img/sec/core": 534.7802141250722, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 18.908808808076667, "core_hours": 18.908808808076667} {"step": 36100, "l2_params": 337.4855075013407, "train/loss": 2.8424474000930786, "l2_grads": 1.6953125, "lr": 0.0008486677481434762, "uptime": 68245.30248435901, "examples_seen": 36966400.0, "progress": 0.32059536602044353, "epoch": 28.853693546586822, "img/sec/core": 538.3276060430227, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 18.9352280777975, "core_hours": 18.9352280777975} {"step": 36150, "l2_params": 337.5329295278092, "train/loss": 3.7861942648887634, "l2_grads": 1.421875, "lr": 0.0008481186909797721, "uptime": 68339.885491546, "examples_seen": 37017600.0, "progress": 0.32103940392351893, "epoch": 28.89365711105578, "img/sec/core": 541.3234525180632, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 18.961501135349444, "core_hours": 18.961501135349444} {"step": 36200, "l2_params": 337.53303657753264, "train/loss": 2.8372327089309692, "l2_grads": 1.9296875, "lr": 0.0008475688178973571, "uptime": 68435.710171732, "examples_seen": 37068800.0, "progress": 0.32148344182659433, "epoch": 28.933620675524736, "img/sec/core": 534.3091143180897, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 18.98811910206778, "core_hours": 18.98811910206778} {"step": 36250, "l2_params": 337.53310456855564, "train/loss": 2.7475082874298096, "l2_grads": 1.671875, "lr": 0.000847018130185021, "uptime": 68531.407271074, "examples_seen": 37120000.0, "progress": 0.32192747972966973, "epoch": 28.973584239993695, "img/sec/core": 535.021441109982, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 19.014701629662778, "core_hours": 19.014701629662778} {"step": 36300, "l2_params": 337.5450186988952, "train/loss": 2.901374876499176, "l2_grads": 1.703125, "lr": 0.0008464666291334619, "uptime": 68626.014357745, "examples_seen": 37171200.0, "progress": 0.32237151763274513, "epoch": 29.01354780446265, "img/sec/core": 541.1856743675694, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 19.04098137596028, "core_hours": 19.04098137596028} {"step": 36350, "l2_params": 337.5926420883422, "train/loss": 2.4862632751464844, "l2_grads": 1.75, "lr": 0.0008459143160352867, "uptime": 68722.455741205, "examples_seen": 37222400.0, "progress": 0.32281555553582053, "epoch": 29.053511368931606, "img/sec/core": 530.8924256694914, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 19.06777064914361, "core_hours": 19.06777064914361} {"step": 36400, "l2_params": 337.6163225467631, "train/loss": 2.6415178775787354, "l2_grads": 1.78125, "lr": 0.0008453611921850025, "uptime": 68817.088370589, "examples_seen": 37273600.0, "progress": 0.32325959343889593, "epoch": 29.093474933400564, "img/sec/core": 541.03960054035, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 19.094057490639166, "core_hours": 19.094057490639166} {"step": 36450, "l2_params": 337.6164613877706, "train/loss": 2.7870015501976013, "l2_grads": 1.6796875, "lr": 0.0008448072588790184, "uptime": 68912.249885682, "examples_seen": 37324800.0, "progress": 0.32370363134197133, "epoch": 29.13343849786952, "img/sec/core": 538.0326274751131, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 19.120491244831666, "core_hours": 19.120491244831666} {"step": 36500, "l2_params": 337.65198690043644, "train/loss": 3.279016435146332, "l2_grads": 1.625, "lr": 0.0008442525174156404, "uptime": 69007.871749225, "examples_seen": 37376000.0, "progress": 0.32414766924504673, "epoch": 29.17340206233848, "img/sec/core": 535.4423988712286, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 19.147052873593612, "core_hours": 19.147052873593612} {"step": 36550, "l2_params": 337.6636726972195, "train/loss": 2.689819097518921, "l2_grads": 1.8515625, "lr": 0.0008436969690950684, "uptime": 69103.139728814, "examples_seen": 37427200.0, "progress": 0.3245917071481222, "epoch": 29.213365626807434, "img/sec/core": 537.4313617322878, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 19.173516201257222, "core_hours": 19.173516201257222} {"step": 36600, "l2_params": 337.68752891911777, "train/loss": 3.8774919509887695, "l2_grads": 1.53125, "lr": 0.0008431406152193937, "uptime": 69197.850378089, "examples_seen": 37478400.0, "progress": 0.3250357450511976, "epoch": 29.25332919127639, "img/sec/core": 540.5939077804783, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 19.19982471494472, "core_hours": 19.19982471494472} {"step": 36650, "l2_params": 337.687854259022, "train/loss": 2.6813268661499023, "l2_grads": 1.8046875, "lr": 0.0008425834570925954, "uptime": 69292.788209772, "examples_seen": 37529600.0, "progress": 0.325479782954273, "epoch": 29.293292755745348, "img/sec/core": 539.3002883293119, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 19.226196334856663, "core_hours": 19.226196334856663} {"step": 36700, "l2_params": 337.6878311237503, "train/loss": 3.0342270135879517, "l2_grads": 1.6796875, "lr": 0.0008420254960205381, "uptime": 69387.684810923, "examples_seen": 37580800.0, "progress": 0.3259238208573484, "epoch": 29.333256320214304, "img/sec/core": 539.5346027043398, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 19.252556501843056, "core_hours": 19.252556501843056} {"step": 36750, "l2_params": 337.7353881114807, "train/loss": 3.355013906955719, "l2_grads": 1.7421875, "lr": 0.000841466733310967, "uptime": 69482.57941507001, "examples_seen": 37632000.0, "progress": 0.3263678587604238, "epoch": 29.373219884683262, "img/sec/core": 539.5459569090393, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 19.278916114106114, "core_hours": 19.278916114106114} {"step": 36800, "l2_params": 337.74729510621177, "train/loss": 2.6488969922065735, "l2_grads": 1.7421875, "lr": 0.0008409071702735081, "uptime": 69577.399892781, "examples_seen": 37683200.0, "progress": 0.3268118966634992, "epoch": 29.413183449152218, "img/sec/core": 539.9677499627705, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 19.3052551356925, "core_hours": 19.3052551356925} {"step": 36850, "l2_params": 337.79466737159646, "train/loss": 3.543965458869934, "l2_grads": 1.625, "lr": 0.0008403468082196611, "uptime": 69673.325858625, "examples_seen": 37734400.0, "progress": 0.3272559345665746, "epoch": 29.453147013621177, "img/sec/core": 533.7449516355655, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 19.331901237315833, "core_hours": 19.331901237315833} {"step": 36900, "l2_params": 337.8066156402395, "train/loss": 3.0703747272491455, "l2_grads": 1.6640625, "lr": 0.0008397856484628017, "uptime": 69768.100569117, "examples_seen": 37785600.0, "progress": 0.32769997246965, "epoch": 29.493110578090132, "img/sec/core": 540.2285033022902, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 19.358227545785834, "core_hours": 19.358227545785834} {"step": 36950, "l2_params": 337.81253324467923, "train/loss": 2.776106536388397, "l2_grads": 1.703125, "lr": 0.000839223692318171, "uptime": 69864.112959772, "examples_seen": 37836800.0, "progress": 0.3281440103727254, "epoch": 29.533074142559087, "img/sec/core": 533.2645052447073, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 19.38489765430111, "core_hours": 19.38489765430111} {"step": 37000, "l2_params": 337.8244115036871, "train/loss": 5.151435136795044, "l2_grads": 1.4609375, "lr": 0.0008386609411028795, "uptime": 69958.189281535, "examples_seen": 37888000.0, "progress": 0.32858804827580085, "epoch": 29.573037707028046, "img/sec/core": 544.2389651349686, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 19.411029965901943, "core_hours": 19.411029965901943} {"step": 37050, "l2_params": 337.82442162127654, "train/loss": 2.5555036067962646, "l2_grads": 1.7109375, "lr": 0.0008380973961359007, "uptime": 70052.835698578, "examples_seen": 37939200.0, "progress": 0.32903208617887625, "epoch": 29.613001271497, "img/sec/core": 540.9607843553148, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 19.437320637302776, "core_hours": 19.437320637302776} {"step": 37100, "l2_params": 337.8481566519566, "train/loss": 2.842576265335083, "l2_grads": 1.828125, "lr": 0.0008375330587380681, "uptime": 70145.96375715401, "examples_seen": 37990400.0, "progress": 0.32947612408195165, "epoch": 29.65296483596596, "img/sec/core": 549.7806008509336, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 19.46318954246278, "core_hours": 19.46318954246278} {"step": 37150, "l2_params": 337.85997151417996, "train/loss": 2.574140965938568, "l2_grads": 1.7890625, "lr": 0.0008369679302320718, "uptime": 70239.094836602, "examples_seen": 38041600.0, "progress": 0.32992016198502705, "epoch": 29.692928400434916, "img/sec/core": 549.7627677406111, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 19.48905928675389, "core_hours": 19.48905928675389} {"step": 37200, "l2_params": 337.85990503415394, "train/loss": 2.682533860206604, "l2_grads": 1.796875, "lr": 0.000836402011942458, "uptime": 70332.149913147, "examples_seen": 38092800.0, "progress": 0.33036419988810245, "epoch": 29.732891964903875, "img/sec/core": 550.2117874809236, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 19.5149079191275, "core_hours": 19.5149079191275} {"step": 37250, "l2_params": 337.8836115601606, "train/loss": 2.7368807196617126, "l2_grads": 1.6640625, "lr": 0.0008358353051956227, "uptime": 70425.119005844, "examples_seen": 38144000.0, "progress": 0.33080823779117785, "epoch": 29.77285552937283, "img/sec/core": 550.720659035283, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 19.540732667098887, "core_hours": 19.540732667098887} {"step": 37300, "l2_params": 337.9074609244926, "train/loss": 2.6292994618415833, "l2_grads": 1.7734375, "lr": 0.0008352678113198105, "uptime": 70518.09425769, "examples_seen": 38195200.0, "progress": 0.33125227569425325, "epoch": 29.812819093841785, "img/sec/core": 550.6841765247904, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 19.566559125945, "core_hours": 19.566559125945} {"step": 37350, "l2_params": 337.9313013811017, "train/loss": 4.610148668289185, "l2_grads": 1.4375, "lr": 0.0008346995316451096, "uptime": 70611.03869224801, "examples_seen": 38246400.0, "progress": 0.33169631359732865, "epoch": 29.852782658310744, "img/sec/core": 550.8667651105345, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 19.592377024433336, "core_hours": 19.592377024433336} {"step": 37400, "l2_params": 337.9430743252109, "train/loss": 2.5789798498153687, "l2_grads": 1.8671875, "lr": 0.0008341304675034508, "uptime": 70703.954947128, "examples_seen": 38297600.0, "progress": 0.33214035150040405, "epoch": 29.8927462227797, "img/sec/core": 551.0338321979003, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 19.618187095233335, "core_hours": 19.618187095233335} {"step": 37450, "l2_params": 337.9670292952036, "train/loss": 3.537649393081665, "l2_grads": 1.5234375, "lr": 0.0008335606202286049, "uptime": 70796.788295883, "examples_seen": 38348800.0, "progress": 0.3325843894034795, "epoch": 29.93270978724866, "img/sec/core": 551.5259406953576, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 19.643974136554167, "core_hours": 19.643974136554167} {"step": 37500, "l2_params": 337.96683280778456, "train/loss": 3.7222540974617004, "l2_grads": 1.59375, "lr": 0.0008329899911561761, "uptime": 70889.571322517, "examples_seen": 38400000.0, "progress": 0.3330284273065549, "epoch": 29.972673351717614, "img/sec/core": 551.8250681988056, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 19.669747199508056, "core_hours": 19.669747199508056, "val/acc@1": 0.597297512755102, "val/loss": 1.7245371645810652, "z/secs/eval/val": 31.594735258986475} {"step": 37550, "l2_params": 337.96712609411065, "train/loss": 3.3789762258529663, "l2_grads": 1.6328125, "lr": 0.0008324185816236015, "uptime": 71013.553359112, "examples_seen": 38451200.0, "progress": 0.3334724652096303, "epoch": 30.01263691618657, "img/sec/core": 412.96305018161667, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 19.70418665411778, "core_hours": 19.70418665411778} {"step": 37600, "l2_params": 337.96736881363637, "train/loss": 2.8782562613487244, "l2_grads": 1.78125, "lr": 0.0008318463929701478, "uptime": 71106.212233853, "examples_seen": 38502400.0, "progress": 0.3339165031127057, "epoch": 30.052600480655528, "img/sec/core": 552.5644482853359, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 19.729925230434723, "core_hours": 19.729925230434723} {"step": 37650, "l2_params": 338.00296290075255, "train/loss": 2.5796953439712524, "l2_grads": 1.6953125, "lr": 0.0008312734265369077, "uptime": 71198.906343554, "examples_seen": 38553600.0, "progress": 0.3343605410157811, "epoch": 30.092564045124483, "img/sec/core": 552.3544070400459, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 19.755673594240555, "core_hours": 19.755673594240555} {"step": 37700, "l2_params": 338.03242003125604, "train/loss": 2.680768609046936, "l2_grads": 1.7890625, "lr": 0.000830699683666797, "uptime": 71291.591103172, "examples_seen": 38604800.0, "progress": 0.3348045789188565, "epoch": 30.132527609593442, "img/sec/core": 552.4101288175088, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 19.781419360801113, "core_hours": 19.781419360801113} {"step": 37750, "l2_params": 338.0620623610589, "train/loss": 2.579594314098358, "l2_grads": 1.71875, "lr": 0.0008301251657045516, "uptime": 71384.277338432, "examples_seen": 38656000.0, "progress": 0.3352486168219319, "epoch": 30.172491174062397, "img/sec/core": 552.4013339885431, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 19.80716553726222, "core_hours": 19.80716553726222} {"step": 37800, "l2_params": 338.06214468921985, "train/loss": 2.8625675439834595, "l2_grads": 1.7421875, "lr": 0.0008295498739967222, "uptime": 71476.924170525, "examples_seen": 38707200.0, "progress": 0.3356926547250073, "epoch": 30.212454738531356, "img/sec/core": 552.6362730741287, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 19.832900768399167, "core_hours": 19.832900768399167} {"step": 37850, "l2_params": 338.08586014224994, "train/loss": 3.3403685092926025, "l2_grads": 1.578125, "lr": 0.000828973809891676, "uptime": 71569.544890856, "examples_seen": 38758400.0, "progress": 0.3361366926280827, "epoch": 30.25241830300031, "img/sec/core": 552.7920730590687, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 19.85862874626889, "core_hours": 19.85862874626889} {"step": 37900, "l2_params": 338.15680303300127, "train/loss": 4.510960936546326, "l2_grads": 1.6015625, "lr": 0.0008283969747395876, "uptime": 71662.542800215, "examples_seen": 38809600.0, "progress": 0.3365807305311581, "epoch": 30.292381867469267, "img/sec/core": 550.5500107788021, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 19.88446149886861, "core_hours": 19.88446149886861} {"step": 37950, "l2_params": 338.24567509245406, "train/loss": 2.787507653236389, "l2_grads": 1.734375, "lr": 0.0008278193698924404, "uptime": 71755.225066935, "examples_seen": 38860800.0, "progress": 0.33702476843423357, "epoch": 30.332345431938226, "img/sec/core": 552.4249871302488, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 19.910206572957502, "core_hours": 19.910206572957502} {"step": 38000, "l2_params": 338.2576709449839, "train/loss": 3.1743839979171753, "l2_grads": 1.625, "lr": 0.0008272409967040218, "uptime": 71847.881970737, "examples_seen": 38912000.0, "progress": 0.33746880633730897, "epoch": 30.37230899640718, "img/sec/core": 552.5762020864925, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 19.935944601791387, "core_hours": 19.935944601791387} {"step": 38050, "l2_params": 338.25758722089296, "train/loss": 3.9277403354644775, "l2_grads": 1.421875, "lr": 0.00082666185652992, "uptime": 71940.862482999, "examples_seen": 38963200.0, "progress": 0.33791284424038437, "epoch": 30.41227256087614, "img/sec/core": 550.6530213097544, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 19.961772521864166, "core_hours": 19.961772521864166} {"step": 38100, "l2_params": 338.3048375148329, "train/loss": 2.6481199860572815, "l2_grads": 1.8203125, "lr": 0.0008260819507275206, "uptime": 72033.668362888, "examples_seen": 39014400.0, "progress": 0.33835688214345977, "epoch": 30.452236125345095, "img/sec/core": 551.6891824229098, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 19.98755193294444, "core_hours": 19.98755193294444} {"step": 38150, "l2_params": 338.3051665910343, "train/loss": 4.734787702560425, "l2_grads": 1.59375, "lr": 0.0008255012806560031, "uptime": 72126.437438679, "examples_seen": 39065600.0, "progress": 0.33880092004653517, "epoch": 30.49219968981405, "img/sec/core": 551.9080530170155, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 20.013321120664166, "core_hours": 20.013321120664166} {"step": 38200, "l2_params": 338.3409127524892, "train/loss": 2.536676824092865, "l2_grads": 1.8828125, "lr": 0.0008249198476763398, "uptime": 72219.18667823101, "examples_seen": 39116800.0, "progress": 0.33924495794961057, "epoch": 30.53216325428301, "img/sec/core": 552.026089349115, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 20.039084798317504, "core_hours": 20.039084798317504} {"step": 38250, "l2_params": 338.37048043712383, "train/loss": 2.7178860902786255, "l2_grads": 1.7734375, "lr": 0.0008243376531512897, "uptime": 72311.858550174, "examples_seen": 39168000.0, "progress": 0.33968899585268597, "epoch": 30.572126818751965, "img/sec/core": 552.4869512886959, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 20.06482698496833, "core_hours": 20.06482698496833} {"step": 38300, "l2_params": 338.3704515763751, "train/loss": 2.858985722064972, "l2_grads": 1.6484375, "lr": 0.0008237546984453961, "uptime": 72404.50769727501, "examples_seen": 39219200.0, "progress": 0.34013303375576137, "epoch": 30.612090383220924, "img/sec/core": 552.6224644483818, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 20.090562859163057, "core_hours": 20.090562859163057} {"step": 38350, "l2_params": 338.370457348525, "train/loss": 4.240697145462036, "l2_grads": 1.6015625, "lr": 0.000823170984924987, "uptime": 72497.22981150901, "examples_seen": 39270400.0, "progress": 0.34057707165883677, "epoch": 30.65205394768988, "img/sec/core": 552.1875813874227, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 20.116319002005834, "core_hours": 20.116319002005834} {"step": 38400, "l2_params": 338.37643291394056, "train/loss": 5.0294671058654785, "l2_grads": 1.859375, "lr": 0.000822586513958166, "uptime": 72589.959741558, "examples_seen": 39321600.0, "progress": 0.34102110956191223, "epoch": 30.692017512158838, "img/sec/core": 552.1410398233494, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 20.142077315908335, "core_hours": 20.142077315908335} {"step": 38450, "l2_params": 338.37644445803625, "train/loss": 4.429851055145264, "l2_grads": 1.4296875, "lr": 0.0008220012869148134, "uptime": 72682.72534561901, "examples_seen": 39372800.0, "progress": 0.34146514746498763, "epoch": 30.731981076627793, "img/sec/core": 551.9287080406586, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 20.167845539258614, "core_hours": 20.167845539258614} {"step": 38500, "l2_params": 338.37642281285645, "train/loss": 2.577742338180542, "l2_grads": 1.7265625, "lr": 0.0008214153051665811, "uptime": 72775.39655551901, "examples_seen": 39424000.0, "progress": 0.34190918536806303, "epoch": 30.77194464109675, "img/sec/core": 552.4908982546929, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 20.193587542008615, "core_hours": 20.193587542008615} {"step": 38550, "l2_params": 338.37643435695253, "train/loss": 2.6035080552101135, "l2_grads": 1.7734375, "lr": 0.0008208285700868891, "uptime": 72867.992193107, "examples_seen": 39475200.0, "progress": 0.34235322327113843, "epoch": 30.811908205565707, "img/sec/core": 552.9418159829222, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 20.21930855244972, "core_hours": 20.21930855244972} {"step": 38600, "l2_params": 338.38235931228746, "train/loss": 3.139124035835266, "l2_grads": 1.6953125, "lr": 0.0008202410830509247, "uptime": 72960.615138576, "examples_seen": 39526400.0, "progress": 0.34279726117421383, "epoch": 30.851871770034663, "img/sec/core": 552.7787929950259, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 20.245037148413335, "core_hours": 20.245037148413335} {"step": 38650, "l2_params": 338.3824718652327, "train/loss": 2.5871005058288574, "l2_grads": 1.7265625, "lr": 0.0008196528454356368, "uptime": 73053.301844332, "examples_seen": 39577600.0, "progress": 0.34324129907728923, "epoch": 30.89183533450362, "img/sec/core": 552.3985298904095, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 20.270783455567777, "core_hours": 20.270783455567777} {"step": 38700, "l2_params": 338.42970905159905, "train/loss": 3.4077318906784058, "l2_grads": 1.6953125, "lr": 0.0008190638586197336, "uptime": 73145.902787663, "examples_seen": 39628800.0, "progress": 0.34368533698036463, "epoch": 30.931798898972577, "img/sec/core": 552.9101341547811, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 20.296505939826385, "core_hours": 20.296505939826385} {"step": 38750, "l2_params": 338.44169838116136, "train/loss": 4.877997994422913, "l2_grads": 1.59375, "lr": 0.0008184741239836789, "uptime": 73238.60126980301, "examples_seen": 39680000.0, "progress": 0.34412937488344003, "epoch": 30.971762463441536, "img/sec/core": 552.3283533668646, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 20.322255518198613, "core_hours": 20.322255518198613} {"step": 38800, "l2_params": 338.48892441721785, "train/loss": 2.5586960911750793, "l2_grads": 1.6484375, "lr": 0.0008178836429096895, "uptime": 73331.228811023, "examples_seen": 39731200.0, "progress": 0.34457341278651543, "epoch": 31.01172602791049, "img/sec/core": 552.7513666631838, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 20.34798539075972, "core_hours": 20.34798539075972} {"step": 38850, "l2_params": 338.49187582569834, "train/loss": 2.5014989376068115, "l2_grads": 1.828125, "lr": 0.0008172924167817329, "uptime": 73423.881084944, "examples_seen": 39782400.0, "progress": 0.3450174506895909, "epoch": 31.051689592379446, "img/sec/core": 552.6038145987972, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 20.373722133515557, "core_hours": 20.373722133515557} {"step": 38900, "l2_params": 338.5096154699671, "train/loss": 5.128792881965637, "l2_grads": 1.5234375, "lr": 0.0008167004469855203, "uptime": 73516.539401688, "examples_seen": 39833600.0, "progress": 0.3454614885926663, "epoch": 31.091653156848405, "img/sec/core": 552.5677758798402, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 20.399460554833336, "core_hours": 20.399460554833336} {"step": 38950, "l2_params": 338.50974817481256, "train/loss": 5.251305460929871, "l2_grads": 1.6171875, "lr": 0.0008161077349085086, "uptime": 73609.18922967701, "examples_seen": 39884800.0, "progress": 0.3459055264957417, "epoch": 31.13161672131736, "img/sec/core": 552.6184031995685, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 20.425196618163614, "core_hours": 20.425196618163614} {"step": 39000, "l2_params": 338.5572272064946, "train/loss": 2.7090153098106384, "l2_grads": 1.7265625, "lr": 0.0008155142819398924, "uptime": 73701.833725628, "examples_seen": 39936000.0, "progress": 0.3463495643988171, "epoch": 31.17158028578632, "img/sec/core": 552.6502084601053, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 20.450931200372224, "core_hours": 20.450931200372224} {"step": 39050, "l2_params": 338.5927535172231, "train/loss": 4.141917824745178, "l2_grads": 1.5, "lr": 0.0008149200894706029, "uptime": 73794.68494475, "examples_seen": 39987200.0, "progress": 0.3467936023018925, "epoch": 31.211543850255275, "img/sec/core": 551.419792697939, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 20.476723205683886, "core_hours": 20.476723205683886} {"step": 39100, "l2_params": 338.59285734769276, "train/loss": 3.2242459058761597, "l2_grads": 1.6796875, "lr": 0.0008143251588933058, "uptime": 73887.351143541, "examples_seen": 40038400.0, "progress": 0.3472376402049679, "epoch": 31.25150741472423, "img/sec/core": 552.5207752988146, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 20.502463816459166, "core_hours": 20.502463816459166} {"step": 39150, "l2_params": 338.59873236989534, "train/loss": 3.826941668987274, "l2_grads": 1.6875, "lr": 0.0008137294916023965, "uptime": 73979.975809144, "examples_seen": 40089600.0, "progress": 0.3476816781080433, "epoch": 31.29147097919319, "img/sec/core": 552.7685273321279, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 20.52819289023778, "core_hours": 20.52819289023778} {"step": 39200, "l2_params": 338.6047082329187, "train/loss": 5.066267609596252, "l2_grads": 1.53125, "lr": 0.0008131330889939963, "uptime": 74072.670081104, "examples_seen": 40140800.0, "progress": 0.3481257160111187, "epoch": 31.331434543662144, "img/sec/core": 552.3534401574624, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 20.553941299115554, "core_hours": 20.553941299115554} {"step": 39250, "l2_params": 338.61641450448764, "train/loss": 2.6627601981163025, "l2_grads": 1.859375, "lr": 0.0008125359524659509, "uptime": 74165.274452463, "examples_seen": 40192000.0, "progress": 0.3485697539141941, "epoch": 31.371398108131103, "img/sec/core": 552.889666531165, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 20.579664735604165, "core_hours": 20.579664735604165} {"step": 39300, "l2_params": 338.61655870338797, "train/loss": 3.982407569885254, "l2_grads": 1.6953125, "lr": 0.0008119380834178253, "uptime": 74257.89156087, "examples_seen": 40243200.0, "progress": 0.34901379181726955, "epoch": 31.41136167260006, "img/sec/core": 552.8136310950266, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 20.605391710161665, "core_hours": 20.605391710161665} {"step": 39350, "l2_params": 338.66381802700005, "train/loss": 2.8471747636795044, "l2_grads": 1.7109375, "lr": 0.0008113394832509018, "uptime": 74350.48569333501, "examples_seen": 40294400.0, "progress": 0.34945782972034495, "epoch": 31.451325237069018, "img/sec/core": 552.950804084164, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 20.631112302513056, "core_hours": 20.631112302513056} {"step": 39400, "l2_params": 338.6638410955988, "train/loss": 2.918548285961151, "l2_grads": 1.734375, "lr": 0.0008107401533681771, "uptime": 74443.08386662, "examples_seen": 40345600.0, "progress": 0.34990186762342035, "epoch": 31.491288801537973, "img/sec/core": 552.9266742921716, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 20.656834017314445, "core_hours": 20.656834017314445} {"step": 39450, "l2_params": 338.7407488358538, "train/loss": 2.480441153049469, "l2_grads": 1.7109375, "lr": 0.000810140095174356, "uptime": 74535.634751595, "examples_seen": 40396800.0, "progress": 0.35034590552649575, "epoch": 31.531252366006928, "img/sec/core": 553.2091888027652, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 20.682542596474168, "core_hours": 20.682542596474168} {"step": 39500, "l2_params": 338.7288248686182, "train/loss": 3.1021485328674316, "l2_grads": 1.734375, "lr": 0.0008095393100758517, "uptime": 74628.233084091, "examples_seen": 40448000.0, "progress": 0.35078994342957115, "epoch": 31.571215930475887, "img/sec/core": 552.9257236053774, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 20.708264355500834, "core_hours": 20.708264355500834} {"step": 39550, "l2_params": 338.7526781490074, "train/loss": 2.448755204677582, "l2_grads": 1.7890625, "lr": 0.0008089377994807825, "uptime": 74720.770933194, "examples_seen": 40499200.0, "progress": 0.35123398133264655, "epoch": 31.611179494944842, "img/sec/core": 553.2871197709828, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 20.733969313585, "core_hours": 20.733969313585} {"step": 39600, "l2_params": 338.77612906608397, "train/loss": 3.0866450667381287, "l2_grads": 1.5234375, "lr": 0.0008083355647989651, "uptime": 74813.385656189, "examples_seen": 40550400.0, "progress": 0.35167801923572195, "epoch": 31.6511430594138, "img/sec/core": 552.8278695252809, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 20.759695625528057, "core_hours": 20.759695625528057} {"step": 39650, "l2_params": 338.7998291303436, "train/loss": 2.822717845439911, "l2_grads": 1.859375, "lr": 0.0008077326074419132, "uptime": 74906.02338860401, "examples_seen": 40601600.0, "progress": 0.35212205713879735, "epoch": 31.691106623882757, "img/sec/core": 552.6905577808022, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 20.785428328976668, "core_hours": 20.785428328976668} {"step": 39700, "l2_params": 338.79996460393113, "train/loss": 2.7370076775550842, "l2_grads": 1.8046875, "lr": 0.0008071289288228353, "uptime": 74998.601585828, "examples_seen": 40652800.0, "progress": 0.35256609504187275, "epoch": 31.731070188351715, "img/sec/core": 553.045982048253, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 20.81114449487222, "core_hours": 20.81114449487222} {"step": 39750, "l2_params": 338.81172754016353, "train/loss": 4.3642942905426025, "l2_grads": 1.5546875, "lr": 0.0008065245303566301, "uptime": 75091.185805595, "examples_seen": 40704000.0, "progress": 0.3530101329449482, "epoch": 31.77103375282067, "img/sec/core": 553.0100067684523, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 20.836862333696388, "core_hours": 20.836862333696388} {"step": 39800, "l2_params": 338.8352320127365, "train/loss": 2.5359201431274414, "l2_grads": 1.859375, "lr": 0.0008059194134598839, "uptime": 75183.80049085, "examples_seen": 40755200.0, "progress": 0.3534541708480236, "epoch": 31.810997317289626, "img/sec/core": 552.8280947997428, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 20.86258863515611, "core_hours": 20.86258863515611} {"step": 39850, "l2_params": 338.8825703460935, "train/loss": 4.554886817932129, "l2_grads": 1.6015625, "lr": 0.0008053135795508661, "uptime": 75276.37150148301, "examples_seen": 40806400.0, "progress": 0.353898208751099, "epoch": 31.850960881758585, "img/sec/core": 553.0889168206148, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 20.88830280477639, "core_hours": 20.88830280477639} {"step": 39900, "l2_params": 338.88271731345344, "train/loss": 3.334020495414734, "l2_grads": 1.6484375, "lr": 0.0008047070300495267, "uptime": 75368.875540383, "examples_seen": 40857600.0, "progress": 0.3543422466541744, "epoch": 31.89092444622754, "img/sec/core": 553.4893460744312, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 20.9139983711375, "core_hours": 20.9139983711375} {"step": 39950, "l2_params": 338.88275765742344, "train/loss": 3.304352283477783, "l2_grads": 1.734375, "lr": 0.0008040997663774937, "uptime": 75461.395233912, "examples_seen": 40908800.0, "progress": 0.3547862845572498, "epoch": 31.9308880106965, "img/sec/core": 553.3956939011179, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 20.939698286006667, "core_hours": 20.939698286006667} {"step": 40000, "l2_params": 338.912527316231, "train/loss": 3.721108317375183, "l2_grads": 1.53125, "lr": 0.0008034917899580681, "uptime": 75553.914254198, "examples_seen": 40960000.0, "progress": 0.3552303224603252, "epoch": 31.970851575165455, "img/sec/core": 553.3997208544795, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 20.965398013863886, "core_hours": 20.965398013863886, "val/acc@1": 0.6035754145408163, "val/loss": 1.6836990121067787, "z/secs/eval/val": 31.502214437990915} {"step": 40050, "l2_params": 338.9300922341877, "train/loss": 4.8807759284973145, "l2_grads": 1.640625, "lr": 0.0008028831022162218, "uptime": 75677.777779159, "examples_seen": 41011200.0, "progress": 0.3556743603634006, "epoch": 32.01081513963441, "img/sec/core": 413.35816993838444, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 20.99980454857528, "core_hours": 20.99980454857528} {"step": 40100, "l2_params": 338.930106640735, "train/loss": 2.788098633289337, "l2_grads": 1.8046875, "lr": 0.0008022737045785937, "uptime": 75770.207926563, "examples_seen": 41062400.0, "progress": 0.356118398266476, "epoch": 32.050778704103365, "img/sec/core": 553.93182244115, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 21.025479589520835, "core_hours": 21.025479589520835} {"step": 40150, "l2_params": 338.93010087811615, "train/loss": 2.440006136894226, "l2_grads": 1.9140625, "lr": 0.0008016635984734867, "uptime": 75862.71856792101, "examples_seen": 41113600.0, "progress": 0.3565624361695514, "epoch": 32.09074226857233, "img/sec/core": 553.4498436981006, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 21.051176989898057, "core_hours": 21.051176989898057} {"step": 40200, "l2_params": 338.96544982029513, "train/loss": 4.902088165283203, "l2_grads": 1.546875, "lr": 0.0008010527853308648, "uptime": 75955.215408453, "examples_seen": 41164800.0, "progress": 0.35700647407262687, "epoch": 32.13070583304128, "img/sec/core": 553.5324201942788, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 21.0768705567125, "core_hours": 21.0768705567125} {"step": 40250, "l2_params": 338.97737410666514, "train/loss": 2.521249294281006, "l2_grads": 1.8671875, "lr": 0.0008004412665823475, "uptime": 76047.73067723401, "examples_seen": 41216000.0, "progress": 0.35745051197570227, "epoch": 32.17066939751024, "img/sec/core": 553.4221612780175, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 21.102569242485004, "core_hours": 21.102569242485004} {"step": 40300, "l2_params": 339.0363901237226, "train/loss": 2.6146055459976196, "l2_grads": 1.890625, "lr": 0.0007998290436612102, "uptime": 76140.240278972, "examples_seen": 41267200.0, "progress": 0.35789454987877767, "epoch": 32.210632961979194, "img/sec/core": 553.4560633501204, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 21.128266354078892, "core_hours": 21.128266354078892} {"step": 40350, "l2_params": 339.0364390906234, "train/loss": 2.531781315803528, "l2_grads": 1.78125, "lr": 0.0007992161180023776, "uptime": 76232.74080456, "examples_seen": 41318400.0, "progress": 0.35833858778185307, "epoch": 32.25059652644815, "img/sec/core": 553.5103684496778, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 21.15396094452, "core_hours": 21.15396094452} {"step": 40400, "l2_params": 339.03646213386844, "train/loss": 2.9467079639434814, "l2_grads": 1.875, "lr": 0.0007986024910424207, "uptime": 76325.265216973, "examples_seen": 41369600.0, "progress": 0.35878262568492847, "epoch": 32.29056009091711, "img/sec/core": 553.3674698895793, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 21.179662170190277, "core_hours": 21.179662170190277} {"step": 40450, "l2_params": 339.0424504440779, "train/loss": 2.494449198246002, "l2_grads": 1.9375, "lr": 0.0007979881642195551, "uptime": 76417.972761824, "examples_seen": 41420800.0, "progress": 0.35922666358800387, "epoch": 32.33052365538607, "img/sec/core": 552.2743600026151, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 21.20541426598222, "core_hours": 21.20541426598222} {"step": 40500, "l2_params": 339.04238707626956, "train/loss": 5.169439911842346, "l2_grads": 1.625, "lr": 0.0007973731389736368, "uptime": 76510.497567589, "examples_seen": 41472000.0, "progress": 0.35967070149107927, "epoch": 32.37048721985502, "img/sec/core": 553.3651173506863, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 21.231115600916944, "core_hours": 21.231115600916944} {"step": 40550, "l2_params": 339.0423726744933, "train/loss": 2.550292670726776, "l2_grads": 1.703125, "lr": 0.0007967574167461598, "uptime": 76602.97585747301, "examples_seen": 41523200.0, "progress": 0.36011473939415467, "epoch": 32.41045078432398, "img/sec/core": 553.643455823193, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 21.25680401477361, "core_hours": 21.25680401477361} {"step": 40600, "l2_params": 339.04238995662473, "train/loss": 2.6698243021965027, "l2_grads": 1.8515625, "lr": 0.0007961409989802487, "uptime": 76695.452300993, "examples_seen": 41574400.0, "progress": 0.36055877729723007, "epoch": 32.45041434879294, "img/sec/core": 553.6545097447677, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 21.28249191575139, "core_hours": 21.28249191575139} {"step": 40650, "l2_params": 339.05425105173066, "train/loss": 2.9191262125968933, "l2_grads": 1.859375, "lr": 0.0007955238871206619, "uptime": 76787.899663861, "examples_seen": 41625600.0, "progress": 0.36100281520030547, "epoch": 32.490377913261895, "img/sec/core": 553.8286697599584, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 21.308171738770277, "core_hours": 21.308171738770277} {"step": 40700, "l2_params": 339.05436338163383, "train/loss": 2.527597665786743, "l2_grads": 1.859375, "lr": 0.0007949060826137824, "uptime": 76880.353645704, "examples_seen": 41676800.0, "progress": 0.3614468531033809, "epoch": 32.53034147773085, "img/sec/core": 553.7890200006927, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 21.33385340039333, "core_hours": 21.33385340039333} {"step": 40750, "l2_params": 339.0543144173216, "train/loss": 4.70506227016449, "l2_grads": 1.765625, "lr": 0.0007942875869076165, "uptime": 76972.797847259, "examples_seen": 41728000.0, "progress": 0.36189089100645633, "epoch": 32.570305042199806, "img/sec/core": 553.8476090308133, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 21.359532345269724, "core_hours": 21.359532345269724} {"step": 40800, "l2_params": 339.05448147200474, "train/loss": 3.6560869812965393, "l2_grads": 1.4765625, "lr": 0.0007936684014517912, "uptime": 77065.23266353601, "examples_seen": 41779200.0, "progress": 0.36233492890953173, "epoch": 32.61026860666876, "img/sec/core": 553.9038434021062, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 21.385208683124446, "core_hours": 21.385208683124446} {"step": 40850, "l2_params": 339.10765540330254, "train/loss": 2.566467046737671, "l2_grads": 1.859375, "lr": 0.0007930485276975499, "uptime": 77157.66577190401, "examples_seen": 41830400.0, "progress": 0.36277896681260713, "epoch": 32.65023217113772, "img/sec/core": 553.9140780180102, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 21.410884546560002, "core_hours": 21.410884546560002} {"step": 40900, "l2_params": 339.10766404270487, "train/loss": 3.9741058349609375, "l2_grads": 1.6015625, "lr": 0.00079242796709775, "uptime": 77250.11388512401, "examples_seen": 41881600.0, "progress": 0.36322300471568253, "epoch": 32.69019573560668, "img/sec/core": 553.8241746281803, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 21.436564578010003, "core_hours": 21.436564578010003} {"step": 40950, "l2_params": 339.1195890878688, "train/loss": 2.484033763408661, "l2_grads": 1.8046875, "lr": 0.0007918067211068578, "uptime": 77342.597834707, "examples_seen": 41932800.0, "progress": 0.36366704261875793, "epoch": 32.730159300075634, "img/sec/core": 553.609574751707, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 21.462254564005278, "core_hours": 21.462254564005278} {"step": 41000, "l2_params": 339.14315572944264, "train/loss": 2.6160436868667603, "l2_grads": 1.765625, "lr": 0.0007911847911809455, "uptime": 77435.076679139, "examples_seen": 41984000.0, "progress": 0.36411108052183333, "epoch": 32.77012286454459, "img/sec/core": 553.640135908569, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 21.48794313190306, "core_hours": 21.48794313190306} {"step": 41050, "l2_params": 339.1490586517601, "train/loss": 2.851637601852417, "l2_grads": 1.71875, "lr": 0.00079056217877769, "uptime": 77527.795756426, "examples_seen": 42035200.0, "progress": 0.36455511842490873, "epoch": 32.810086429013545, "img/sec/core": 552.205667896371, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 21.513698431149447, "core_hours": 21.513698431149447} {"step": 41100, "l2_params": 339.2198079785436, "train/loss": 3.1219034790992737, "l2_grads": 1.7421875, "lr": 0.0007899388853563677, "uptime": 77620.43614892701, "examples_seen": 42086400.0, "progress": 0.36499915632798413, "epoch": 32.85004999348251, "img/sec/core": 552.6746877658396, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 21.539431873510832, "core_hours": 21.539431873510832} {"step": 41150, "l2_params": 339.22583623413766, "train/loss": 4.958850145339966, "l2_grads": 1.6953125, "lr": 0.000789314912377849, "uptime": 77713.111835182, "examples_seen": 42137600.0, "progress": 0.3654431942310596, "epoch": 32.89001355795146, "img/sec/core": 552.4642122327974, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 21.56517511969278, "core_hours": 21.56517511969278} {"step": 41200, "l2_params": 339.2966530191537, "train/loss": 2.7412625551223755, "l2_grads": 1.75, "lr": 0.0007886902613045985, "uptime": 77805.82571429301, "examples_seen": 42188800.0, "progress": 0.365887232134135, "epoch": 32.92997712242042, "img/sec/core": 552.2366283337058, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 21.590928975001393, "core_hours": 21.590928975001393} {"step": 41250, "l2_params": 339.32022750917014, "train/loss": 2.832578659057617, "l2_grads": 1.6640625, "lr": 0.00078806493360067, "uptime": 77898.59992860601, "examples_seen": 42240000.0, "progress": 0.3663312700372104, "epoch": 32.96994068688937, "img/sec/core": 551.8774842680036, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 21.616699590088334, "core_hours": 21.616699590088334} {"step": 41300, "l2_params": 339.32028506909955, "train/loss": 2.486616611480713, "l2_grads": 1.796875, "lr": 0.0007874389307317041, "uptime": 77991.34442136501, "examples_seen": 42291200.0, "progress": 0.3667753079402858, "epoch": 33.00990425135833, "img/sec/core": 552.0543428173884, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 21.642461949188057, "core_hours": 21.642461949188057} {"step": 41350, "l2_params": 339.3674147402782, "train/loss": 4.194086194038391, "l2_grads": 1.6328125, "lr": 0.0007868122541649217, "uptime": 78084.16081457201, "examples_seen": 42342400.0, "progress": 0.3672193458433612, "epoch": 33.04986781582729, "img/sec/core": 551.6266925586323, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 21.668244280634447, "core_hours": 21.668244280634447} {"step": 41400, "l2_params": 339.3675557424796, "train/loss": 2.5051591992378235, "l2_grads": 1.921875, "lr": 0.000786184905369125, "uptime": 78177.028815852, "examples_seen": 42393600.0, "progress": 0.3676633837464366, "epoch": 33.089831380296246, "img/sec/core": 551.3201457371372, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 21.694040947656667, "core_hours": 21.694040947656667} {"step": 41450, "l2_params": 339.39137276343666, "train/loss": 2.4511406421661377, "l2_grads": 1.8515625, "lr": 0.0007855568858146908, "uptime": 78269.894744316, "examples_seen": 42444800.0, "progress": 0.368107421649512, "epoch": 33.1297949447652, "img/sec/core": 551.3324514905063, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 21.719837038896667, "core_hours": 21.719837038896667} {"step": 41500, "l2_params": 339.4207151530384, "train/loss": 2.549681842327118, "l2_grads": 1.828125, "lr": 0.0007849281969735675, "uptime": 78362.755153395, "examples_seen": 42496000.0, "progress": 0.3685514595525874, "epoch": 33.16975850923416, "img/sec/core": 551.3652212800442, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 21.745631596974167, "core_hours": 21.745631596974167} {"step": 41550, "l2_params": 339.42668517571656, "train/loss": 2.4928075075149536, "l2_grads": 1.8359375, "lr": 0.0007842988403192721, "uptime": 78455.623191538, "examples_seen": 42547200.0, "progress": 0.3689954974556628, "epoch": 33.20972207370312, "img/sec/core": 551.3199268962702, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 21.77142827423611, "core_hours": 21.77142827423611} {"step": 41600, "l2_params": 339.4266535276804, "train/loss": 2.927886426448822, "l2_grads": 1.8359375, "lr": 0.0007836688173268882, "uptime": 78548.601999492, "examples_seen": 42598400.0, "progress": 0.36943953535873825, "epoch": 33.249685638172075, "img/sec/core": 550.6631148178392, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 21.79725572089, "core_hours": 21.79725572089} {"step": 41650, "l2_params": 339.4266420193029, "train/loss": 2.529874324798584, "l2_grads": 1.8125, "lr": 0.0007830381294730596, "uptime": 78641.526029998, "examples_seen": 42649600.0, "progress": 0.36988357326181365, "epoch": 33.28964920264103, "img/sec/core": 550.987723210063, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 21.82306795158611, "core_hours": 21.82306795158611} {"step": 41700, "l2_params": 339.4266247567359, "train/loss": 2.415294110774994, "l2_grads": 1.78125, "lr": 0.0007824067782359899, "uptime": 78734.545315186, "examples_seen": 42700800.0, "progress": 0.37032761116488905, "epoch": 33.329612767109985, "img/sec/core": 550.423494402492, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 21.848906641916113, "core_hours": 21.848906641916113} {"step": 41750, "l2_params": 339.4267657343407, "train/loss": 5.090084075927734, "l2_grads": 1.6328125, "lr": 0.0007817747650954357, "uptime": 78827.73268557001, "examples_seen": 42752000.0, "progress": 0.37077164906796445, "epoch": 33.36957633157894, "img/sec/core": 549.4306770221442, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 21.874792022578333, "core_hours": 21.874792022578333} {"step": 41800, "l2_params": 339.42692972862363, "train/loss": 5.077638864517212, "l2_grads": 1.6953125, "lr": 0.0007811420915327065, "uptime": 78920.497634338, "examples_seen": 42803200.0, "progress": 0.37121568697103985, "epoch": 33.4095398960479, "img/sec/core": 551.9326068734739, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 21.900560063902777, "core_hours": 21.900560063902777} {"step": 41850, "l2_params": 339.4268290303891, "train/loss": 5.130733251571655, "l2_grads": 1.7265625, "lr": 0.0007805087590306595, "uptime": 79013.207236138, "examples_seen": 42854400.0, "progress": 0.37165972487411525, "epoch": 33.44950346051686, "img/sec/core": 552.2621066850422, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 21.926312731069444, "core_hours": 21.926312731069444} {"step": 41900, "l2_params": 339.4327644210264, "train/loss": 2.563261330127716, "l2_grads": 1.8671875, "lr": 0.0007798747690736955, "uptime": 79105.942057128, "examples_seen": 42905600.0, "progress": 0.37210376277719065, "epoch": 33.489467024985814, "img/sec/core": 552.1119192705029, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 21.952072403566667, "core_hours": 21.952072403566667} {"step": 41950, "l2_params": 339.4327500358134, "train/loss": 2.510879933834076, "l2_grads": 1.765625, "lr": 0.0007792401231477576, "uptime": 79198.781170267, "examples_seen": 42956800.0, "progress": 0.37254780068026605, "epoch": 33.52943058945477, "img/sec/core": 551.4916964291303, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 21.977861046105275, "core_hours": 21.977861046105275} {"step": 42000, "l2_params": 339.4326809867827, "train/loss": 4.535974740982056, "l2_grads": 1.5078125, "lr": 0.0007786048227403243, "uptime": 79291.658882036, "examples_seen": 43008000.0, "progress": 0.37299183858334145, "epoch": 33.569394153923724, "img/sec/core": 551.2625044783543, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 22.00366041048556, "core_hours": 22.00366041048556} {"step": 42050, "l2_params": 339.46233625304444, "train/loss": 2.9796007871627808, "l2_grads": 1.7890625, "lr": 0.0007779688693404092, "uptime": 79384.79647371, "examples_seen": 43059200.0, "progress": 0.3734358764864169, "epoch": 33.60935771839269, "img/sec/core": 549.7243280587951, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 22.02953196372833, "core_hours": 22.02953196372833} {"step": 42100, "l2_params": 339.4564560394676, "train/loss": 4.289669871330261, "l2_grads": 1.7265625, "lr": 0.0007773322644385577, "uptime": 79477.861912205, "examples_seen": 43110400.0, "progress": 0.3738799143894923, "epoch": 33.64932128286164, "img/sec/core": 550.1505266399092, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 22.055383474421387, "core_hours": 22.055383474421387} {"step": 42150, "l2_params": 339.4860977225356, "train/loss": 2.552078127861023, "l2_grads": 1.8828125, "lr": 0.0007766950095268406, "uptime": 79570.966573903, "examples_seen": 43161600.0, "progress": 0.3743239522925677, "epoch": 33.6892848473306, "img/sec/core": 549.9187588058088, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 22.08124588044861, "core_hours": 22.08124588044861} {"step": 42200, "l2_params": 339.5213945302269, "train/loss": 2.465970814228058, "l2_grads": 1.84375, "lr": 0.0007760571060988518, "uptime": 79664.083971318, "examples_seen": 43212800.0, "progress": 0.3747679901956431, "epoch": 33.72924841179955, "img/sec/core": 549.8435461186119, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 22.107111824175, "core_hours": 22.107111824175} {"step": 42250, "l2_params": 339.5333079205927, "train/loss": 4.585124135017395, "l2_grads": 1.640625, "lr": 0.0007754185556497067, "uptime": 79757.15142887301, "examples_seen": 43264000.0, "progress": 0.3752120280987185, "epoch": 33.76921197626851, "img/sec/core": 550.1385913517439, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 22.132963895718056, "core_hours": 22.132963895718056} {"step": 42300, "l2_params": 339.5568544763527, "train/loss": 3.1698241233825684, "l2_grads": 1.6640625, "lr": 0.0007747793596760361, "uptime": 79850.215998532, "examples_seen": 43315200.0, "progress": 0.3756560660017939, "epoch": 33.80917554073747, "img/sec/core": 550.1556627576649, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 22.15881516506778, "core_hours": 22.15881516506778} {"step": 42350, "l2_params": 339.55690336819833, "train/loss": 4.6691261529922485, "l2_grads": 1.5546875, "lr": 0.0007741395196759844, "uptime": 79943.27005545501, "examples_seen": 43366400.0, "progress": 0.3761001039048693, "epoch": 33.849139105206426, "img/sec/core": 550.2178163211403, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 22.18466351421306, "core_hours": 22.18466351421306} {"step": 42400, "l2_params": 339.58056331947944, "train/loss": 3.8397783041000366, "l2_grads": 1.5625, "lr": 0.0007734990371492046, "uptime": 80036.349720611, "examples_seen": 43417600.0, "progress": 0.3765441418079447, "epoch": 33.88910266967538, "img/sec/core": 550.0664394762587, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 22.210518976756386, "core_hours": 22.210518976756386} {"step": 42450, "l2_params": 339.5805978289617, "train/loss": 4.56880509853363, "l2_grads": 1.7734375, "lr": 0.0007728579135968564, "uptime": 80129.421237079, "examples_seen": 43468800.0, "progress": 0.3769881797110201, "epoch": 33.92906623414434, "img/sec/core": 550.1145994285308, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 22.236372175775276, "core_hours": 22.236372175775276} {"step": 42500, "l2_params": 339.5806007047517, "train/loss": 2.415768265724182, "l2_grads": 1.7578125, "lr": 0.0007722161505216015, "uptime": 80222.512142167, "examples_seen": 43520000.0, "progress": 0.37743221761409557, "epoch": 33.9690297986133, "img/sec/core": 550.000023650001, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 22.262230760521945, "core_hours": 22.262230760521945, "val/acc@1": 0.6134008290816326, "val/loss": 1.6324903198650904, "z/secs/eval/val": 31.6988427460019} {"step": 42550, "l2_params": 339.58057769843083, "train/loss": 2.718576490879059, "l2_grads": 1.8515625, "lr": 0.0007715737494276011, "uptime": 80346.946909301, "examples_seen": 43571200.0, "progress": 0.37787625551717097, "epoch": 34.008993363082254, "img/sec/core": 411.46056829010837, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 22.29679597361472, "core_hours": 22.29679597361472} {"step": 42600, "l2_params": 339.60414685704296, "train/loss": 2.61942857503891, "l2_grads": 1.8984375, "lr": 0.0007709307118205112, "uptime": 80439.956534597, "examples_seen": 43622400.0, "progress": 0.37832029342024637, "epoch": 34.04895692755121, "img/sec/core": 550.4806608676695, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 22.32263198064139, "core_hours": 22.32263198064139} {"step": 42650, "l2_params": 339.65122851426577, "train/loss": 2.471401810646057, "l2_grads": 1.8046875, "lr": 0.0007702870392074796, "uptime": 80533.00837223801, "examples_seen": 43673600.0, "progress": 0.37876433132332177, "epoch": 34.088920492020165, "img/sec/core": 550.2309389904893, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 22.348479713319445, "core_hours": 22.348479713319445} {"step": 42700, "l2_params": 339.6573123660817, "train/loss": 2.3614822030067444, "l2_grads": 1.703125, "lr": 0.0007696427330971433, "uptime": 80626.10059182001, "examples_seen": 43724800.0, "progress": 0.37920836922639717, "epoch": 34.12888405648912, "img/sec/core": 549.9922574614246, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 22.374338663203336, "core_hours": 22.374338663203336} {"step": 42750, "l2_params": 339.6573238666436, "train/loss": 4.465772747993469, "l2_grads": 1.7265625, "lr": 0.0007689977949996231, "uptime": 80719.226517886, "examples_seen": 43776000.0, "progress": 0.37965240712947257, "epoch": 34.16884762095808, "img/sec/core": 549.7931903916982, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 22.400206975999442, "core_hours": 22.400206975999442} {"step": 42800, "l2_params": 339.65726636383033, "train/loss": 2.527989149093628, "l2_grads": 1.796875, "lr": 0.0007683522264265214, "uptime": 80812.355813343, "examples_seen": 43827200.0, "progress": 0.38009644503254797, "epoch": 34.20881118542704, "img/sec/core": 549.773299032798, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 22.426076224737503, "core_hours": 22.426076224737503} {"step": 42850, "l2_params": 339.65734686776614, "train/loss": 2.6040461659431458, "l2_grads": 1.8671875, "lr": 0.000767706028890918, "uptime": 80905.52516467801, "examples_seen": 43878400.0, "progress": 0.38054048293562337, "epoch": 34.24877474989599, "img/sec/core": 549.5369374839057, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 22.451956600108335, "core_hours": 22.451956600108335} {"step": 42900, "l2_params": 339.66911748788704, "train/loss": 2.627787411212921, "l2_grads": 1.875, "lr": 0.0007670592039073683, "uptime": 80998.64005110701, "examples_seen": 43929600.0, "progress": 0.38098452083869877, "epoch": 34.28873831436495, "img/sec/core": 549.8583734947637, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 22.477821846338614, "core_hours": 22.477821846338614} {"step": 42950, "l2_params": 339.68087907530946, "train/loss": 2.7842790484428406, "l2_grads": 1.796875, "lr": 0.000766411752991897, "uptime": 81091.799603034, "examples_seen": 43980800.0, "progress": 0.38142855874177417, "epoch": 34.328701878833904, "img/sec/core": 549.5947430074127, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 22.503699499651663, "core_hours": 22.503699499651663} {"step": 43000, "l2_params": 339.7045735129644, "train/loss": 2.5071746110916138, "l2_grads": 1.8515625, "lr": 0.0007657636776619951, "uptime": 81185.02413418201, "examples_seen": 44032000.0, "progress": 0.3818725966448496, "epoch": 34.368665443302866, "img/sec/core": 549.2116653149226, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 22.529595202748336, "core_hours": 22.529595202748336} {"step": 43050, "l2_params": 339.70455051503944, "train/loss": 2.470816433429718, "l2_grads": 1.8046875, "lr": 0.0007651149794366191, "uptime": 81278.455434963, "examples_seen": 44083200.0, "progress": 0.382316634547925, "epoch": 34.40862900777182, "img/sec/core": 547.9962236639769, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 22.555548341854166, "core_hours": 22.555548341854166} {"step": 43100, "l2_params": 339.71038331386046, "train/loss": 4.696271061897278, "l2_grads": 1.6328125, "lr": 0.0007644656598361838, "uptime": 81371.655243036, "examples_seen": 44134400.0, "progress": 0.3827606724510004, "epoch": 34.44859257224078, "img/sec/core": 549.3573544689965, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 22.58143717743, "core_hours": 22.58143717743} {"step": 43150, "l2_params": 339.71333273438063, "train/loss": 5.036544322967529, "l2_grads": 1.75, "lr": 0.0007638157203825614, "uptime": 81464.819108953, "examples_seen": 44185600.0, "progress": 0.38320471035407583, "epoch": 34.48855613670973, "img/sec/core": 549.5692938034053, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 22.607316029073612, "core_hours": 22.607316029073612} {"step": 43200, "l2_params": 339.71332411038134, "train/loss": 2.879888892173767, "l2_grads": 1.9375, "lr": 0.000763165162599076, "uptime": 81559.530997851, "examples_seen": 44236800.0, "progress": 0.38364874825715123, "epoch": 34.52851970117869, "img/sec/core": 540.5868322944938, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 22.633624887100833, "core_hours": 22.633624887100833} {"step": 43250, "l2_params": 339.71042930891895, "train/loss": 2.527442991733551, "l2_grads": 1.8203125, "lr": 0.0007625139880105012, "uptime": 81652.62775106, "examples_seen": 44288000.0, "progress": 0.38409278616022663, "epoch": 34.56848326564765, "img/sec/core": 549.965473930732, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 22.659485096325557, "core_hours": 22.659485096325557} {"step": 43300, "l2_params": 339.7132781157148, "train/loss": 3.3386523127555847, "l2_grads": 1.6015625, "lr": 0.0007618621981430568, "uptime": 81745.769233294, "examples_seen": 44339200.0, "progress": 0.38453682406330203, "epoch": 34.608446830116605, "img/sec/core": 549.7013658357856, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 22.685357730279446, "core_hours": 22.685357730279446} {"step": 43350, "l2_params": 339.71332411038134, "train/loss": 4.111621201038361, "l2_grads": 1.5703125, "lr": 0.0007612097945244047, "uptime": 81839.680454737, "examples_seen": 44390400.0, "progress": 0.38498086196637743, "epoch": 34.64841039458556, "img/sec/core": 545.1957626925424, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 22.711444180680278, "core_hours": 22.711444180680278} {"step": 43400, "l2_params": 339.7251100384324, "train/loss": 2.7383862137794495, "l2_grads": 1.8984375, "lr": 0.0007605567786836452, "uptime": 81932.834816876, "examples_seen": 44441600.0, "progress": 0.38542489986945283, "epoch": 34.688373959054516, "img/sec/core": 549.6253618655186, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 22.737320392385552, "core_hours": 22.737320392385552} {"step": 43450, "l2_params": 339.7369501724827, "train/loss": 2.6100679636001587, "l2_grads": 1.8515625, "lr": 0.0007599031521513125, "uptime": 82026.001444733, "examples_seen": 44492800.0, "progress": 0.3858689377725283, "epoch": 34.72833752352348, "img/sec/core": 549.5530017313016, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 22.763200011234723, "core_hours": 22.763200011234723} {"step": 43500, "l2_params": 339.7606119571543, "train/loss": 2.7027682065963745, "l2_grads": 1.734375, "lr": 0.0007592489164593735, "uptime": 82119.23588184001, "examples_seen": 44544000.0, "progress": 0.3863129756756037, "epoch": 34.768301087992434, "img/sec/core": 549.1533127532795, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 22.78909846598667, "core_hours": 22.78909846598667} {"step": 43550, "l2_params": 339.77236750323004, "train/loss": 2.4848830103874207, "l2_grads": 1.984375, "lr": 0.0007585940731412223, "uptime": 82214.00634073, "examples_seen": 44595200.0, "progress": 0.3867570135786791, "epoch": 34.80826465246139, "img/sec/core": 540.2527390885691, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 22.81542359345611, "core_hours": 22.81542359345611} {"step": 43600, "l2_params": 339.8018637980448, "train/loss": 3.022560775279999, "l2_grads": 1.765625, "lr": 0.000757938623731676, "uptime": 82307.18004179001, "examples_seen": 44646400.0, "progress": 0.3872010514817545, "epoch": 34.848228216930345, "img/sec/core": 549.5112828782752, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 22.84130517708389, "core_hours": 22.84130517708389} {"step": 43650, "l2_params": 339.79591473688293, "train/loss": 3.7578097581863403, "l2_grads": 1.59375, "lr": 0.0007572825697669749, "uptime": 82400.450113072, "examples_seen": 44697600.0, "progress": 0.3876450893848299, "epoch": 34.8881917813993, "img/sec/core": 548.9435067032555, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 22.86721353021778, "core_hours": 22.86721353021778} {"step": 43700, "l2_params": 339.8018551762924, "train/loss": 2.4550082683563232, "l2_grads": 1.875, "lr": 0.000756625912784774, "uptime": 82493.70109571201, "examples_seen": 44748800.0, "progress": 0.3880891272879053, "epoch": 34.92815534586826, "img/sec/core": 549.0558764153411, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 22.893116580951112, "core_hours": 22.893116580951112} {"step": 43750, "l2_params": 339.80196725905665, "train/loss": 3.4674111008644104, "l2_grads": 1.6328125, "lr": 0.000755968654324143, "uptime": 82587.609176043, "examples_seen": 44800000.0, "progress": 0.3885331651909807, "epoch": 34.96811891033722, "img/sec/core": 545.2139988331006, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 22.919202158820834, "core_hours": 22.919202158820834} {"step": 43800, "l2_params": 339.8019097807206, "train/loss": 3.9257653951644897, "l2_grads": 1.75, "lr": 0.00075531079592556, "uptime": 82680.77126772501, "examples_seen": 44851200.0, "progress": 0.3889772030940561, "epoch": 35.00808247480617, "img/sec/core": 549.5797601320584, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 22.94508051762139, "core_hours": 22.94508051762139} {"step": 43850, "l2_params": 339.8372082703717, "train/loss": 2.556161880493164, "l2_grads": 1.78125, "lr": 0.0007546523391309106, "uptime": 82775.411466734, "examples_seen": 44902400.0, "progress": 0.3894212409971315, "epoch": 35.04804603927513, "img/sec/core": 540.9963264672982, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 22.971369461790555, "core_hours": 22.971369461790555} {"step": 43900, "l2_params": 339.83129143830325, "train/loss": 4.079185962677002, "l2_grads": 1.6328125, "lr": 0.000753993285483482, "uptime": 82868.85857702201, "examples_seen": 44953600.0, "progress": 0.38986527890020695, "epoch": 35.088009603744084, "img/sec/core": 547.9035129304795, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 22.997326992426114, "core_hours": 22.997326992426114} {"step": 43950, "l2_params": 339.86653515571373, "train/loss": 2.406024396419525, "l2_grads": 1.9296875, "lr": 0.0007533336365279608, "uptime": 82962.085685778, "examples_seen": 45004800.0, "progress": 0.39030931680328235, "epoch": 35.127973168213046, "img/sec/core": 549.1964803285684, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 23.023223411525, "core_hours": 23.023223411525} {"step": 44001, "l2_params": 339.8724168943767, "train/loss": 3.225381910800934, "l2_grads": 1.671875, "lr": 0.000752673393810428, "uptime": 83056.637636928, "examples_seen": 45056000.0, "progress": 0.39075335470635775, "epoch": 35.167936732682, "img/sec/core": 541.5012527745038, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 23.0494878424, "core_hours": 23.0494878424} {"step": 44050, "l2_params": 339.872468614148, "train/loss": 2.538963556289673, "l2_grads": 1.859375, "lr": 0.0007520125588783571, "uptime": 83150.07785156301, "examples_seen": 45107200.0, "progress": 0.39119739260943315, "epoch": 35.20790029715096, "img/sec/core": 547.9439468327142, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 23.07544345757639, "core_hours": 23.07544345757639} {"step": 44100, "l2_params": 339.89613245721847, "train/loss": 2.5202351808547974, "l2_grads": 1.9609375, "lr": 0.0007513511332806101, "uptime": 83244.889668823, "examples_seen": 45158400.0, "progress": 0.39164143051250855, "epoch": 35.24786386161991, "img/sec/core": 540.0170725511897, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 23.101780073481944, "core_hours": 23.101780073481944} {"step": 44150, "l2_params": 339.89601753238446, "train/loss": 4.097069501876831, "l2_grads": 1.6875, "lr": 0.0007506891185674322, "uptime": 83339.345131618, "examples_seen": 45209600.0, "progress": 0.39208546841558395, "epoch": 35.28782742608887, "img/sec/core": 542.0544083418665, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 23.12801770203611, "core_hours": 23.12801770203611} {"step": 44200, "l2_params": 339.89601178614174, "train/loss": 3.639986574649811, "l2_grads": 1.6640625, "lr": 0.0007500265162904502, "uptime": 83432.55711285201, "examples_seen": 45260800.0, "progress": 0.39252950631865935, "epoch": 35.32779099055783, "img/sec/core": 549.2856103064887, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 23.153909919045557, "core_hours": 23.153909919045557} {"step": 44250, "l2_params": 339.8960692485646, "train/loss": 2.997315764427185, "l2_grads": 1.703125, "lr": 0.0007493633280026674, "uptime": 83527.05902728101, "examples_seen": 45312000.0, "progress": 0.39297354422173475, "epoch": 35.367754555026785, "img/sec/core": 541.7879659831437, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 23.18016045083139, "core_hours": 23.18016045083139} {"step": 44300, "l2_params": 339.94914314037476, "train/loss": 3.9109928607940674, "l2_grads": 1.671875, "lr": 0.0007486995552584609, "uptime": 83620.527961988, "examples_seen": 45363200.0, "progress": 0.39341758212481015, "epoch": 35.40771811949574, "img/sec/core": 547.7755808440671, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 23.206124043805556, "core_hours": 23.206124043805556} {"step": 44350, "l2_params": 339.9668096162109, "train/loss": 2.7101640701293945, "l2_grads": 1.8671875, "lr": 0.0007480351996135777, "uptime": 83714.875529173, "examples_seen": 45414400.0, "progress": 0.3938616200278856, "epoch": 35.447681683964696, "img/sec/core": 542.6743002244426, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 23.232331701356944, "core_hours": 23.232331701356944} {"step": 44400, "l2_params": 339.9962000017427, "train/loss": 4.563546538352966, "l2_grads": 1.734375, "lr": 0.0007473702626251314, "uptime": 83809.38015909301, "examples_seen": 45465600.0, "progress": 0.394305657930961, "epoch": 35.48764524843365, "img/sec/core": 541.7723982765676, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 23.258582987445834, "core_hours": 23.258582987445834} {"step": 44450, "l2_params": 340.00792442511545, "train/loss": 2.534240424633026, "l2_grads": 1.9609375, "lr": 0.0007467047458515975, "uptime": 83902.776980301, "examples_seen": 45516800.0, "progress": 0.3947496958340364, "epoch": 35.52760881290261, "img/sec/core": 548.1985290053797, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 23.284526548892497, "core_hours": 23.284526548892497} {"step": 44500, "l2_params": 340.00504362067926, "train/loss": 4.445703148841858, "l2_grads": 1.734375, "lr": 0.0007460386508528106, "uptime": 83997.46287180501, "examples_seen": 45568000.0, "progress": 0.3951937337371118, "epoch": 35.56757237737157, "img/sec/core": 540.7352583022731, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 23.31082818542139, "core_hours": 23.31082818542139} {"step": 44550, "l2_params": 340.0050177708779, "train/loss": 2.471441686153412, "l2_grads": 1.8671875, "lr": 0.000745371979189961, "uptime": 84090.72286377501, "examples_seen": 45619200.0, "progress": 0.3956377716401872, "epoch": 35.607535941840524, "img/sec/core": 549.0028351757716, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 23.33673373874639, "core_hours": 23.33673373874639} {"step": 44600, "l2_params": 340.0169860187135, "train/loss": 3.1996891498565674, "l2_grads": 1.6640625, "lr": 0.0007447047324255897, "uptime": 84184.085125362, "examples_seen": 45670400.0, "progress": 0.3960818095432626, "epoch": 35.64749950630948, "img/sec/core": 548.4014539674642, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 23.362667700298335, "core_hours": 23.362667700298335} {"step": 44650, "l2_params": 340.0639789298846, "train/loss": 2.479162096977234, "l2_grads": 1.8359375, "lr": 0.0007440369121235861, "uptime": 84277.685332537, "examples_seen": 45721600.0, "progress": 0.396525847446338, "epoch": 35.68746307077844, "img/sec/core": 547.0073362580838, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 23.388667757846942, "core_hours": 23.388667757846942} {"step": 44700, "l2_params": 340.0640478507321, "train/loss": 3.3377737402915955, "l2_grads": 1.671875, "lr": 0.0007433685198491837, "uptime": 84371.231256382, "examples_seen": 45772800.0, "progress": 0.3969698853494134, "epoch": 35.7274266352474, "img/sec/core": 547.3247566065644, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 23.41465273669278, "core_hours": 23.41465273669278} {"step": 44750, "l2_params": 340.1109969324353, "train/loss": 5.103677988052368, "l2_grads": 1.546875, "lr": 0.0007426995571689567, "uptime": 84464.723729553, "examples_seen": 45824000.0, "progress": 0.3974139232524888, "epoch": 35.76739019971635, "img/sec/core": 547.6376681826683, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 23.440622868129164, "core_hours": 23.440622868129164} {"step": 44800, "l2_params": 340.11103425940183, "train/loss": 3.2754522562026978, "l2_grads": 1.828125, "lr": 0.0007420300256508162, "uptime": 84558.180990905, "examples_seen": 45875200.0, "progress": 0.39785796115556427, "epoch": 35.80735376418531, "img/sec/core": 547.8440011970733, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 23.46658321850472, "core_hours": 23.46658321850472} {"step": 44850, "l2_params": 340.11112039853975, "train/loss": 2.5066086053848267, "l2_grads": 1.78125, "lr": 0.0007413599268640071, "uptime": 84651.608673422, "examples_seen": 45926400.0, "progress": 0.39830199905863967, "epoch": 35.84731732865426, "img/sec/core": 548.0174464424578, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 23.49253535253722, "core_hours": 23.49253535253722} {"step": 44900, "l2_params": 340.1143075313063, "train/loss": 2.4910680055618286, "l2_grads": 1.828125, "lr": 0.0007406892623791028, "uptime": 84744.831043179, "examples_seen": 45977600.0, "progress": 0.39874603696171507, "epoch": 35.887280893123226, "img/sec/core": 549.224398966269, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 23.518430455247497, "core_hours": 23.518430455247497} {"step": 44950, "l2_params": 340.11420416530683, "train/loss": 2.3872098326683044, "l2_grads": 1.890625, "lr": 0.0007400180337680034, "uptime": 84839.05960678401, "examples_seen": 46028800.0, "progress": 0.39919007486479047, "epoch": 35.92724445759218, "img/sec/core": 543.3596569997932, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 23.54460505624889, "core_hours": 23.54460505624889} {"step": 45000, "l2_params": 340.1259934292732, "train/loss": 2.5791298747062683, "l2_grads": 1.8671875, "lr": 0.0007393462426039304, "uptime": 84932.358262265, "examples_seen": 46080000.0, "progress": 0.39963411276786587, "epoch": 35.967208022061136, "img/sec/core": 548.7753251753128, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 23.570521349438057, "core_hours": 23.570521349438057, "val/acc@1": 0.6202168367346939, "val/loss": 1.5964800396135874, "z/secs/eval/val": 31.740153089005616} {"step": 45050, "l2_params": 340.1494042145304, "train/loss": 2.409615933895111, "l2_grads": 1.984375, "lr": 0.0007386738904614249, "uptime": 85057.212484963, "examples_seen": 46131200.0, "progress": 0.40007815067094127, "epoch": 36.00717158653009, "img/sec/core": 410.0782407963973, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 23.605203077965278, "core_hours": 23.605203077965278} {"step": 45100, "l2_params": 340.14939847256824, "train/loss": 4.332622051239014, "l2_grads": 1.59375, "lr": 0.000738000978916342, "uptime": 85150.406697558, "examples_seen": 46182400.0, "progress": 0.40052218857401667, "epoch": 36.04713515099905, "img/sec/core": 549.3903384591339, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 23.631090359241668, "core_hours": 23.631090359241668} {"step": 45150, "l2_params": 340.14951905375375, "train/loss": 2.4059168100357056, "l2_grads": 1.9296875, "lr": 0.000737327509545848, "uptime": 85244.258490614, "examples_seen": 46233600.0, "progress": 0.40096622647709207, "epoch": 36.08709871546801, "img/sec/core": 545.5409889660295, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 23.657160301757223, "core_hours": 23.657160301757223} {"step": 45200, "l2_params": 340.1553069003922, "train/loss": 3.0013322830200195, "l2_grads": 1.7421875, "lr": 0.0007366534839284169, "uptime": 85337.52330092901, "examples_seen": 46284800.0, "progress": 0.40141026438016747, "epoch": 36.127062279936965, "img/sec/core": 548.9744720121749, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 23.683067193511388, "core_hours": 23.683067193511388} {"step": 45250, "l2_params": 340.1552839329414, "train/loss": 2.389579474925995, "l2_grads": 1.890625, "lr": 0.000735978903643826, "uptime": 85431.722168847, "examples_seen": 46336000.0, "progress": 0.40185430228324287, "epoch": 36.16702584440592, "img/sec/core": 543.5309482123903, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 23.709233545710834, "core_hours": 23.709233545710834} {"step": 45300, "l2_params": 340.16729569801385, "train/loss": 2.9151695370674133, "l2_grads": 1.84375, "lr": 0.0007353037702731531, "uptime": 85525.039699592, "examples_seen": 46387200.0, "progress": 0.4022983401863183, "epoch": 36.206989408874875, "img/sec/core": 548.6643248191955, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 23.73515508202889, "core_hours": 23.73515508202889} {"step": 45350, "l2_params": 340.1673100521639, "train/loss": 4.383794069290161, "l2_grads": 1.7109375, "lr": 0.000734628085398773, "uptime": 85618.443968684, "examples_seen": 46438400.0, "progress": 0.4027423780893937, "epoch": 36.24695297334383, "img/sec/core": 548.1548166665485, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 23.761100712332222, "core_hours": 23.761100712332222} {"step": 45400, "l2_params": 340.1908500432147, "train/loss": 2.442841351032257, "l2_grads": 1.875, "lr": 0.0007339518506043514, "uptime": 85713.010858768, "examples_seen": 46489600.0, "progress": 0.4031864159924691, "epoch": 36.28691653781279, "img/sec/core": 541.4157106628281, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 23.787369292911112, "core_hours": 23.787369292911112} {"step": 45450, "l2_params": 340.19092467962014, "train/loss": 2.767353057861328, "l2_grads": 1.84375, "lr": 0.000733275067474844, "uptime": 85806.204215526, "examples_seen": 46540800.0, "progress": 0.4036304538955445, "epoch": 36.32688010228175, "img/sec/core": 549.395383760612, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 23.813256336455, "core_hours": 23.813256336455} {"step": 45500, "l2_params": 340.1909131970973, "train/loss": 4.502415299415588, "l2_grads": 1.6484375, "lr": 0.0007325977375964911, "uptime": 85899.552925612, "examples_seen": 46592000.0, "progress": 0.40407449179861993, "epoch": 36.366843666750704, "img/sec/core": 548.4810658104062, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 23.839186533701113, "core_hours": 23.839186533701113} {"step": 45550, "l2_params": 340.1908615257397, "train/loss": 4.449675679206848, "l2_grads": 1.5703125, "lr": 0.0007319198625568152, "uptime": 85994.31648814201, "examples_seen": 46643200.0, "progress": 0.40451852970169533, "epoch": 36.40680723121966, "img/sec/core": 540.2920556494464, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 23.865509745515002, "core_hours": 23.865509745515002} {"step": 45600, "l2_params": 340.1909964453792, "train/loss": 2.4632335901260376, "l2_grads": 1.875, "lr": 0.0007312414439446163, "uptime": 86087.62106582601, "examples_seen": 46694400.0, "progress": 0.40496256760477073, "epoch": 36.44677079568862, "img/sec/core": 548.740493455761, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 23.891427683760558, "core_hours": 23.891427683760558} {"step": 45650, "l2_params": 340.19100218663925, "train/loss": 2.4546236395835876, "l2_grads": 1.8046875, "lr": 0.000730562483349968, "uptime": 86180.914231649, "examples_seen": 46745600.0, "progress": 0.40540660550784613, "epoch": 36.48673436015758, "img/sec/core": 548.8076168102436, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 23.917342452044725, "core_hours": 23.917342452044725} {"step": 45700, "l2_params": 340.26149468552126, "train/loss": 2.456167995929718, "l2_grads": 1.8046875, "lr": 0.0007298829823642146, "uptime": 86274.26524475, "examples_seen": 46796800.0, "progress": 0.40585064341092153, "epoch": 36.52669792462653, "img/sec/core": 548.4675345152, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 23.94327328901722, "core_hours": 23.94327328901722} {"step": 45750, "l2_params": 340.273241537224, "train/loss": 5.110775470733643, "l2_grads": 1.734375, "lr": 0.0007292029425799669, "uptime": 86368.83701674601, "examples_seen": 46848000.0, "progress": 0.406294681313997, "epoch": 36.56666148909549, "img/sec/core": 541.3877621132125, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 23.96954322568278, "core_hours": 23.96954322568278} {"step": 45800, "l2_params": 340.3025652819855, "train/loss": 4.742993116378784, "l2_grads": 1.7265625, "lr": 0.0007285223655910981, "uptime": 86463.500567669, "examples_seen": 46899200.0, "progress": 0.4067387192170724, "epoch": 36.60662505356444, "img/sec/core": 540.8628717260818, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 23.995838656494723, "core_hours": 23.995838656494723} {"step": 45850, "l2_params": 340.3026915482744, "train/loss": 2.452156662940979, "l2_grads": 1.8125, "lr": 0.0007278412529927411, "uptime": 86556.724208099, "examples_seen": 46950400.0, "progress": 0.4071827571201478, "epoch": 36.646588618033405, "img/sec/core": 549.2169128328569, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 24.02173411216972, "core_hours": 24.02173411216972} {"step": 45900, "l2_params": 340.31454602231594, "train/loss": 3.352443218231201, "l2_grads": 1.6640625, "lr": 0.0007271596063812842, "uptime": 86650.94272424601, "examples_seen": 47001600.0, "progress": 0.4076267950232232, "epoch": 36.68655218250236, "img/sec/core": 543.417600847283, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 24.047905922210557, "core_hours": 24.047905922210557} {"step": 45950, "l2_params": 340.31441402124744, "train/loss": 3.2530753016471863, "l2_grads": 1.75, "lr": 0.0007264774273543666, "uptime": 86744.330676696, "examples_seen": 47052800.0, "progress": 0.4080708329262986, "epoch": 36.726515746971316, "img/sec/core": 548.2505896830334, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 24.07384702011333, "core_hours": 24.07384702011333} {"step": 46000, "l2_params": 340.3142934984879, "train/loss": 2.6544498801231384, "l2_grads": 1.875, "lr": 0.0007257947175108763, "uptime": 86838.66043261801, "examples_seen": 47104000.0, "progress": 0.408514870829374, "epoch": 36.76647931144027, "img/sec/core": 542.776767516839, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 24.10004973009167, "core_hours": 24.10004973009167} {"step": 46050, "l2_params": 340.3377946292845, "train/loss": 3.666459083557129, "l2_grads": 1.65625, "lr": 0.0007251114784509444, "uptime": 86932.12901457801, "examples_seen": 47155200.0, "progress": 0.4089589087324494, "epoch": 36.80644287590923, "img/sec/core": 547.7776481289952, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 24.126013225080555, "core_hours": 24.126013225080555} {"step": 46100, "l2_params": 340.34964501138387, "train/loss": 2.6133033633232117, "l2_grads": 1.8515625, "lr": 0.0007244277117759437, "uptime": 87026.539421104, "examples_seen": 47206400.0, "progress": 0.4094029466355248, "epoch": 36.84640644037819, "img/sec/core": 542.3130975069561, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 24.152238338004445, "core_hours": 24.152238338004445} {"step": 46150, "l2_params": 340.3497425672965, "train/loss": 5.020360946655273, "l2_grads": 1.6484375, "lr": 0.0007237434190884819, "uptime": 87120.864072248, "examples_seen": 47257600.0, "progress": 0.4098469845386002, "epoch": 36.886370004847144, "img/sec/core": 542.8061421804928, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 24.178439629988887, "core_hours": 24.178439629988887} {"step": 46200, "l2_params": 340.3496880507605, "train/loss": 3.5881775617599487, "l2_grads": 1.796875, "lr": 0.0007230586019924008, "uptime": 87214.70990567701, "examples_seen": 47308800.0, "progress": 0.41029102244167565, "epoch": 36.9263335693161, "img/sec/core": 545.5756332403768, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 24.204507917052503, "core_hours": 24.204507917052503} {"step": 46250, "l2_params": 340.34986307750296, "train/loss": 2.5038098096847534, "l2_grads": 1.9375, "lr": 0.0007223732620927716, "uptime": 87309.079634982, "examples_seen": 47360000.0, "progress": 0.41073506034475105, "epoch": 36.966297133785055, "img/sec/core": 542.5468566782434, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 24.230721730748332, "core_hours": 24.230721730748332} {"step": 46301, "l2_params": 340.3499807183776, "train/loss": 2.41403067111969, "l2_grads": 1.890625, "lr": 0.0007216874009958894, "uptime": 87402.63250976401, "examples_seen": 47411200.0, "progress": 0.41117909824782645, "epoch": 37.00626069825401, "img/sec/core": 547.2840906204593, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 24.25670864041, "core_hours": 24.25670864041} {"step": 46350, "l2_params": 340.3500008034009, "train/loss": 2.558478832244873, "l2_grads": 1.8828125, "lr": 0.0007210010203092726, "uptime": 87497.78846121501, "examples_seen": 47462400.0, "progress": 0.41162313615090185, "epoch": 37.04622426272297, "img/sec/core": 538.0640855276895, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 24.28314084914639, "core_hours": 24.28314084914639} {"step": 46400, "l2_params": 340.35001228055654, "train/loss": 3.4525644779205322, "l2_grads": 1.6171875, "lr": 0.0007203141216416557, "uptime": 87592.050279741, "examples_seen": 47513600.0, "progress": 0.41206717405397725, "epoch": 37.08618782719193, "img/sec/core": 543.1679634515185, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 24.309324687625836, "core_hours": 24.309324687625836} {"step": 46451, "l2_params": 340.3615753182562, "train/loss": 4.072111785411835, "l2_grads": 1.7421875, "lr": 0.0007196267066029882, "uptime": 87687.052484221, "examples_seen": 47564800.0, "progress": 0.41251121195705265, "epoch": 37.12615139166088, "img/sec/core": 538.9348624092116, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 24.335714188870277, "core_hours": 24.335714188870277} {"step": 46500, "l2_params": 340.36179337673167, "train/loss": 3.0587769746780396, "l2_grads": 1.765625, "lr": 0.0007189387768044304, "uptime": 87781.650860276, "examples_seen": 47616000.0, "progress": 0.41295524986012805, "epoch": 37.16611495612984, "img/sec/core": 541.2355067303869, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 24.361991515552223, "core_hours": 24.361991515552223} {"step": 46550, "l2_params": 340.3618048534897, "train/loss": 4.021058559417725, "l2_grads": 1.6015625, "lr": 0.0007182503338583484, "uptime": 87875.765669887, "examples_seen": 47667200.0, "progress": 0.41339928776320345, "epoch": 37.2060785205988, "img/sec/core": 544.0164009428892, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 24.388134518221943, "core_hours": 24.388134518221943} {"step": 46600, "l2_params": 340.36179050754214, "train/loss": 2.387951076030731, "l2_grads": 1.84375, "lr": 0.0007175613793783111, "uptime": 87969.527883384, "examples_seen": 47718400.0, "progress": 0.41384332566627885, "epoch": 37.24604208506776, "img/sec/core": 546.062193824358, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 24.414179577526667, "core_hours": 24.414179577526667} {"step": 46650, "l2_params": 340.3616527864148, "train/loss": 5.100783467292786, "l2_grads": 1.75, "lr": 0.0007168719149790859, "uptime": 88063.528855681, "examples_seen": 47769600.0, "progress": 0.4142873635693543, "epoch": 37.28600564953671, "img/sec/core": 544.6752171693718, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 24.440290958720276, "core_hours": 24.440290958720276} {"step": 46700, "l2_params": 340.36169869346344, "train/loss": 3.1365250945091248, "l2_grads": 1.65625, "lr": 0.0007161819422766359, "uptime": 88157.70472835901, "examples_seen": 47820800.0, "progress": 0.4147314014724297, "epoch": 37.32596921400567, "img/sec/core": 543.6636639944321, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 24.466450923353058, "core_hours": 24.466450923353058} {"step": 46750, "l2_params": 340.40885630830024, "train/loss": 3.328839659690857, "l2_grads": 1.6015625, "lr": 0.0007154914628881157, "uptime": 88251.40009740401, "examples_seen": 47872000.0, "progress": 0.4151754393755051, "epoch": 37.36593277847462, "img/sec/core": 546.4517672736652, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 24.492477414754447, "core_hours": 24.492477414754447} {"step": 46800, "l2_params": 340.40876737570966, "train/loss": 2.543142259120941, "l2_grads": 1.9140625, "lr": 0.0007148004784318665, "uptime": 88346.31007704, "examples_seen": 47923200.0, "progress": 0.4156194772785805, "epoch": 37.405896342943585, "img/sec/core": 539.4585500530666, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 24.51884129798667, "core_hours": 24.51884129798667} {"step": 46850, "l2_params": 340.4558754449686, "train/loss": 2.5306608080863953, "l2_grads": 1.890625, "lr": 0.0007141089905274145, "uptime": 88440.951514958, "examples_seen": 47974400.0, "progress": 0.4160635151816559, "epoch": 37.44585990741254, "img/sec/core": 540.9892445248535, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 24.54513058629722, "core_hours": 24.54513058629722} {"step": 46900, "l2_params": 340.4559701020456, "train/loss": 4.200544834136963, "l2_grads": 1.6796875, "lr": 0.0007134170007954645, "uptime": 88535.485556124, "examples_seen": 48025600.0, "progress": 0.4165075530847313, "epoch": 37.485823471881496, "img/sec/core": 541.603843107625, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 24.571390042176667, "core_hours": 24.571390042176667} {"step": 46950, "l2_params": 340.47352136399684, "train/loss": 2.518571138381958, "l2_grads": 1.9375, "lr": 0.0007127245108578991, "uptime": 88629.954291032, "examples_seen": 48076800.0, "progress": 0.4169515909878067, "epoch": 37.52578703635045, "img/sec/core": 541.9782539679323, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 24.597631357428888, "core_hours": 24.597631357428888} {"step": 47000, "l2_params": 340.4970315812239, "train/loss": 2.715873658657074, "l2_grads": 1.90625, "lr": 0.0007120315223377724, "uptime": 88724.780784402, "examples_seen": 48128000.0, "progress": 0.4173956288908821, "epoch": 37.565750600819406, "img/sec/core": 539.9334951702365, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 24.623972050031668, "core_hours": 24.623972050031668} {"step": 47050, "l2_params": 340.49715777539905, "train/loss": 2.4245272874832153, "l2_grads": 1.921875, "lr": 0.0007113380368593069, "uptime": 88819.516907838, "examples_seen": 48179200.0, "progress": 0.4178396667939575, "epoch": 37.60571416528837, "img/sec/core": 540.4485442618825, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 24.650287639875, "core_hours": 24.650287639875} {"step": 47100, "l2_params": 340.49700576877325, "train/loss": 2.6695327162742615, "l2_grads": 1.7890625, "lr": 0.0007106440560478909, "uptime": 88913.569223888, "examples_seen": 48230400.0, "progress": 0.41828370469703297, "epoch": 37.645677729757324, "img/sec/core": 544.3778755302557, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 24.676413283222224, "core_hours": 24.676413283222224} {"step": 47150, "l2_params": 340.4970086368234, "train/loss": 2.404726982116699, "l2_grads": 1.9765625, "lr": 0.000709949581530072, "uptime": 89007.905688147, "examples_seen": 48281600.0, "progress": 0.41872774260010837, "epoch": 37.68564129422628, "img/sec/core": 542.7381702522748, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 24.7026178566275, "core_hours": 24.7026178566275} {"step": 47200, "l2_params": 340.4970889422184, "train/loss": 2.4907925128936768, "l2_grads": 1.9296875, "lr": 0.0007092546149335559, "uptime": 89101.66423546801, "examples_seen": 48332800.0, "progress": 0.41917178050318377, "epoch": 37.725604858695235, "img/sec/core": 546.083546118778, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 24.72866189755, "core_hours": 24.72866189755} {"step": 47250, "l2_params": 340.4971204907613, "train/loss": 3.3470528721809387, "l2_grads": 1.765625, "lr": 0.0007085591578872015, "uptime": 89197.574912874, "examples_seen": 48384000.0, "progress": 0.41961581840625917, "epoch": 37.76556842316419, "img/sec/core": 533.8300321169645, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 24.755303752384997, "core_hours": 24.755303752384997} {"step": 47300, "l2_params": 340.4971864558869, "train/loss": 4.947053670883179, "l2_grads": 1.71875, "lr": 0.0007078632120210179, "uptime": 89291.377934387, "examples_seen": 48435200.0, "progress": 0.42005985630933457, "epoch": 37.80553198763315, "img/sec/core": 545.8246352214269, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 24.78136014724972, "core_hours": 24.78136014724972} {"step": 47350, "l2_params": 340.49717498369205, "train/loss": 2.3659819960594177, "l2_grads": 1.84375, "lr": 0.0007071667789661591, "uptime": 89385.28136203601, "examples_seen": 48486400.0, "progress": 0.42050389421240997, "epoch": 37.84549555210211, "img/sec/core": 545.2410128347238, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 24.80744443270778, "core_hours": 24.80744443270778} {"step": 47400, "l2_params": 340.49716924759446, "train/loss": 2.5159876346588135, "l2_grads": 1.96875, "lr": 0.0007064698603549206, "uptime": 89479.459002021, "examples_seen": 48537600.0, "progress": 0.42094793211548537, "epoch": 37.88545911657106, "img/sec/core": 543.6534617788201, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 24.833604888259167, "core_hours": 24.833604888259167} {"step": 47450, "l2_params": 340.5206864356775, "train/loss": 3.62910532951355, "l2_grads": 1.625, "lr": 0.000705772457820737, "uptime": 89574.83830491401, "examples_seen": 48588800.0, "progress": 0.42139197001856077, "epoch": 37.92542268104002, "img/sec/core": 536.8040911080409, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 24.86009913906278, "core_hours": 24.86009913906278} {"step": 47500, "l2_params": 340.52056885377715, "train/loss": 4.13776171207428, "l2_grads": 1.7421875, "lr": 0.0007050745729981757, "uptime": 89668.01806132101, "examples_seen": 48640000.0, "progress": 0.42183600792163617, "epoch": 37.96538624550898, "img/sec/core": 549.4755725306183, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 24.885982404731394, "core_hours": 24.885982404731394, "val/acc@1": 0.6246213329081632, "val/loss": 1.588960441703699, "z/secs/eval/val": 31.915200142990216} {"step": 47550, "l2_params": 340.5265454043194, "train/loss": 2.5522327423095703, "l2_grads": 2.03125, "lr": 0.0007043762075229363, "uptime": 89792.728010296, "examples_seen": 48691200.0, "progress": 0.4222800458247116, "epoch": 38.005349809977936, "img/sec/core": 410.5526497349892, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 24.920624057224448, "core_hours": 24.920624057224448} {"step": 47600, "l2_params": 340.5266199671474, "train/loss": 2.7204025983810425, "l2_grads": 1.78125, "lr": 0.0007036773630318435, "uptime": 89885.880802504, "examples_seen": 48742400.0, "progress": 0.422724083727787, "epoch": 38.04531337444689, "img/sec/core": 549.6346248610217, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 24.94649983283778, "core_hours": 24.94649983283778} {"step": 47650, "l2_params": 340.5265454043194, "train/loss": 2.505614459514618, "l2_grads": 1.7734375, "lr": 0.000702978041162846, "uptime": 89980.255549601, "examples_seen": 48793600.0, "progress": 0.4231681216308624, "epoch": 38.08527693891585, "img/sec/core": 542.5180101132047, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 24.972715040364722, "core_hours": 24.972715040364722} {"step": 47700, "l2_params": 340.55002615254637, "train/loss": 2.3827178478240967, "l2_grads": 1.96875, "lr": 0.0007022782435550099, "uptime": 90074.308146122, "examples_seen": 48844800.0, "progress": 0.4236121595339378, "epoch": 38.1252405033848, "img/sec/core": 544.3762521598233, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 24.998840761620556, "core_hours": 24.998840761620556} {"step": 47750, "l2_params": 340.54999174130074, "train/loss": 3.7020058035850525, "l2_grads": 1.65625, "lr": 0.0007015779718485177, "uptime": 90168.483939323, "examples_seen": 48896000.0, "progress": 0.4240561974370132, "epoch": 38.165204067853765, "img/sec/core": 543.664122804034, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 25.02500070417639, "core_hours": 25.02500070417639} {"step": 47800, "l2_params": 340.55002902014996, "train/loss": 3.60447359085083, "l2_grads": 1.8828125, "lr": 0.0007008772276846621, "uptime": 90262.790543348, "examples_seen": 48947200.0, "progress": 0.4245002353400886, "epoch": 38.20516763232272, "img/sec/core": 542.9100170591282, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 25.05119698307222, "core_hours": 25.05119698307222} {"step": 47850, "l2_params": 340.5500490933748, "train/loss": 2.486282706260681, "l2_grads": 1.828125, "lr": 0.0007001760127058427, "uptime": 90355.945998582, "examples_seen": 48998400.0, "progress": 0.42494427324316403, "epoch": 38.245131196791675, "img/sec/core": 549.6189125091171, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 25.077073498415, "core_hours": 25.077073498415} {"step": 47900, "l2_params": 340.5559104244118, "train/loss": 2.4241718649864197, "l2_grads": 1.921875, "lr": 0.000699474328555565, "uptime": 90451.364324168, "examples_seen": 49049600.0, "progress": 0.42538831114623943, "epoch": 38.28509476126063, "img/sec/core": 536.5845573747288, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 25.103578588855555, "core_hours": 25.103578588855555} {"step": 47950, "l2_params": 340.5559390999517, "train/loss": 3.1299121379852295, "l2_grads": 1.8203125, "lr": 0.0006987721768784309, "uptime": 90545.62122458, "examples_seen": 49100800.0, "progress": 0.42583234904931483, "epoch": 38.325058325729586, "img/sec/core": 543.1963047395188, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 25.12976106119222, "core_hours": 25.12976106119222} {"step": 48000, "l2_params": 340.5559018217494, "train/loss": 2.9600273966789246, "l2_grads": 1.7109375, "lr": 0.0006980695593201414, "uptime": 90639.665576624, "examples_seen": 49152000.0, "progress": 0.42627638695239023, "epoch": 38.36502189019855, "img/sec/core": 544.4239753605211, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 25.155884492315558, "core_hours": 25.155884492315558} {"step": 48050, "l2_params": 340.5677274098722, "train/loss": 2.3461520671844482, "l2_grads": 1.8125, "lr": 0.0006973664775274861, "uptime": 90734.414395098, "examples_seen": 49203200.0, "progress": 0.4267204248554657, "epoch": 38.404985454667504, "img/sec/core": 540.376131593093, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 25.182203608558336, "core_hours": 25.182203608558336} {"step": 48100, "l2_params": 340.5677790240512, "train/loss": 2.3627836108207703, "l2_grads": 1.8984375, "lr": 0.0006966629331483452, "uptime": 90829.114759052, "examples_seen": 49254400.0, "progress": 0.4271644627585411, "epoch": 38.44494901913646, "img/sec/core": 540.6526211966305, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 25.20850926521222, "core_hours": 25.20850926521222} {"step": 48150, "l2_params": 340.5678134334996, "train/loss": 4.381340146064758, "l2_grads": 1.6796875, "lr": 0.0006959589278316822, "uptime": 90923.405397889, "examples_seen": 49305600.0, "progress": 0.4276085006616165, "epoch": 38.484912583605414, "img/sec/core": 543.001941990315, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 25.23470110933361, "core_hours": 25.23470110933361} {"step": 48200, "l2_params": 340.59101034543613, "train/loss": 3.996561288833618, "l2_grads": 1.7578125, "lr": 0.0006952544632275414, "uptime": 91018.506238883, "examples_seen": 49356800.0, "progress": 0.4280525385646919, "epoch": 38.52487614807437, "img/sec/core": 538.3758909475044, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 25.26111800960972, "core_hours": 25.26111800960972} {"step": 48250, "l2_params": 340.5912597968421, "train/loss": 2.3573794960975647, "l2_grads": 1.890625, "lr": 0.0006945495409870422, "uptime": 91112.773778253, "examples_seen": 49408000.0, "progress": 0.4284965764677673, "epoch": 38.56483971254333, "img/sec/core": 543.1350000453233, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 25.287303437212497, "core_hours": 25.287303437212497} {"step": 48300, "l2_params": 340.6147418180106, "train/loss": 2.4900534749031067, "l2_grads": 1.921875, "lr": 0.0006938441627623782, "uptime": 91207.078029282, "examples_seen": 49459200.0, "progress": 0.4289406143708427, "epoch": 38.60480327701229, "img/sec/core": 542.9235632681855, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 25.313499062498334, "core_hours": 25.313499062498334} {"step": 48350, "l2_params": 340.6148392979965, "train/loss": 2.4082981944084167, "l2_grads": 1.8828125, "lr": 0.0006931383302068104, "uptime": 91301.88376375701, "examples_seen": 49510400.0, "progress": 0.4293846522739181, "epoch": 38.64476684148124, "img/sec/core": 540.0517203259963, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 25.339833988741393, "core_hours": 25.339833988741393} {"step": 48400, "l2_params": 340.6149740496959, "train/loss": 2.292831003665924, "l2_grads": 1.78125, "lr": 0.0006924320449746662, "uptime": 91395.399730699, "examples_seen": 49561600.0, "progress": 0.4298286901769935, "epoch": 38.6847304059502, "img/sec/core": 547.5000866082848, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 25.365810646225277, "core_hours": 25.365810646225277} {"step": 48450, "l2_params": 340.6150858648953, "train/loss": 2.4798338413238525, "l2_grads": 1.9453125, "lr": 0.0006917253087213326, "uptime": 91489.977326762, "examples_seen": 49612800.0, "progress": 0.4302727280800689, "epoch": 38.72469397041916, "img/sec/core": 541.3544235771834, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 25.392082200687224, "core_hours": 25.392082200687224} {"step": 48500, "l2_params": 340.615131737787, "train/loss": 4.523490309715271, "l2_grads": 1.8984375, "lr": 0.0006910181231032539, "uptime": 91585.232209327, "examples_seen": 49664000.0, "progress": 0.43071676598314435, "epoch": 38.764657534888116, "img/sec/core": 537.5052555973874, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 25.418541890288612, "core_hours": 25.418541890288612} {"step": 48550, "l2_params": 340.6151862118379, "train/loss": 2.512427270412445, "l2_grads": 1.84375, "lr": 0.0006903104897779284, "uptime": 91678.360781006, "examples_seen": 49715200.0, "progress": 0.43116080388621975, "epoch": 38.80462109935707, "img/sec/core": 549.7775717690398, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 25.444410937977224, "core_hours": 25.444410937977224} {"step": 48600, "l2_params": 340.6150743966714, "train/loss": 2.546195387840271, "l2_grads": 1.828125, "lr": 0.0006896024104039033, "uptime": 91773.02666294201, "examples_seen": 49766400.0, "progress": 0.43160484178929515, "epoch": 38.844584663826026, "img/sec/core": 540.8495537453862, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 25.47070701629278, "core_hours": 25.47070701629278} {"step": 48650, "l2_params": 340.61508873195123, "train/loss": 3.6906161308288574, "l2_grads": 1.703125, "lr": 0.000688893886640771, "uptime": 91867.288412325, "examples_seen": 49817600.0, "progress": 0.43204887969237055, "epoch": 38.88454822829498, "img/sec/core": 543.1683618768021, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 25.49689083556583, "core_hours": 25.49689083556583} {"step": 48700, "l2_params": 340.65035742770766, "train/loss": 2.339450418949127, "l2_grads": 1.9609375, "lr": 0.0006881849201491658, "uptime": 91960.869087392, "examples_seen": 49868800.0, "progress": 0.43249291759544595, "epoch": 38.924511792763944, "img/sec/core": 547.1215073340935, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 25.52288546752889, "core_hours": 25.52288546752889} {"step": 48750, "l2_params": 340.6502742916847, "train/loss": 2.4713051319122314, "l2_grads": 2.0, "lr": 0.0006874755125907596, "uptime": 92056.91375421, "examples_seen": 49920000.0, "progress": 0.43293695549852135, "epoch": 38.9644753572329, "img/sec/core": 533.0852997493035, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 25.549564541645, "core_hours": 25.549564541645} {"step": 48800, "l2_params": 340.6502456240858, "train/loss": 4.849804043769836, "l2_grads": 1.921875, "lr": 0.0006867656656282581, "uptime": 92150.058415444, "examples_seen": 49971200.0, "progress": 0.43338099340159675, "epoch": 39.004438921701855, "img/sec/core": 549.6826046892584, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 25.575438058654445, "core_hours": 25.575438058654445} {"step": 48850, "l2_params": 340.73236266716725, "train/loss": 3.433924376964569, "l2_grads": 1.8046875, "lr": 0.0006860553809253967, "uptime": 92244.700062713, "examples_seen": 50022400.0, "progress": 0.43382503130467215, "epoch": 39.04440248617081, "img/sec/core": 540.9880478355618, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 25.60172740511806, "core_hours": 25.60172740511806} {"step": 48900, "l2_params": 340.73239705999487, "train/loss": 2.4079304337501526, "l2_grads": 1.828125, "lr": 0.000685344660146937, "uptime": 92339.377153718, "examples_seen": 50073600.0, "progress": 0.43426906920774755, "epoch": 39.084366050639765, "img/sec/core": 540.785521148913, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 25.628026597063887, "core_hours": 25.628026597063887} {"step": 48950, "l2_params": 340.73834696692126, "train/loss": 5.040885090827942, "l2_grads": 1.7734375, "lr": 0.0006846335049586619, "uptime": 92433.705289068, "examples_seen": 50124800.0, "progress": 0.434713107110823, "epoch": 39.12432961510873, "img/sec/core": 542.7860925059272, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 25.654228856883332, "core_hours": 25.654228856883332} {"step": 49000, "l2_params": 340.7383899572002, "train/loss": 2.475066602230072, "l2_grads": 1.9140625, "lr": 0.0006839219170273734, "uptime": 92527.43248835701, "examples_seen": 50176000.0, "progress": 0.4351571450138984, "epoch": 39.16429317957768, "img/sec/core": 546.2661894134706, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 25.680264190019166, "core_hours": 25.680264190019166} {"step": 49050, "l2_params": 340.7384128853467, "train/loss": 3.4815887212753296, "l2_grads": 1.734375, "lr": 0.0006832098980208878, "uptime": 92621.96924960401, "examples_seen": 50227200.0, "progress": 0.4356011829169738, "epoch": 39.20425674404664, "img/sec/core": 541.5882596847985, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 25.706524401476667, "core_hours": 25.706524401476667} {"step": 49100, "l2_params": 340.74434549141824, "train/loss": 2.4702866673469543, "l2_grads": 2.03125, "lr": 0.0006824974496080312, "uptime": 92715.453920768, "examples_seen": 50278400.0, "progress": 0.4360452208200492, "epoch": 39.244220308515594, "img/sec/core": 547.6833727123112, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 25.732492365688888, "core_hours": 25.732492365688888} {"step": 49150, "l2_params": 340.7501318323296, "train/loss": 2.4121023416519165, "l2_grads": 2.03125, "lr": 0.0006817845734586362, "uptime": 92809.909209784, "examples_seen": 50329600.0, "progress": 0.4364892587231246, "epoch": 39.28418387298455, "img/sec/core": 542.0554056144854, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 25.75872994597111, "core_hours": 25.75872994597111} {"step": 49200, "l2_params": 340.73835556497744, "train/loss": 2.7335093021392822, "l2_grads": 1.953125, "lr": 0.0006810712712435382, "uptime": 92904.45368328001, "examples_seen": 50380800.0, "progress": 0.4369332966262, "epoch": 39.32414743745351, "img/sec/core": 541.5440808622635, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 25.78499229972, "core_hours": 25.78499229972} {"step": 49250, "l2_params": 340.74995701118587, "train/loss": 2.5325247049331665, "l2_grads": 2.015625, "lr": 0.0006803575446345713, "uptime": 92999.538403233, "examples_seen": 50432000.0, "progress": 0.4373773345292754, "epoch": 39.36411100192247, "img/sec/core": 538.4671693339369, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 25.81140472192917, "core_hours": 25.81140472192917} {"step": 49300, "l2_params": 340.773502605653, "train/loss": 2.3162898421287537, "l2_grads": 1.9296875, "lr": 0.0006796433953045632, "uptime": 93092.79934682901, "examples_seen": 50483200.0, "progress": 0.4378213724323508, "epoch": 39.40407456639142, "img/sec/core": 548.9972332018506, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 25.837310539594725, "core_hours": 25.837310539594725} {"step": 49350, "l2_params": 340.77359430878005, "train/loss": 2.4994351267814636, "l2_grads": 2.03125, "lr": 0.0006789288249273346, "uptime": 93187.497843609, "examples_seen": 50534400.0, "progress": 0.4382654103354262, "epoch": 39.44403813086038, "img/sec/core": 540.663281265688, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 25.863615677589166, "core_hours": 25.863615677589166} {"step": 49400, "l2_params": 340.77953203372556, "train/loss": 2.3847396969795227, "l2_grads": 1.7890625, "lr": 0.0006782138351776912, "uptime": 93282.681399687, "examples_seen": 50585600.0, "progress": 0.43870944823850166, "epoch": 39.48400169532933, "img/sec/core": 537.908039052903, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 25.890055554277502, "core_hours": 25.890055554277502} {"step": 49450, "l2_params": 340.797000724955, "train/loss": 2.821627140045166, "l2_grads": 1.90625, "lr": 0.0006774984277314216, "uptime": 93376.227824264, "examples_seen": 50636800.0, "progress": 0.43915348614157707, "epoch": 39.523965259798295, "img/sec/core": 547.3218269059258, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 25.916040672215555, "core_hours": 25.916040672215555} {"step": 49500, "l2_params": 340.79715832882175, "train/loss": 2.336480677127838, "l2_grads": 1.8671875, "lr": 0.0006767826042652946, "uptime": 93470.353311731, "examples_seen": 50688000.0, "progress": 0.43959752404465247, "epoch": 39.56392882426725, "img/sec/core": 543.9546862155887, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 25.942186640956386, "core_hours": 25.942186640956386} {"step": 49550, "l2_params": 340.79718411853844, "train/loss": 2.496058464050293, "l2_grads": 1.9296875, "lr": 0.0006760663664570523, "uptime": 93564.950618584, "examples_seen": 50739200.0, "progress": 0.44004156194772787, "epoch": 39.603892388736206, "img/sec/core": 541.2416241359008, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 25.968463670637778, "core_hours": 25.968463670637778} {"step": 49600, "l2_params": 340.80880362015296, "train/loss": 2.4272943139076233, "l2_grads": 1.8671875, "lr": 0.00067534971598541, "uptime": 93659.92067524101, "examples_seen": 50790400.0, "progress": 0.44048559985080327, "epoch": 39.64385595320516, "img/sec/core": 539.1172944637892, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 25.99484424193139, "core_hours": 25.99484424193139} {"step": 49650, "l2_params": 340.8088494669703, "train/loss": 2.464348256587982, "l2_grads": 1.9609375, "lr": 0.0006746326545300494, "uptime": 93754.181871993, "examples_seen": 50841600.0, "progress": 0.44092963775387867, "epoch": 39.683819517674124, "img/sec/core": 543.171546343838, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 26.021027907695835, "core_hours": 26.021027907695835} {"step": 49700, "l2_params": 340.8381586480965, "train/loss": 2.4158536195755005, "l2_grads": 1.84375, "lr": 0.0006739151837716144, "uptime": 93848.73839718, "examples_seen": 50892800.0, "progress": 0.44137367565695407, "epoch": 39.72378308214308, "img/sec/core": 541.4750584239905, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 26.047293609136666, "core_hours": 26.047293609136666} {"step": 49750, "l2_params": 340.8323967234482, "train/loss": 2.5011963844299316, "l2_grads": 1.9453125, "lr": 0.0006731973053917094, "uptime": 93942.864353571, "examples_seen": 50944000.0, "progress": 0.44181771356002947, "epoch": 39.763746646612034, "img/sec/core": 543.9519762998781, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 26.073439708134167, "core_hours": 26.073439708134167} {"step": 49800, "l2_params": 340.8383334240003, "train/loss": 2.5214314460754395, "l2_grads": 1.8125, "lr": 0.0006724790210728938, "uptime": 94036.668451189, "examples_seen": 50995200.0, "progress": 0.44226175146310487, "epoch": 39.80371021108099, "img/sec/core": 545.818373611989, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 26.099496401916944, "core_hours": 26.099496401916944} {"step": 49850, "l2_params": 340.85008904667313, "train/loss": 4.060530960559845, "l2_grads": 1.6953125, "lr": 0.0006717603324986787, "uptime": 94130.59146515101, "examples_seen": 51046400.0, "progress": 0.4427057893661803, "epoch": 39.843673775549945, "img/sec/core": 545.1273105515136, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 26.125586128017503, "core_hours": 26.125586128017503} {"step": 49900, "l2_params": 340.85016926888125, "train/loss": 4.134881138801575, "l2_grads": 1.7421875, "lr": 0.0006710412413535229, "uptime": 94226.03574866, "examples_seen": 51097600.0, "progress": 0.4431498272692557, "epoch": 39.88363734001891, "img/sec/core": 536.4386228032105, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 26.152098428992222, "core_hours": 26.152098428992222} {"step": 49950, "l2_params": 340.8501205625429, "train/loss": 2.3762006759643555, "l2_grads": 2.015625, "lr": 0.0006703217493228278, "uptime": 94320.219953042, "examples_seen": 51148800.0, "progress": 0.4435938651723311, "epoch": 39.92360090448786, "img/sec/core": 543.6155705295873, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 26.178260707987224, "core_hours": 26.178260707987224} {"step": 50000, "l2_params": 340.8500689911181, "train/loss": 2.362420976161957, "l2_grads": 1.875, "lr": 0.0006696018580929353, "uptime": 94414.50357998701, "examples_seen": 51200000.0, "progress": 0.4440379030754065, "epoch": 39.96356446895682, "img/sec/core": 543.0423251522176, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 26.204450604360837, "core_hours": 26.204450604360837, "val/acc@1": 0.6304009885204082, "val/loss": 1.5481391579520947, "z/secs/eval/val": 31.66543260400067} {"step": 50050, "l2_params": 340.8560025188423, "train/loss": 3.096561014652252, "l2_grads": 1.78125, "lr": 0.0006688815693511231, "uptime": 94539.222250954, "examples_seen": 51251200.0, "progress": 0.4444819409784819, "epoch": 40.00352803342577, "img/sec/core": 410.52393842098303, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 26.239094679629442, "core_hours": 26.239094679629442} {"step": 50100, "l2_params": 340.8618958335619, "train/loss": 2.5525102615356445, "l2_grads": 1.953125, "lr": 0.0006681608847855986, "uptime": 94633.150786062, "examples_seen": 51302400.0, "progress": 0.4449259788815573, "epoch": 40.04349159789473, "img/sec/core": 545.095267813214, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 26.26518593938167, "core_hours": 26.26518593938167} {"step": 50150, "l2_params": 340.8618442639187, "train/loss": 3.382028579711914, "l2_grads": 1.7734375, "lr": 0.0006674398060854989, "uptime": 94727.381721187, "examples_seen": 51353600.0, "progress": 0.4453700167846327, "epoch": 40.08345516236369, "img/sec/core": 543.3459822093611, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 26.291361199138613, "core_hours": 26.291361199138613} {"step": 50200, "l2_params": 340.8736621031684, "train/loss": 4.211210131645203, "l2_grads": 1.609375, "lr": 0.000666718334940885, "uptime": 94821.803016339, "examples_seen": 51404800.0, "progress": 0.44581405468770813, "epoch": 40.12341872683265, "img/sec/core": 542.2505581773345, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 26.317589336680836, "core_hours": 26.317589336680836} {"step": 50250, "l2_params": 340.87364777876275, "train/loss": 2.3295748233795166, "l2_grads": 1.8046875, "lr": 0.0006659964730427364, "uptime": 94915.410126463, "examples_seen": 51456000.0, "progress": 0.44625809259078353, "epoch": 40.1633822913016, "img/sec/core": 546.9669978293246, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 26.343591311715276, "core_hours": 26.343591311715276} {"step": 50300, "l2_params": 340.87958662572476, "train/loss": 2.35887748003006, "l2_grads": 1.8671875, "lr": 0.0006652742220829495, "uptime": 95009.709383262, "examples_seen": 51507200.0, "progress": 0.44670213049385893, "epoch": 40.20334585577056, "img/sec/core": 542.9523173139443, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 26.369785549715, "core_hours": 26.369785549715} {"step": 50350, "l2_params": 340.91466754435044, "train/loss": 2.3168525099754333, "l2_grads": 2.015625, "lr": 0.0006645515837543321, "uptime": 95103.207965013, "examples_seen": 51558400.0, "progress": 0.4471461683969344, "epoch": 40.24330942023951, "img/sec/core": 547.6018891532664, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 26.39575737797917, "core_hours": 26.39575737797917} {"step": 50400, "l2_params": 340.91470764785873, "train/loss": 2.430434763431549, "l2_grads": 1.9765625, "lr": 0.0006638285597506002, "uptime": 95198.077627363, "examples_seen": 51609600.0, "progress": 0.4475902063000098, "epoch": 40.283272984708475, "img/sec/core": 539.6878067417302, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 26.422110061965277, "core_hours": 26.422110061965277} {"step": 50450, "l2_params": 340.914713376931, "train/loss": 2.579707622528076, "l2_grads": 2.078125, "lr": 0.0006631051517663737, "uptime": 95291.717596926, "examples_seen": 51660800.0, "progress": 0.4480342442030852, "epoch": 40.32323654917743, "img/sec/core": 546.7750602541126, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 26.448121164621668, "core_hours": 26.448121164621668} {"step": 50500, "l2_params": 340.9147391577548, "train/loss": 2.778673768043518, "l2_grads": 1.890625, "lr": 0.0006623813614971713, "uptime": 95386.545968456, "examples_seen": 51712000.0, "progress": 0.4484782821061606, "epoch": 40.363200113646386, "img/sec/core": 539.9228013084584, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 26.47446237893556, "core_hours": 26.47446237893556} {"step": 50550, "l2_params": 340.9148021775382, "train/loss": 2.266583025455475, "l2_grads": 1.8359375, "lr": 0.0006616571906394099, "uptime": 95480.722852663, "examples_seen": 51763200.0, "progress": 0.448922320009236, "epoch": 40.40316367811534, "img/sec/core": 543.6578246468853, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 26.500622624548612, "core_hours": 26.500622624548612} {"step": 50600, "l2_params": 340.93815879863024, "train/loss": 4.825529217720032, "l2_grads": 1.8359375, "lr": 0.0006609326408903966, "uptime": 95574.91626995, "examples_seen": 51814400.0, "progress": 0.4493663579123114, "epoch": 40.4431272425843, "img/sec/core": 543.5624003745427, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 26.526787462683888, "core_hours": 26.526787462683888} {"step": 50650, "l2_params": 340.9381988993753, "train/loss": 2.434792220592499, "l2_grads": 2.03125, "lr": 0.0006602077139483273, "uptime": 95669.25578653501, "examples_seen": 51865600.0, "progress": 0.4498103958153868, "epoch": 40.48309080705326, "img/sec/core": 542.7206101259164, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 26.552992883957504, "core_hours": 26.552992883957504} {"step": 50700, "l2_params": 340.93815879863024, "train/loss": 3.8475273847579956, "l2_grads": 1.6953125, "lr": 0.0006594824115122826, "uptime": 95764.329726469, "examples_seen": 51916800.0, "progress": 0.4502544337184622, "epoch": 40.523054371522214, "img/sec/core": 538.5282237755772, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 26.579402311716944, "core_hours": 26.579402311716944} {"step": 50750, "l2_params": 340.93835930230847, "train/loss": 3.1049492955207825, "l2_grads": 1.734375, "lr": 0.0006587567352822212, "uptime": 95857.356089659, "examples_seen": 51968000.0, "progress": 0.4506984716215376, "epoch": 40.56301793599117, "img/sec/core": 550.3816148915403, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 26.605242968158613, "core_hours": 26.605242968158613} {"step": 50800, "l2_params": 341.00873453806133, "train/loss": 3.188019812107086, "l2_grads": 1.828125, "lr": 0.0006580306869589797, "uptime": 95951.680019483, "examples_seen": 52019200.0, "progress": 0.45114250952461304, "epoch": 40.602981500460125, "img/sec/core": 542.810293162491, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 26.63144405977639, "core_hours": 26.63144405977639} {"step": 50851, "l2_params": 341.02039837724516, "train/loss": 3.716276228427887, "l2_grads": 1.8125, "lr": 0.0006573042682442664, "uptime": 96046.348532605, "examples_seen": 52070400.0, "progress": 0.45158654742768845, "epoch": 40.64294506492909, "img/sec/core": 540.8345215480263, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 26.657740868976944, "core_hours": 26.657740868976944} {"step": 50900, "l2_params": 341.0204098318384, "train/loss": 2.375861704349518, "l2_grads": 1.90625, "lr": 0.0006565774808406574, "uptime": 96140.572186453, "examples_seen": 52121600.0, "progress": 0.45203058533076385, "epoch": 40.68290862939804, "img/sec/core": 543.3879701013445, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 26.683914106156944, "core_hours": 26.683914106156944} {"step": 50950, "l2_params": 341.02030960413487, "train/loss": 2.4151883125305176, "l2_grads": 2.0, "lr": 0.0006558503264515929, "uptime": 96233.88107510301, "examples_seen": 52172800.0, "progress": 0.45247462323383925, "epoch": 40.722872193867, "img/sec/core": 548.7151410842307, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 26.709833241893058, "core_hours": 26.709833241893058} {"step": 51000, "l2_params": 341.0319988193923, "train/loss": 2.3495997190475464, "l2_grads": 1.9921875, "lr": 0.0006551228067813735, "uptime": 96328.682894426, "examples_seen": 52224000.0, "progress": 0.45291866113691465, "epoch": 40.76283575833595, "img/sec/core": 540.0740235328083, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 26.736167080593887, "core_hours": 26.736167080593887} {"step": 51050, "l2_params": 341.0321248156103, "train/loss": 4.446783065795898, "l2_grads": 1.6875, "lr": 0.0006543949235351564, "uptime": 96422.34917416, "examples_seen": 52275200.0, "progress": 0.45336269903999005, "epoch": 40.80279932280491, "img/sec/core": 546.6214751498998, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 26.76218549163111, "core_hours": 26.76218549163111} {"step": 51100, "l2_params": 341.0322078585467, "train/loss": 2.4874908924102783, "l2_grads": 1.984375, "lr": 0.00065366667841895, "uptime": 96516.797618184, "examples_seen": 52326400.0, "progress": 0.45380673694306545, "epoch": 40.84276288727387, "img/sec/core": 542.094690167549, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 26.788421170526668, "core_hours": 26.788421170526668} {"step": 51150, "l2_params": 341.0321649053063, "train/loss": 2.4398550987243652, "l2_grads": 2.0, "lr": 0.0006529380731396121, "uptime": 96611.398178306, "examples_seen": 52377600.0, "progress": 0.45425077484614085, "epoch": 40.882726451742826, "img/sec/core": 541.223011089718, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 26.814699103893886, "core_hours": 26.814699103893886} {"step": 51200, "l2_params": 341.03221072209584, "train/loss": 2.360753059387207, "l2_grads": 1.8984375, "lr": 0.0006522091094048428, "uptime": 96704.563928987, "examples_seen": 52428800.0, "progress": 0.45469481274921625, "epoch": 40.92269001621178, "img/sec/core": 549.5581758935073, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 26.840578479083053, "core_hours": 26.840578479083053} {"step": 51250, "l2_params": 341.0321563146575, "train/loss": 3.8558254837989807, "l2_grads": 1.65625, "lr": 0.0006514797889231838, "uptime": 96798.88796527301, "examples_seen": 52480000.0, "progress": 0.4551388506522917, "epoch": 40.96265358068074, "img/sec/core": 542.8096805012846, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 26.866779600273613, "core_hours": 26.866779600273613} {"step": 51300, "l2_params": 341.03221072209584, "train/loss": 2.3757811188697815, "l2_grads": 1.9296875, "lr": 0.0006507501134040118, "uptime": 96893.223078704, "examples_seen": 52531200.0, "progress": 0.4555828885553671, "epoch": 41.00261714514969, "img/sec/core": 542.7459419705222, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 26.89298379844889, "core_hours": 26.89298379844889} {"step": 51350, "l2_params": 341.0322364940373, "train/loss": 2.664551317691803, "l2_grads": 1.8984375, "lr": 0.0006500200845575373, "uptime": 96986.636926716, "examples_seen": 52582400.0, "progress": 0.4560269264584425, "epoch": 41.042580709618655, "img/sec/core": 548.0986073223513, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 26.918932089563334, "core_hours": 26.918932089563334} {"step": 51400, "l2_params": 341.03221072209584, "train/loss": 2.34896057844162, "l2_grads": 1.953125, "lr": 0.0006492897040947973, "uptime": 97080.076272338, "examples_seen": 52633600.0, "progress": 0.4564709643615179, "epoch": 41.08254427408761, "img/sec/core": 547.9490428702859, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 26.944887463347225, "core_hours": 26.944887463347225} {"step": 51450, "l2_params": 341.0439453446579, "train/loss": 2.3362868428230286, "l2_grads": 1.9609375, "lr": 0.0006485589737276544, "uptime": 97173.401773192, "examples_seen": 52684800.0, "progress": 0.4569150022645933, "epoch": 41.122507838556565, "img/sec/core": 548.6174682319484, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 26.970811213584444, "core_hours": 26.970811213584444} {"step": 51500, "l2_params": 341.0439567984602, "train/loss": 2.7020527124404907, "l2_grads": 1.90625, "lr": 0.0006478278951687896, "uptime": 97266.62078963101, "examples_seen": 52736000.0, "progress": 0.4573590401676687, "epoch": 41.16247140302552, "img/sec/core": 549.244155922855, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 26.996705384817503, "core_hours": 26.996705384817503} {"step": 51550, "l2_params": 341.06742483158666, "train/loss": 4.158943772315979, "l2_grads": 1.71875, "lr": 0.0006470964701317015, "uptime": 97359.70680677201, "examples_seen": 52787200.0, "progress": 0.4578030780707441, "epoch": 41.20243496749448, "img/sec/core": 550.0289041526473, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 27.022562611801114, "core_hours": 27.022562611801114} {"step": 51600, "l2_params": 341.1145163742669, "train/loss": 2.6263219714164734, "l2_grads": 1.8125, "lr": 0.0006463647003307003, "uptime": 97452.6043759, "examples_seen": 52838400.0, "progress": 0.4582471159738195, "epoch": 41.24239853196344, "img/sec/core": 551.1446691296935, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 27.048367492114444, "core_hours": 27.048367492114444} {"step": 51650, "l2_params": 341.12020196332554, "train/loss": 2.288435995578766, "l2_grads": 1.9296875, "lr": 0.0006456325874809035, "uptime": 97545.489554225, "examples_seen": 52889600.0, "progress": 0.4586911538768949, "epoch": 41.282362096432394, "img/sec/core": 551.218191355078, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 27.074168930538058, "core_hours": 27.074168930538058} {"step": 51700, "l2_params": 341.12609930200296, "train/loss": 2.5104207396507263, "l2_grads": 2.03125, "lr": 0.0006449001332982336, "uptime": 97638.220547163, "examples_seen": 52940800.0, "progress": 0.45913519177997036, "epoch": 41.32232566090135, "img/sec/core": 552.1347111448804, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 27.0999275396875, "core_hours": 27.0999275396875} {"step": 51751, "l2_params": 341.12620522414426, "train/loss": 3.9570415019989014, "l2_grads": 1.734375, "lr": 0.0006441673394994124, "uptime": 97730.920930422, "examples_seen": 52992000.0, "progress": 0.45957922968304576, "epoch": 41.362289225370304, "img/sec/core": 552.317026100647, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 27.125677646148333, "core_hours": 27.125677646148333} {"step": 51800, "l2_params": 341.126199498624, "train/loss": 2.394222140312195, "l2_grads": 1.8828125, "lr": 0.0006434342078019578, "uptime": 97823.651318302, "examples_seen": 53043200.0, "progress": 0.46002326758612117, "epoch": 41.40225278983927, "img/sec/core": 552.1383137775281, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 27.15143608722611, "core_hours": 27.15143608722611} {"step": 51850, "l2_params": 341.1261164785687, "train/loss": 4.6839375495910645, "l2_grads": 1.7109375, "lr": 0.0006427007399241815, "uptime": 97916.507233487, "examples_seen": 53094400.0, "progress": 0.46046730548919657, "epoch": 41.44221635430822, "img/sec/core": 551.3919053836179, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 27.177229396999724, "core_hours": 27.177229396999724} {"step": 51900, "l2_params": 341.1260849881976, "train/loss": 2.9672651290893555, "l2_grads": 2.046875, "lr": 0.0006419669375851794, "uptime": 98009.175578879, "examples_seen": 53145600.0, "progress": 0.46091134339227197, "epoch": 41.48217991877718, "img/sec/core": 552.5079765201174, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 27.202970604053057, "core_hours": 27.202970604053057} {"step": 51950, "l2_params": 341.1260935764809, "train/loss": 3.216646909713745, "l2_grads": 1.8046875, "lr": 0.0006412328025048349, "uptime": 98101.805584064, "examples_seen": 53196800.0, "progress": 0.46135538129534737, "epoch": 41.52214348324613, "img/sec/core": 552.7366634358388, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 27.22870116104889, "core_hours": 27.22870116104889} {"step": 52000, "l2_params": 341.1261622827396, "train/loss": 2.5580671429634094, "l2_grads": 1.78125, "lr": 0.0006404983364038094, "uptime": 98194.442245336, "examples_seen": 53248000.0, "progress": 0.46179941919842277, "epoch": 41.56210704771509, "img/sec/core": 552.6969484539793, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 27.25443356695778, "core_hours": 27.25443356695778} {"step": 52050, "l2_params": 341.1260735371528, "train/loss": 4.41999363899231, "l2_grads": 1.7109375, "lr": 0.0006397635410035409, "uptime": 98287.196975931, "examples_seen": 53299200.0, "progress": 0.46224345710149817, "epoch": 41.60207061218405, "img/sec/core": 551.9934096251945, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 27.28019876990083, "core_hours": 27.28019876990083} {"step": 52100, "l2_params": 341.12607926267526, "train/loss": 4.563007235527039, "l2_grads": 1.7734375, "lr": 0.0006390284180262384, "uptime": 98379.782429475, "examples_seen": 53350400.0, "progress": 0.46268749500457357, "epoch": 41.642034176653006, "img/sec/core": 553.0026374571596, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 27.305916951440835, "core_hours": 27.305916951440835} {"step": 52150, "l2_params": 341.12609643924196, "train/loss": 4.406824469566345, "l2_grads": 1.9765625, "lr": 0.0006382929691948795, "uptime": 98472.38256950601, "examples_seen": 53401600.0, "progress": 0.463131532907649, "epoch": 41.68199774112196, "img/sec/core": 552.9149306130292, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 27.331639212560557, "core_hours": 27.331639212560557} {"step": 52200, "l2_params": 341.12609930200296, "train/loss": 2.4113080501556396, "l2_grads": 2.046875, "lr": 0.000637557196233206, "uptime": 98564.980475338, "examples_seen": 53452800.0, "progress": 0.4635755708107244, "epoch": 41.721961305590916, "img/sec/core": 552.9282713250072, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 27.357360853069444, "core_hours": 27.357360853069444} {"step": 52250, "l2_params": 341.1260907137198, "train/loss": 2.3346864581108093, "l2_grads": 2.015625, "lr": 0.0006368211008657166, "uptime": 98657.601286031, "examples_seen": 53504000.0, "progress": 0.4640196087137998, "epoch": 41.76192487005987, "img/sec/core": 552.7915337483666, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 27.38308885603972, "core_hours": 27.38308885603972} {"step": 52300, "l2_params": 341.12610789028594, "train/loss": 4.649880766868591, "l2_grads": 1.8359375, "lr": 0.0006360846848176691, "uptime": 98750.170462824, "examples_seen": 53555200.0, "progress": 0.4644636466168752, "epoch": 41.801888434528834, "img/sec/core": 553.0998737786506, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 27.408802516259996, "core_hours": 27.408802516259996} {"step": 52350, "l2_params": 341.13783928292827, "train/loss": 3.9668092727661133, "l2_grads": 1.6953125, "lr": 0.0006353479498150711, "uptime": 98842.743037825, "examples_seen": 53606400.0, "progress": 0.4649076845199506, "epoch": 41.84185199899779, "img/sec/core": 553.0795702663082, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 27.434517120426946, "core_hours": 27.434517120426946} {"step": 52400, "l2_params": 341.1378077936393, "train/loss": 2.629082679748535, "l2_grads": 1.90625, "lr": 0.0006346108975846786, "uptime": 98935.326659859, "examples_seen": 53657600.0, "progress": 0.465351722423026, "epoch": 41.881815563466745, "img/sec/core": 553.0135770795204, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 27.460234793214166, "core_hours": 27.460234793214166} {"step": 52450, "l2_params": 341.13783069494065, "train/loss": 2.5608233213424683, "l2_grads": 1.9296875, "lr": 0.00063387352985399, "uptime": 99027.889634998, "examples_seen": 53708800.0, "progress": 0.4657957603261014, "epoch": 41.9217791279357, "img/sec/core": 553.1369310797281, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 27.48594673075278, "core_hours": 27.48594673075278} {"step": 52500, "l2_params": 341.16137528210163, "train/loss": 2.6382538080215454, "l2_grads": 1.8671875, "lr": 0.000633135848351244, "uptime": 99120.379769359, "examples_seen": 53760000.0, "progress": 0.4662397982291768, "epoch": 41.96174269240466, "img/sec/core": 553.5725551026053, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 27.511638434741943, "core_hours": 27.511638434741943, "val/acc@1": 0.6371372767857143, "val/loss": 1.5070398243106142, "z/secs/eval/val": 31.554590131010627} {"step": 52550, "l2_params": 341.1612894081405, "train/loss": 3.979839503765106, "l2_grads": 2.0, "lr": 0.0006323978548054149, "uptime": 99244.16900725801, "examples_seen": 53811200.0, "progress": 0.4666838361322522, "epoch": 42.00170625687362, "img/sec/core": 413.6062299839928, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 27.546024334158336, "core_hours": 27.546024334158336} {"step": 52601, "l2_params": 341.1848695859402, "train/loss": 3.3755308985710144, "l2_grads": 1.75, "lr": 0.0006316595509462076, "uptime": 99336.689876692, "examples_seen": 53862400.0, "progress": 0.46712787403532763, "epoch": 42.04166982134257, "img/sec/core": 553.3886604527178, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 27.571724575667776, "core_hours": 27.571724575667776} {"step": 52650, "l2_params": 341.18478658016096, "train/loss": 2.2783689498901367, "l2_grads": 1.921875, "lr": 0.0006309209385040544, "uptime": 99429.223336781, "examples_seen": 53913600.0, "progress": 0.4675719119384031, "epoch": 42.08163338581153, "img/sec/core": 553.3133630879047, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 27.59742831458139, "core_hours": 27.59742831458139} {"step": 52700, "l2_params": 341.1847407838604, "train/loss": 4.953097343444824, "l2_grads": 1.90625, "lr": 0.0006301820192101114, "uptime": 99521.74401756801, "examples_seen": 53964800.0, "progress": 0.4680159498414785, "epoch": 42.121596950280484, "img/sec/core": 553.3897887961397, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 27.623128503688893, "core_hours": 27.623128503688893} {"step": 52751, "l2_params": 341.1846348798917, "train/loss": 2.359947621822357, "l2_grads": 1.96875, "lr": 0.0006294427947962542, "uptime": 99614.31194362, "examples_seen": 54016000.0, "progress": 0.4684599877445539, "epoch": 42.161560514749446, "img/sec/core": 553.1073470441575, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 27.648841816481113, "core_hours": 27.648841816481113} {"step": 52800, "l2_params": 341.18469784982295, "train/loss": 3.1560248136520386, "l2_grads": 1.8125, "lr": 0.0006287032669950728, "uptime": 99706.88964074, "examples_seen": 54067200.0, "progress": 0.4689040256476293, "epoch": 42.2015240792184, "img/sec/core": 553.0489695983309, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 27.67455784345889, "core_hours": 27.67455784345889} {"step": 52850, "l2_params": 341.2083107547719, "train/loss": 4.922660827636719, "l2_grads": 1.875, "lr": 0.0006279634375398679, "uptime": 99799.446430604, "examples_seen": 54118400.0, "progress": 0.4693480635507047, "epoch": 42.24148764368736, "img/sec/core": 553.1738954563091, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 27.700268062865558, "core_hours": 27.700268062865558} {"step": 52900, "l2_params": 341.2080875131406, "train/loss": 2.3282971382141113, "l2_grads": 1.9140625, "lr": 0.0006272233081646479, "uptime": 99892.039594568, "examples_seen": 54169600.0, "progress": 0.4697921014537801, "epoch": 42.28145120815631, "img/sec/core": 552.9565878092715, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 27.725988386188888, "core_hours": 27.725988386188888} {"step": 52950, "l2_params": 341.231690213922, "train/loss": 2.291856288909912, "l2_grads": 1.8984375, "lr": 0.0006264828806041245, "uptime": 99984.618376289, "examples_seen": 54220800.0, "progress": 0.4702361393568555, "epoch": 42.32141477262527, "img/sec/core": 553.0424903872977, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 27.75170471444472, "core_hours": 27.75170471444472} {"step": 53000, "l2_params": 341.2316186670353, "train/loss": 2.4799233078956604, "l2_grads": 1.9375, "lr": 0.0006257421565937073, "uptime": 100077.164220013, "examples_seen": 54272000.0, "progress": 0.4706801772599309, "epoch": 42.36137833709423, "img/sec/core": 553.239323774424, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 27.777411893256943, "core_hours": 27.777411893256943} {"step": 53050, "l2_params": 341.2316415620407, "train/loss": 4.916182637214661, "l2_grads": 1.828125, "lr": 0.0006250011378695022, "uptime": 100169.85345141501, "examples_seen": 54323200.0, "progress": 0.4711242151630063, "epoch": 42.401341901563185, "img/sec/core": 552.3834778382992, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 27.803158901979725, "core_hours": 27.803158901979725} {"step": 53100, "l2_params": 341.2374511200009, "train/loss": 2.8632516860961914, "l2_grads": 1.8984375, "lr": 0.0006242598261683039, "uptime": 100262.55237864901, "examples_seen": 54374400.0, "progress": 0.47156825306608174, "epoch": 42.44130546603214, "img/sec/core": 552.3257013617423, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 27.82890860398917, "core_hours": 27.82890860398917} {"step": 53150, "l2_params": 341.2843704073994, "train/loss": 4.711867809295654, "l2_grads": 1.7109375, "lr": 0.0006235182232275955, "uptime": 100355.120895567, "examples_seen": 54425600.0, "progress": 0.47201229096915714, "epoch": 42.481269030501096, "img/sec/core": 553.1038165530806, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 27.854622080910833, "core_hours": 27.854622080910833} {"step": 53200, "l2_params": 341.28438471456616, "train/loss": 3.504573404788971, "l2_grads": 1.8203125, "lr": 0.0006227763307855409, "uptime": 100447.63882735801, "examples_seen": 54476800.0, "progress": 0.47245632887223254, "epoch": 42.52123259497005, "img/sec/core": 553.4062317309206, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 27.880321506408336, "core_hours": 27.880321506408336} {"step": 53250, "l2_params": 341.2843274858956, "train/loss": 3.2679595351219177, "l2_grads": 1.828125, "lr": 0.0006220341505809844, "uptime": 100540.18794401501, "examples_seen": 54528000.0, "progress": 0.47290036677530795, "epoch": 42.561196159439014, "img/sec/core": 553.2197588633381, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 27.90602959436861, "core_hours": 27.90602959436861} {"step": 53300, "l2_params": 341.28441332889787, "train/loss": 4.050556540489197, "l2_grads": 1.71875, "lr": 0.0006212916843534444, "uptime": 100632.779180029, "examples_seen": 54579200.0, "progress": 0.47334440467838335, "epoch": 42.60115972390797, "img/sec/core": 552.9681015626894, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 27.931749382150276, "core_hours": 27.931749382150276} {"step": 53350, "l2_params": 341.28433034732933, "train/loss": 4.741677641868591, "l2_grads": 1.7578125, "lr": 0.0006205489338431082, "uptime": 100725.366127589, "examples_seen": 54630400.0, "progress": 0.47378844258145875, "epoch": 42.641123288376924, "img/sec/core": 552.9937140093936, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 27.95746797869472, "core_hours": 27.95746797869472} {"step": 53400, "l2_params": 341.28437899169955, "train/loss": 2.4308160543441772, "l2_grads": 2.078125, "lr": 0.0006198059007908309, "uptime": 100817.880355407, "examples_seen": 54681600.0, "progress": 0.47423248048453415, "epoch": 42.68108685284588, "img/sec/core": 553.4283883417846, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 27.983166375310834, "core_hours": 27.983166375310834} {"step": 53450, "l2_params": 341.28441332889787, "train/loss": 2.3584600687026978, "l2_grads": 2.109375, "lr": 0.0006190625869381293, "uptime": 100910.42722280801, "examples_seen": 54732800.0, "progress": 0.47467651838760955, "epoch": 42.72105041731484, "img/sec/core": 553.2332042980022, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 28.00887383847778, "core_hours": 28.00887383847778} {"step": 53500, "l2_params": 341.28437899169955, "train/loss": 2.336728513240814, "l2_grads": 1.9921875, "lr": 0.0006183189940271785, "uptime": 101003.000781932, "examples_seen": 54784000.0, "progress": 0.47512055629068495, "epoch": 42.7610139817838, "img/sec/core": 553.0736906358153, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 28.03458871601222, "core_hours": 28.03458871601222} {"step": 53550, "l2_params": 341.2843131787264, "train/loss": 4.782210469245911, "l2_grads": 1.84375, "lr": 0.0006175751238008073, "uptime": 101095.583864408, "examples_seen": 54835200.0, "progress": 0.4755645941937604, "epoch": 42.80097754625275, "img/sec/core": 553.0167999458173, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 28.060306238922223, "core_hours": 28.060306238922223} {"step": 53600, "l2_params": 341.2845363704969, "train/loss": 4.134348511695862, "l2_grads": 1.625, "lr": 0.000616830978002495, "uptime": 101188.165466316, "examples_seen": 54886400.0, "progress": 0.4760086320968358, "epoch": 42.84094111072171, "img/sec/core": 553.0256438086018, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 28.086023350563334, "core_hours": 28.086023350563334} {"step": 53650, "l2_params": 341.28454209336087, "train/loss": 2.437819004058838, "l2_grads": 2.046875, "lr": 0.0006160865583763666, "uptime": 101280.761858595, "examples_seen": 54937600.0, "progress": 0.4764526699999112, "epoch": 42.88090467519066, "img/sec/core": 552.9373093255368, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 28.11174457064083, "core_hours": 28.11174457064083} {"step": 53700, "l2_params": 341.28439616029914, "train/loss": 4.864381790161133, "l2_grads": 1.921875, "lr": 0.0006153418666671892, "uptime": 101373.349262381, "examples_seen": 54988800.0, "progress": 0.4768967079029866, "epoch": 42.920868239659626, "img/sec/core": 552.990989123503, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 28.13746329391472, "core_hours": 28.13746329391472} {"step": 53750, "l2_params": 341.28455926195227, "train/loss": 3.0045436024665833, "l2_grads": 1.890625, "lr": 0.0006145969046203664, "uptime": 101465.98968865, "examples_seen": 55040000.0, "progress": 0.477340745806062, "epoch": 42.96083180412858, "img/sec/core": 552.6744863125726, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 28.163196745656112, "core_hours": 28.163196745656112} {"step": 53800, "l2_params": 341.28454781622474, "train/loss": 2.3910160064697266, "l2_grads": 2.046875, "lr": 0.0006138516739819367, "uptime": 101558.494891198, "examples_seen": 55091200.0, "progress": 0.4777847837091374, "epoch": 43.00079536859754, "img/sec/core": 553.4823835819925, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 28.188892635252778, "core_hours": 28.188892635252778} {"step": 53850, "l2_params": 341.2844676961215, "train/loss": 4.0977436900138855, "l2_grads": 1.8046875, "lr": 0.0006131061764985669, "uptime": 101651.051726555, "examples_seen": 55142400.0, "progress": 0.4782288216122128, "epoch": 43.04075893306649, "img/sec/core": 553.1736235634912, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 28.21460286729639, "core_hours": 28.21460286729639} {"step": 53900, "l2_params": 341.28439329886595, "train/loss": 4.206947922706604, "l2_grads": 1.875, "lr": 0.000612360413917551, "uptime": 101743.610832091, "examples_seen": 55193600.0, "progress": 0.4786728595152882, "epoch": 43.08072249753545, "img/sec/core": 553.1600559826846, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 28.240313729945278, "core_hours": 28.240313729945278} {"step": 53950, "l2_params": 341.30209080446605, "train/loss": 2.308878242969513, "l2_grads": 1.984375, "lr": 0.0006116143879868021, "uptime": 101836.122965132, "examples_seen": 55244800.0, "progress": 0.4791168974183636, "epoch": 43.12068606200441, "img/sec/core": 553.4409197689432, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 28.266011544678886, "core_hours": 28.266011544678886} {"step": 54000, "l2_params": 341.3020707754716, "train/loss": 2.2696167826652527, "l2_grads": 2.015625, "lr": 0.0006108681004548532, "uptime": 101928.61415904001, "examples_seen": 55296000.0, "progress": 0.47956093532143906, "epoch": 43.160649626473365, "img/sec/core": 553.5662135675905, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 28.291703542986667, "core_hours": 28.291703542986667} {"step": 54050, "l2_params": 341.30195632405184, "train/loss": 2.326196074485779, "l2_grads": 2.015625, "lr": 0.0006101215530708487, "uptime": 102021.336544206, "examples_seen": 55347200.0, "progress": 0.48000497322451446, "epoch": 43.20061319094232, "img/sec/core": 552.1859679120645, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 28.317459761088333, "core_hours": 28.317459761088333} {"step": 54100, "l2_params": 341.30195632405184, "train/loss": 3.5674086213111877, "l2_grads": 1.6953125, "lr": 0.0006093747475845419, "uptime": 102113.747266109, "examples_seen": 55398400.0, "progress": 0.48044901112758986, "epoch": 43.240576755411276, "img/sec/core": 554.048263509337, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 28.34312940606139, "core_hours": 28.34312940606139} {"step": 54150, "l2_params": 341.3020478851907, "train/loss": 2.708486020565033, "l2_grads": 1.90625, "lr": 0.0006086276857462914, "uptime": 102206.198311099, "examples_seen": 55449600.0, "progress": 0.48089304903066526, "epoch": 43.28054031988023, "img/sec/core": 553.8066119808557, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 28.368810251891944, "core_hours": 28.368810251891944} {"step": 54200, "l2_params": 341.30197921433887, "train/loss": 2.4119226932525635, "l2_grads": 1.9140625, "lr": 0.0006078803693070563, "uptime": 102298.749717524, "examples_seen": 55500800.0, "progress": 0.48133708693374067, "epoch": 43.32050388434919, "img/sec/core": 553.2060719302996, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 28.39451897589889, "core_hours": 28.39451897589889} {"step": 54250, "l2_params": 341.30195060147986, "train/loss": 2.2559831738471985, "l2_grads": 2.015625, "lr": 0.0006071328000183936, "uptime": 102391.226822854, "examples_seen": 55552000.0, "progress": 0.48178112483681607, "epoch": 43.36046744881815, "img/sec/core": 553.6505475305671, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 28.420207060712777, "core_hours": 28.420207060712777} {"step": 54300, "l2_params": 341.3137074232443, "train/loss": 5.015326142311096, "l2_grads": 1.6953125, "lr": 0.000606384979632452, "uptime": 102483.746817256, "examples_seen": 55603200.0, "progress": 0.48222516273989147, "epoch": 43.400431013287104, "img/sec/core": 553.3938942704252, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 28.44590705915778, "core_hours": 28.44590705915778} {"step": 54350, "l2_params": 341.3136988396818, "train/loss": 2.3560632467269897, "l2_grads": 1.8984375, "lr": 0.000605636909901968, "uptime": 102576.19140446301, "examples_seen": 55654400.0, "progress": 0.48266920064296687, "epoch": 43.44039457775606, "img/sec/core": 553.8452985392263, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 28.471586111159727, "core_hours": 28.471586111159727} {"step": 54400, "l2_params": 341.3137331739305, "train/loss": 2.536863923072815, "l2_grads": 1.921875, "lr": 0.0006048885925802653, "uptime": 102668.67937986, "examples_seen": 55705600.0, "progress": 0.48311323854604227, "epoch": 43.48035814222502, "img/sec/core": 553.5854772497038, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 28.497277215436664, "core_hours": 28.497277215436664} {"step": 54450, "l2_params": 341.3371826590608, "train/loss": 2.7993412613868713, "l2_grads": 1.8203125, "lr": 0.0006041400294212444, "uptime": 102761.163696116, "examples_seen": 55756800.0, "progress": 0.4835572764491177, "epoch": 43.52032170669398, "img/sec/core": 553.6073798532173, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 28.522967303285554, "core_hours": 28.522967303285554} {"step": 54500, "l2_params": 341.3723367023535, "train/loss": 2.2315380573272705, "l2_grads": 1.984375, "lr": 0.0006033912221793843, "uptime": 102853.66748794001, "examples_seen": 55808000.0, "progress": 0.4840013143521931, "epoch": 43.56028527116293, "img/sec/core": 553.490824434609, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 28.548662801014448, "core_hours": 28.548662801014448} {"step": 54550, "l2_params": 341.37231953817667, "train/loss": 2.6600483059883118, "l2_grads": 1.9765625, "lr": 0.000602642172609735, "uptime": 102946.193885371, "examples_seen": 55859200.0, "progress": 0.4844453522552685, "epoch": 43.60024883563189, "img/sec/core": 553.3555982030482, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 28.574364578078608, "core_hours": 28.574364578078608} {"step": 54600, "l2_params": 341.40757007753945, "train/loss": 4.12756621837616, "l2_grads": 1.7109375, "lr": 0.0006018928824679155, "uptime": 103038.752335579, "examples_seen": 55910400.0, "progress": 0.4848893901583439, "epoch": 43.64021240010084, "img/sec/core": 553.163972440559, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 28.600075258691945, "core_hours": 28.600075258691945} {"step": 54650, "l2_params": 341.40755005473295, "train/loss": 3.5261167883872986, "l2_grads": 1.765625, "lr": 0.0006011433535101074, "uptime": 103131.414714066, "examples_seen": 55961600.0, "progress": 0.4853334280614193, "epoch": 43.680175964569806, "img/sec/core": 552.5435547413846, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 28.62581480827167, "core_hours": 28.62581480827167} {"step": 54700, "l2_params": 341.4105076965631, "train/loss": 2.4776676297187805, "l2_grads": 2.125, "lr": 0.0006003935874930524, "uptime": 103224.15206449, "examples_seen": 56012800.0, "progress": 0.4857774659644947, "epoch": 43.72013952903876, "img/sec/core": 552.0968602824398, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 28.651575183389447, "core_hours": 28.651575183389447} {"step": 54750, "l2_params": 341.40752145072173, "train/loss": 3.544952929019928, "l2_grads": 1.7734375, "lr": 0.0005996435861740487, "uptime": 103316.883610995, "examples_seen": 56064000.0, "progress": 0.4862215038675701, "epoch": 43.760103093507716, "img/sec/core": 552.1314151407637, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 28.677333946307503, "core_hours": 28.677333946307503} {"step": 54800, "l2_params": 341.40752145072173, "train/loss": 4.282261252403259, "l2_grads": 1.8046875, "lr": 0.0005988933513109446, "uptime": 103409.602405304, "examples_seen": 56115200.0, "progress": 0.4866655417706455, "epoch": 43.80006665797667, "img/sec/core": 552.2073532294897, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 28.70308916694889, "core_hours": 28.70308916694889} {"step": 54850, "l2_params": 341.40753575272765, "train/loss": 3.4593080282211304, "l2_grads": 1.8984375, "lr": 0.0005981428846621377, "uptime": 103502.495801815, "examples_seen": 56166400.0, "progress": 0.4871095796737209, "epoch": 43.84003022244563, "img/sec/core": 551.1694256322584, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 28.728892888201944, "core_hours": 28.728892888201944} {"step": 54900, "l2_params": 341.4075271715241, "train/loss": 2.529106080532074, "l2_grads": 2.109375, "lr": 0.0005973921879865662, "uptime": 103595.492967849, "examples_seen": 56217600.0, "progress": 0.4875536175767963, "epoch": 43.87999378691459, "img/sec/core": 550.5544113170535, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 28.7547254343225, "core_hours": 28.7547254343225} {"step": 54950, "l2_params": 341.4075185903204, "train/loss": 2.3871744871139526, "l2_grads": 2.03125, "lr": 0.0005966412630437104, "uptime": 103688.538990217, "examples_seen": 56268800.0, "progress": 0.4879976554798718, "epoch": 43.919957351383545, "img/sec/core": 550.2653278127598, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 28.780571551646947, "core_hours": 28.780571551646947} {"step": 55000, "l2_params": 341.407552915134, "train/loss": 2.3066744804382324, "l2_grads": 1.921875, "lr": 0.0005958901115935834, "uptime": 103781.582492229, "examples_seen": 56320000.0, "progress": 0.4884416933829472, "epoch": 43.9599209158525, "img/sec/core": 550.2802333621693, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 28.8064169688725, "core_hours": 28.8064169688725, "val/acc@1": 0.6387316645408163, "val/loss": 1.5124879886909408, "z/secs/eval/val": 31.64279088100011} {"step": 55050, "l2_params": 341.410521998444, "train/loss": 2.3030614852905273, "l2_grads": 1.9140625, "lr": 0.0005951387353967295, "uptime": 103906.152501769, "examples_seen": 56371200.0, "progress": 0.4888857312860226, "epoch": 43.999884480321455, "img/sec/core": 411.01385629710023, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 28.84101974930028, "core_hours": 28.84101974930028} {"step": 55100, "l2_params": 341.4075586359359, "train/loss": 4.906528115272522, "l2_grads": 1.765625, "lr": 0.0005943871362142208, "uptime": 103999.092936218, "examples_seen": 56422400.0, "progress": 0.489329769189098, "epoch": 44.03984804479041, "img/sec/core": 550.8904741358157, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 28.86683653664722, "core_hours": 28.86683653664722} {"step": 55150, "l2_params": 341.4105391607002, "train/loss": 2.3524361848831177, "l2_grads": 1.9921875, "lr": 0.000593635315807651, "uptime": 104092.11301217301, "examples_seen": 56473600.0, "progress": 0.4897738070921734, "epoch": 44.07981160925937, "img/sec/core": 550.4188152325896, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 28.892675446634723, "core_hours": 28.892675446634723} {"step": 55200, "l2_params": 341.4105448814521, "train/loss": 3.178613066673279, "l2_grads": 1.7734375, "lr": 0.0005928832759391329, "uptime": 104185.145511371, "examples_seen": 56524800.0, "progress": 0.4902178449952488, "epoch": 44.11977517372833, "img/sec/core": 550.345314179283, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 28.918517807523056, "core_hours": 28.918517807523056} {"step": 55250, "l2_params": 341.4106135304672, "train/loss": 2.387741506099701, "l2_grads": 2.03125, "lr": 0.0005921310183712936, "uptime": 104278.139504659, "examples_seen": 56576000.0, "progress": 0.4906618828983242, "epoch": 44.159738738197284, "img/sec/core": 550.5731949958376, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 28.94434947232528, "core_hours": 28.94434947232528} {"step": 55300, "l2_params": 341.410521998444, "train/loss": 2.7517279982566833, "l2_grads": 1.8359375, "lr": 0.0005913785448672703, "uptime": 104371.209817988, "examples_seen": 56627200.0, "progress": 0.4911059208013996, "epoch": 44.19970230266624, "img/sec/core": 550.1217108726553, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 28.97020233713889, "core_hours": 28.97020233713889} {"step": 55350, "l2_params": 341.4106936209673, "train/loss": 4.369813799858093, "l2_grads": 1.828125, "lr": 0.0005906258571907061, "uptime": 104464.238467017, "examples_seen": 56678400.0, "progress": 0.491549958704475, "epoch": 44.239665867135194, "img/sec/core": 550.3680912751761, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 28.996043628535833, "core_hours": 28.996043628535833} {"step": 55400, "l2_params": 341.41052485882005, "train/loss": 3.9104251861572266, "l2_grads": 1.7421875, "lr": 0.000589872957105747, "uptime": 104557.214653988, "examples_seen": 56729600.0, "progress": 0.49199399660755044, "epoch": 44.27962943160416, "img/sec/core": 550.6786379179719, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 29.02187034713889, "core_hours": 29.02187034713889} {"step": 55450, "l2_params": 341.45738318456375, "train/loss": 3.8326817750930786, "l2_grads": 1.65625, "lr": 0.0005891198463770357, "uptime": 104650.231439264, "examples_seen": 56780800.0, "progress": 0.49243803451062584, "epoch": 44.31959299607311, "img/sec/core": 550.4382875422297, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 29.04770834304889, "core_hours": 29.04770834304889} {"step": 55500, "l2_params": 341.4604033138396, "train/loss": 3.730759918689728, "l2_grads": 1.84375, "lr": 0.0005883665267697093, "uptime": 104743.28954767801, "examples_seen": 56832000.0, "progress": 0.49288207241370124, "epoch": 44.35955656054207, "img/sec/core": 550.1938613689852, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 29.073557817608336, "core_hours": 29.073557817608336} {"step": 55550, "l2_params": 341.4693033879473, "train/loss": 2.6777143478393555, "l2_grads": 1.921875, "lr": 0.0005876130000493937, "uptime": 104836.24586320101, "examples_seen": 56883200.0, "progress": 0.49332611031677664, "epoch": 44.39952012501102, "img/sec/core": 550.7963575356241, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 29.099379016364722, "core_hours": 29.099379016364722} {"step": 55600, "l2_params": 341.4692175914251, "train/loss": 2.4496747851371765, "l2_grads": 2.21875, "lr": 0.000586859267982201, "uptime": 104929.262385298, "examples_seen": 56934400.0, "progress": 0.49377014821985205, "epoch": 44.439483689479985, "img/sec/core": 550.4398449407806, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 29.125216939169444, "core_hours": 29.125216939169444} {"step": 55650, "l2_params": 341.4692290309626, "train/loss": 2.404751777648926, "l2_grads": 2.09375, "lr": 0.0005861053323347246, "uptime": 105022.47766351, "examples_seen": 56985600.0, "progress": 0.49421418612292745, "epoch": 44.47944725394894, "img/sec/core": 549.2661823478977, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 29.151110072006112, "core_hours": 29.151110072006112} {"step": 55700, "l2_params": 341.46929194841226, "train/loss": 2.4179210662841797, "l2_grads": 1.9453125, "lr": 0.0005853511948740343, "uptime": 105115.48053898901, "examples_seen": 57036800.0, "progress": 0.49465822402600285, "epoch": 44.519410818417896, "img/sec/core": 550.5206127906754, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 29.176944204083615, "core_hours": 29.176944204083615} {"step": 55750, "l2_params": 341.4810229902974, "train/loss": 2.291414260864258, "l2_grads": 2.15625, "lr": 0.0005845968573676734, "uptime": 105208.517264533, "examples_seen": 57088000.0, "progress": 0.49510226192907825, "epoch": 44.55937438288685, "img/sec/core": 550.32031383983, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 29.202787738956943, "core_hours": 29.202787738956943} {"step": 55800, "l2_params": 341.50441523500103, "train/loss": 2.3889987468719482, "l2_grads": 1.9765625, "lr": 0.0005838423215836547, "uptime": 105301.607583205, "examples_seen": 57139200.0, "progress": 0.49554629983215365, "epoch": 44.59933794735581, "img/sec/core": 550.0034883369965, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 29.22864616081028, "core_hours": 29.22864616081028} {"step": 55850, "l2_params": 341.50438377951315, "train/loss": 2.2727226316928864, "l2_grads": 1.9296875, "lr": 0.0005830875892904548, "uptime": 105394.60764671401, "examples_seen": 57190400.0, "progress": 0.4959903377352291, "epoch": 44.63930151182477, "img/sec/core": 550.5372584507874, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 29.254479511785004, "core_hours": 29.254479511785004} {"step": 55900, "l2_params": 341.5043437452517, "train/loss": 4.263098359107971, "l2_grads": 1.7578125, "lr": 0.000582332662257011, "uptime": 105487.719933015, "examples_seen": 57241600.0, "progress": 0.4964343756383045, "epoch": 44.679265076293724, "img/sec/core": 549.8737280973935, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 29.280344035757498, "core_hours": 29.280344035757498} {"step": 55950, "l2_params": 341.50434088566135, "train/loss": 2.343392312526703, "l2_grads": 2.1875, "lr": 0.0005815775422527176, "uptime": 105580.798528012, "examples_seen": 57292800.0, "progress": 0.4968784135413799, "epoch": 44.71922864076268, "img/sec/core": 550.0727637933242, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 29.306199201034442, "core_hours": 29.306199201034442} {"step": 56000, "l2_params": 341.5043237281191, "train/loss": 2.3771554231643677, "l2_grads": 1.9609375, "lr": 0.0005808222310474211, "uptime": 105673.86983427001, "examples_seen": 57344000.0, "progress": 0.4973224514444553, "epoch": 44.759192205231635, "img/sec/core": 550.1158419123097, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 29.33205234166167, "core_hours": 29.33205234166167} {"step": 56050, "l2_params": 341.50439235828287, "train/loss": 3.439169764518738, "l2_grads": 1.8359375, "lr": 0.0005800667304114149, "uptime": 105767.118572131, "examples_seen": 57395200.0, "progress": 0.4977664893475307, "epoch": 44.79915576970059, "img/sec/core": 549.0690938500788, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 29.35795476884528, "core_hours": 29.35795476884528} {"step": 56100, "l2_params": 341.5043866391031, "train/loss": 3.024785578250885, "l2_grads": 1.8671875, "lr": 0.0005793110421154371, "uptime": 105860.241833087, "examples_seen": 57446400.0, "progress": 0.4982105272506061, "epoch": 44.83911933416955, "img/sec/core": 549.8089250138479, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 29.383822341333055, "core_hours": 29.383822341333055} {"step": 56150, "l2_params": 341.5043580432027, "train/loss": 2.4141902327537537, "l2_grads": 2.09375, "lr": 0.0005785551679306671, "uptime": 105953.311777676, "examples_seen": 57497600.0, "progress": 0.4986545651536815, "epoch": 44.87908289863851, "img/sec/core": 550.123890436356, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 29.40967510371889, "core_hours": 29.40967510371889} {"step": 56200, "l2_params": 341.5042722554873, "train/loss": 2.360741376876831, "l2_grads": 1.8046875, "lr": 0.0005777991096287176, "uptime": 106046.416648205, "examples_seen": 57548800.0, "progress": 0.4990986030567569, "epoch": 44.91904646310746, "img/sec/core": 549.9175253570827, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 29.435537567754725, "core_hours": 29.435537567754725} {"step": 56250, "l2_params": 341.51607930209525, "train/loss": 2.410081207752228, "l2_grads": 2.09375, "lr": 0.0005770428689816351, "uptime": 106139.514429417, "examples_seen": 57600000.0, "progress": 0.4995426409598323, "epoch": 44.95901002757642, "img/sec/core": 549.9594011097926, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 29.46139806253583, "core_hours": 29.46139806253583} {"step": 56300, "l2_params": 341.53954062816797, "train/loss": 4.694007754325867, "l2_grads": 1.8828125, "lr": 0.0005762864477618915, "uptime": 106232.696814536, "examples_seen": 57651200.0, "progress": 0.49998667886290776, "epoch": 44.998973592045374, "img/sec/core": 549.4600716070441, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 29.487282058402222, "core_hours": 29.487282058402222} {"step": 56350, "l2_params": 341.5394891608436, "train/loss": 3.1497945189476013, "l2_grads": 1.8828125, "lr": 0.0005755298477423831, "uptime": 106325.901858494, "examples_seen": 57702400.0, "progress": 0.5004307167659832, "epoch": 45.038937156514336, "img/sec/core": 549.3264937793369, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 29.513172348390558, "core_hours": 29.513172348390558} {"step": 56400, "l2_params": 341.5394891608436, "train/loss": 3.2869380116462708, "l2_grads": 1.8046875, "lr": 0.000574773070696424, "uptime": 106419.152496283, "examples_seen": 57753600.0, "progress": 0.5008747546690585, "epoch": 45.07890072098329, "img/sec/core": 549.057906883747, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 29.539075303331945, "core_hours": 29.539075303331945} {"step": 56450, "l2_params": 341.53941481913915, "train/loss": 3.0522600412368774, "l2_grads": 1.984375, "lr": 0.0005740161183977454, "uptime": 106512.40196758401, "examples_seen": 57804800.0, "progress": 0.501318792572134, "epoch": 45.11886428545225, "img/sec/core": 549.0647752278022, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 29.56497793424889, "core_hours": 29.56497793424889} {"step": 56500, "l2_params": 341.5395549246456, "train/loss": 3.2492690086364746, "l2_grads": 1.875, "lr": 0.0005732589926204876, "uptime": 106605.59731173501, "examples_seen": 57856000.0, "progress": 0.5017628304752093, "epoch": 45.1588278499212, "img/sec/core": 549.3836678905797, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 29.59086552984639, "core_hours": 29.59086552984639} {"step": 56550, "l2_params": 341.53942339702894, "train/loss": 2.5450364351272583, "l2_grads": 1.984375, "lr": 0.000572501695139198, "uptime": 106698.761837058, "examples_seen": 57907200.0, "progress": 0.5022068683782848, "epoch": 45.198791414390165, "img/sec/core": 549.5654040257643, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 29.616744564658333, "core_hours": 29.616744564658333} {"step": 56600, "l2_params": 341.55112915656565, "train/loss": 2.595711350440979, "l2_grads": 1.984375, "lr": 0.0005717442277288265, "uptime": 106791.98542534301, "examples_seen": 57958400.0, "progress": 0.5026509062813602, "epoch": 45.23875497885912, "img/sec/core": 549.217220039515, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 29.642640005848612, "core_hours": 29.642640005848612} {"step": 56650, "l2_params": 341.55109770537996, "train/loss": 2.2641456723213196, "l2_grads": 2.0625, "lr": 0.0005709865921647213, "uptime": 106886.137494801, "examples_seen": 58009600.0, "progress": 0.5030949441844356, "epoch": 45.278718543328075, "img/sec/core": 543.8011112739473, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 29.668793358475835, "core_hours": 29.668793358475835} {"step": 56700, "l2_params": 341.5510862685844, "train/loss": 4.700376272201538, "l2_grads": 1.8984375, "lr": 0.0005702287902226237, "uptime": 106979.251564844, "examples_seen": 58060800.0, "progress": 0.503538982087511, "epoch": 45.31868210779703, "img/sec/core": 549.8631944276261, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 29.69465837793222, "core_hours": 29.69465837793222} {"step": 56750, "l2_params": 341.56283451493226, "train/loss": 3.812779426574707, "l2_grads": 1.8359375, "lr": 0.0005694708236786665, "uptime": 107072.387454582, "examples_seen": 58112000.0, "progress": 0.5039830199905864, "epoch": 45.358645672265986, "img/sec/core": 549.7343735484959, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 29.720529458415, "core_hours": 29.720529458415} {"step": 56800, "l2_params": 341.56278305111783, "train/loss": 2.92935311794281, "l2_grads": 1.9375, "lr": 0.0005687126943093671, "uptime": 107165.552633101, "examples_seen": 58163200.0, "progress": 0.5044270578936618, "epoch": 45.39860923673495, "img/sec/core": 549.5615509345693, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 29.74640867467028, "core_hours": 29.74640867467028} {"step": 56850, "l2_params": 341.5628259376304, "train/loss": 2.203378677368164, "l2_grads": 2.046875, "lr": 0.0005679544038916256, "uptime": 107258.80918838701, "examples_seen": 58214400.0, "progress": 0.5048710957967372, "epoch": 45.438572801203904, "img/sec/core": 549.023066989528, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 29.772313273360837, "core_hours": 29.772313273360837} {"step": 56900, "l2_params": 341.56291171063936, "train/loss": 2.4870144724845886, "l2_grads": 1.9921875, "lr": 0.0005671959542027191, "uptime": 107353.732384624, "examples_seen": 58265600.0, "progress": 0.5053151336998126, "epoch": 45.47853636567286, "img/sec/core": 539.383438713635, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 29.798680827871113, "core_hours": 29.798680827871113} {"step": 56950, "l2_params": 341.5629002742394, "train/loss": 4.697682738304138, "l2_grads": 1.7578125, "lr": 0.0005664373470202969, "uptime": 107446.94808135601, "examples_seen": 58316800.0, "progress": 0.505759171602888, "epoch": 45.518499930141815, "img/sec/core": 549.2637162515699, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 29.824574076963337, "core_hours": 29.824574076963337} {"step": 57000, "l2_params": 341.5628802605386, "train/loss": 3.4482405185699463, "l2_grads": 1.859375, "lr": 0.0005656785841223787, "uptime": 107540.3841072, "examples_seen": 58368000.0, "progress": 0.5062032095059634, "epoch": 45.55846349461077, "img/sec/core": 547.9685114763283, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 29.85052852858667, "core_hours": 29.85052852858667} {"step": 57050, "l2_params": 341.5746166652317, "train/loss": 2.286449432373047, "l2_grads": 2.046875, "lr": 0.0005649196672873495, "uptime": 107633.88451486001, "examples_seen": 58419200.0, "progress": 0.5066472474090389, "epoch": 45.59842705907973, "img/sec/core": 547.591195390079, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 29.87650086404778, "core_hours": 29.87650086404778} {"step": 57100, "l2_params": 341.57455948518765, "train/loss": 2.928829312324524, "l2_grads": 1.9453125, "lr": 0.0005641605982939548, "uptime": 107728.342518827, "examples_seen": 58470400.0, "progress": 0.5070912853121142, "epoch": 45.63839062354869, "img/sec/core": 542.0398256339325, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 29.902739198483058, "core_hours": 29.902739198483058} {"step": 57150, "l2_params": 341.57455948518765, "train/loss": 2.2598013281822205, "l2_grads": 2.125, "lr": 0.0005634013789212947, "uptime": 107821.42161628601, "examples_seen": 58521600.0, "progress": 0.5075353232151897, "epoch": 45.67835418801764, "img/sec/core": 550.069794376228, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 29.92859450333278, "core_hours": 29.92859450333278} {"step": 57200, "l2_params": 341.5744737151036, "train/loss": 2.3653258085250854, "l2_grads": 2.015625, "lr": 0.0005626420109488253, "uptime": 107914.57054370901, "examples_seen": 58572800.0, "progress": 0.507979361118265, "epoch": 45.7183177524866, "img/sec/core": 549.6574294140448, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 29.954469205394723, "core_hours": 29.954469205394723} {"step": 57250, "l2_params": 341.5744737151036, "train/loss": 4.667913198471069, "l2_grads": 1.9296875, "lr": 0.0005618824961563485, "uptime": 108008.677315633, "examples_seen": 58624000.0, "progress": 0.5084233990213405, "epoch": 45.758281316955554, "img/sec/core": 544.0628655433187, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 29.98060997537361, "core_hours": 29.98060997537361} {"step": 57300, "l2_params": 341.57449086912214, "train/loss": 3.014960765838623, "l2_grads": 1.90625, "lr": 0.0005611228363240106, "uptime": 108101.783929668, "examples_seen": 58675200.0, "progress": 0.5088674369244158, "epoch": 45.798244881424516, "img/sec/core": 549.9072276514379, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 30.006472923716668, "core_hours": 30.006472923716668} {"step": 57350, "l2_params": 341.5745080231398, "train/loss": 2.905732810497284, "l2_grads": 1.8203125, "lr": 0.0005603630332322988, "uptime": 108196.02754689, "examples_seen": 58726400.0, "progress": 0.5093114748274913, "epoch": 45.83820844589347, "img/sec/core": 543.2728656773774, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 30.032651706278333, "core_hours": 30.032651706278333} {"step": 57400, "l2_params": 341.574530895162, "train/loss": 2.378881573677063, "l2_grads": 2.0625, "lr": 0.0005596030886620354, "uptime": 108289.356492765, "examples_seen": 58777600.0, "progress": 0.5097555127305666, "epoch": 45.87817201036243, "img/sec/core": 548.5972172939612, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 30.058576413465833, "core_hours": 30.058576413465833} {"step": 57450, "l2_params": 341.5746566912569, "train/loss": 2.4712181091308594, "l2_grads": 2.015625, "lr": 0.0005588430043943738, "uptime": 108382.686361254, "examples_seen": 58828800.0, "progress": 0.5101995506336421, "epoch": 45.91813557483138, "img/sec/core": 548.5917941267935, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 30.084501376935002, "core_hours": 30.084501376935002} {"step": 57500, "l2_params": 341.59802251238955, "train/loss": 2.2302818298339844, "l2_grads": 1.984375, "lr": 0.0005580827822107959, "uptime": 108476.060174162, "examples_seen": 58880000.0, "progress": 0.5106435885367175, "epoch": 45.958099139300344, "img/sec/core": 548.3336109498503, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 30.110438547187226, "core_hours": 30.110438547187226, "val/acc@1": 0.6451690051020408, "val/loss": 1.4817921683496358, "z/secs/eval/val": 31.768423852990963} {"step": 57550, "l2_params": 341.5979224541625, "train/loss": 2.457643210887909, "l2_grads": 2.328125, "lr": 0.000557322423893106, "uptime": 108600.57523067501, "examples_seen": 58931200.0, "progress": 0.5110876264397929, "epoch": 45.9980627037693, "img/sec/core": 411.19525167346677, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 30.14502606288528, "core_hours": 30.14502606288528} {"step": 57600, "l2_params": 341.59790816012764, "train/loss": 4.843990802764893, "l2_grads": 1.8046875, "lr": 0.0005565619312234284, "uptime": 108693.620372251, "examples_seen": 58982400.0, "progress": 0.5115316643428683, "epoch": 46.038026268238255, "img/sec/core": 550.2705367822512, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 30.170871935545275, "core_hours": 30.170871935545275} {"step": 57650, "l2_params": 341.5980196535835, "train/loss": 2.427259862422943, "l2_grads": 2.109375, "lr": 0.0005558013059842014, "uptime": 108787.71926622301, "examples_seen": 59033600.0, "progress": 0.5119757022459437, "epoch": 46.07798983270721, "img/sec/core": 544.1084144435171, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 30.197010517204166, "core_hours": 30.197010517204166} {"step": 57700, "l2_params": 341.59786241921216, "train/loss": 4.873782753944397, "l2_grads": 1.828125, "lr": 0.000555040549958175, "uptime": 108880.73970099201, "examples_seen": 59084800.0, "progress": 0.5124197401490191, "epoch": 46.117953397176166, "img/sec/core": 550.4166920649798, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 30.222849526862223, "core_hours": 30.222849526862223} {"step": 57750, "l2_params": 341.59803966522554, "train/loss": 2.3393778204917908, "l2_grads": 2.125, "lr": 0.0005542796649284034, "uptime": 108975.119218965, "examples_seen": 59136000.0, "progress": 0.5128637780520945, "epoch": 46.15791696164513, "img/sec/core": 542.4905858774457, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 30.2490660596325, "core_hours": 30.2490660596325} {"step": 57800, "l2_params": 341.59803108880766, "train/loss": 2.4782094955444336, "l2_grads": 2.140625, "lr": 0.0005535186526782457, "uptime": 109068.15490241701, "examples_seen": 59187200.0, "progress": 0.5133078159551699, "epoch": 46.19788052611408, "img/sec/core": 550.3264779734999, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 30.274909305035838, "core_hours": 30.274909305035838} {"step": 57850, "l2_params": 341.5980025007465, "train/loss": 3.184758484363556, "l2_grads": 1.8046875, "lr": 0.0005527575149913587, "uptime": 109162.301939832, "examples_seen": 59238400.0, "progress": 0.5137518538582453, "epoch": 46.23784409058304, "img/sec/core": 543.8301767724645, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 30.301061259873332, "core_hours": 30.301061259873332} {"step": 57900, "l2_params": 341.6448208209075, "train/loss": 2.341963827610016, "l2_grads": 2.171875, "lr": 0.0005519962536516926, "uptime": 109255.428858129, "examples_seen": 59289600.0, "progress": 0.5141958917613207, "epoch": 46.277807655051994, "img/sec/core": 549.7873325595687, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 30.32692984828917, "core_hours": 30.32692984828917} {"step": 57950, "l2_params": 341.6506519366676, "train/loss": 2.937114953994751, "l2_grads": 2.0, "lr": 0.0005512348704434879, "uptime": 109350.002277399, "examples_seen": 59340800.0, "progress": 0.5146399296643962, "epoch": 46.31777121952095, "img/sec/core": 541.3783322544974, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 30.353200242530832, "core_hours": 30.353200242530832} {"step": 58000, "l2_params": 341.65070910397657, "train/loss": 3.849705696105957, "l2_grads": 1.8046875, "lr": 0.0005504733671512701, "uptime": 109443.147736378, "examples_seen": 59392000.0, "progress": 0.5150839675674715, "epoch": 46.35773478398991, "img/sec/core": 549.6778969283591, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 30.37907398113611, "core_hours": 30.37907398113611} {"step": 58050, "l2_params": 341.6506919537849, "train/loss": 2.3078829050064087, "l2_grads": 1.9921875, "lr": 0.0005497117455598471, "uptime": 109536.61845497301, "examples_seen": 59443200.0, "progress": 0.515528005470547, "epoch": 46.39769834845887, "img/sec/core": 547.7651265509078, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 30.405038069634724, "core_hours": 30.405038069634724} {"step": 58100, "l2_params": 341.6507719880053, "train/loss": 2.3451988101005554, "l2_grads": 1.9609375, "lr": 0.0005489500074543025, "uptime": 109629.815785472, "examples_seen": 59494400.0, "progress": 0.5159720433736223, "epoch": 46.43766191292782, "img/sec/core": 549.3719586802117, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 30.430926216995555, "core_hours": 30.430926216995555} {"step": 58150, "l2_params": 341.6507434043573, "train/loss": 2.236907184123993, "l2_grads": 2.015625, "lr": 0.000548188154619994, "uptime": 109725.08870848801, "examples_seen": 59545600.0, "progress": 0.5164160812766978, "epoch": 46.47762547739678, "img/sec/core": 537.4034760264408, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 30.457390917833333, "core_hours": 30.457390917833333} {"step": 58200, "l2_params": 341.65072625416735, "train/loss": 2.3741493225097656, "l2_grads": 2.15625, "lr": 0.0005474261888425485, "uptime": 109818.554026838, "examples_seen": 59596800.0, "progress": 0.5168601191797731, "epoch": 46.51758904186573, "img/sec/core": 547.7967753587099, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 30.48335350626389, "core_hours": 30.48335350626389} {"step": 58250, "l2_params": 341.65070910397657, "train/loss": 2.3596699833869934, "l2_grads": 2.046875, "lr": 0.0005466641119078575, "uptime": 109913.070085652, "examples_seen": 59648000.0, "progress": 0.5173041570828486, "epoch": 46.557552606334696, "img/sec/core": 541.7068870884483, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 30.509607967045554, "core_hours": 30.509607967045554} {"step": 58300, "l2_params": 341.65074912108713, "train/loss": 2.3110901713371277, "l2_grads": 2.125, "lr": 0.000545901925602073, "uptime": 110006.25356002801, "examples_seen": 59699200.0, "progress": 0.517748194985924, "epoch": 46.59751617080365, "img/sec/core": 549.4536487596384, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 30.535492265483338, "core_hours": 30.535492265483338} {"step": 58350, "l2_params": 341.6507662712759, "train/loss": 4.71521520614624, "l2_grads": 1.8359375, "lr": 0.0005451396317116024, "uptime": 110100.571769213, "examples_seen": 59750400.0, "progress": 0.5181922328889994, "epoch": 46.637479735272606, "img/sec/core": 542.8432159857938, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 30.561691768034724, "core_hours": 30.561691768034724} {"step": 58400, "l2_params": 341.6741640437568, "train/loss": 2.529654324054718, "l2_grads": 1.953125, "lr": 0.0005443772320231064, "uptime": 110194.173485741, "examples_seen": 59801600.0, "progress": 0.5186362707920749, "epoch": 46.67744329974156, "img/sec/core": 546.9985156167576, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 30.587692244848053, "core_hours": 30.587692244848053} {"step": 58450, "l2_params": 341.6741383202349, "train/loss": 3.783897578716278, "l2_grads": 1.9296875, "lr": 0.0005436147283234936, "uptime": 110288.10888914601, "examples_seen": 59852800.0, "progress": 0.5190803086951502, "epoch": 46.717406864210524, "img/sec/core": 545.0554119542124, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 30.613785412460558, "core_hours": 30.613785412460558} {"step": 58500, "l2_params": 341.6741840509391, "train/loss": 2.4521511793136597, "l2_grads": 1.8984375, "lr": 0.0005428521223999158, "uptime": 110382.557726105, "examples_seen": 59904000.0, "progress": 0.5195243465982257, "epoch": 46.75737042867948, "img/sec/core": 542.0924348939079, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 30.640021200504723, "core_hours": 30.640021200504723} {"step": 58550, "l2_params": 341.6741497529115, "train/loss": 2.3498347401618958, "l2_grads": 2.109375, "lr": 0.000542089416039764, "uptime": 110475.736809611, "examples_seen": 59955200.0, "progress": 0.519968384501301, "epoch": 46.797333993148435, "img/sec/core": 549.4795406171394, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 30.665904279256388, "core_hours": 30.665904279256388} {"step": 58600, "l2_params": 341.6741954836142, "train/loss": 2.1801863312721252, "l2_grads": 2.140625, "lr": 0.0005413266110306665, "uptime": 110569.00638668, "examples_seen": 60006400.0, "progress": 0.5204124224043765, "epoch": 46.83729755761739, "img/sec/core": 548.946415422473, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 30.691812495108888, "core_hours": 30.691812495108888} {"step": 58650, "l2_params": 341.67416690192573, "train/loss": 2.3752554655075073, "l2_grads": 1.9921875, "lr": 0.0005405637091604805, "uptime": 110662.25071206, "examples_seen": 60057600.0, "progress": 0.5208564603074518, "epoch": 46.877261122086345, "img/sec/core": 549.0950767389143, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 30.717713696603333, "core_hours": 30.717713696603333} {"step": 58700, "l2_params": 341.6741954836142, "train/loss": 4.6853331327438354, "l2_grads": 1.8125, "lr": 0.0005398007122172922, "uptime": 110756.99873216801, "examples_seen": 60108800.0, "progress": 0.5213004982105273, "epoch": 46.91722468655531, "img/sec/core": 540.3806849118013, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 30.74403259107778, "core_hours": 30.74403259107778} {"step": 58750, "l2_params": 341.6741125967111, "train/loss": 2.247451961040497, "l2_grads": 2.0625, "lr": 0.0005390376219894087, "uptime": 110852.01910422201, "examples_seen": 60160000.0, "progress": 0.5217445361136026, "epoch": 46.95718825102426, "img/sec/core": 538.8318198849236, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 30.77042713887056, "core_hours": 30.77042713887056} {"step": 58800, "l2_params": 341.67706507296475, "train/loss": 2.381312847137451, "l2_grads": 2.015625, "lr": 0.0005382744402653575, "uptime": 110945.894331185, "examples_seen": 60211200.0, "progress": 0.5221885740166781, "epoch": 46.99715181549322, "img/sec/core": 545.404806533088, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 30.796503590804722, "core_hours": 30.796503590804722} {"step": 58850, "l2_params": 341.67708793812176, "train/loss": 3.144585371017456, "l2_grads": 1.859375, "lr": 0.0005375111688338793, "uptime": 111038.994097438, "examples_seen": 60262400.0, "progress": 0.5226326119197535, "epoch": 47.037115379962174, "img/sec/core": 549.9476750657334, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 30.82236463698611, "core_hours": 30.82236463698611} {"step": 58900, "l2_params": 341.67414403657324, "train/loss": 4.873961687088013, "l2_grads": 1.921875, "lr": 0.0005367478094839259, "uptime": 111132.25677552201, "examples_seen": 60313600.0, "progress": 0.5230766498228289, "epoch": 47.07707894443113, "img/sec/core": 548.9870230177291, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 30.84827093645389, "core_hours": 30.84827093645389} {"step": 58950, "l2_params": 341.67417261826364, "train/loss": 2.1836554408073425, "l2_grads": 2.078125, "lr": 0.0005359843640046549, "uptime": 111225.509192464, "examples_seen": 60364800.0, "progress": 0.5235206877259043, "epoch": 47.11704250890009, "img/sec/core": 549.0474314660291, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 30.87417438560444, "core_hours": 30.87417438560444} {"step": 59000, "l2_params": 341.6770936544108, "train/loss": 3.459478735923767, "l2_grads": 1.78125, "lr": 0.0005352208341854257, "uptime": 111319.552717547, "examples_seen": 60416000.0, "progress": 0.5239647256289797, "epoch": 47.15700607336905, "img/sec/core": 544.4287626905696, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 30.90029758701639, "core_hours": 30.90029758701639} {"step": 59050, "l2_params": 341.674081156846, "train/loss": 3.50342857837677, "l2_grads": 1.796875, "lr": 0.0005344572218157951, "uptime": 111413.76150010001, "examples_seen": 60467200.0, "progress": 0.5244087635320551, "epoch": 47.196969637838, "img/sec/core": 543.4737464226761, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 30.92646669328111, "core_hours": 30.92646669328111} {"step": 59100, "l2_params": 341.6740983058637, "train/loss": 2.2337143421173096, "l2_grads": 2.09375, "lr": 0.0005336935286855137, "uptime": 111507.73030484401, "examples_seen": 60518400.0, "progress": 0.5248528014351305, "epoch": 47.23693320230696, "img/sec/core": 544.8616712693629, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 30.952569139043337, "core_hours": 30.952569139043337} {"step": 59150, "l2_params": 341.6740468588081, "train/loss": 2.960347056388855, "l2_grads": 2.015625, "lr": 0.0005329297565845217, "uptime": 111600.892692953, "examples_seen": 60569600.0, "progress": 0.5252968393382059, "epoch": 47.27689676677591, "img/sec/core": 549.5780114621044, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 30.97844758018472, "core_hours": 30.97844758018472} {"step": 59200, "l2_params": 341.67417261826364, "train/loss": 2.7226593494415283, "l2_grads": 1.8984375, "lr": 0.0005321659073029437, "uptime": 111695.23699513101, "examples_seen": 60620800.0, "progress": 0.5257408772412813, "epoch": 47.316860331244875, "img/sec/core": 542.693080747945, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 31.004654330789723, "core_hours": 31.004654330789723} {"step": 59250, "l2_params": 341.674081156846, "train/loss": 2.2319039702415466, "l2_grads": 2.109375, "lr": 0.0005314019826310855, "uptime": 111788.409735944, "examples_seen": 60672000.0, "progress": 0.5261849151443567, "epoch": 47.35682389571383, "img/sec/core": 549.5169461931163, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 31.03053564768222, "core_hours": 31.03053564768222} {"step": 59300, "l2_params": 341.6771479591516, "train/loss": 4.906989097595215, "l2_grads": 1.9765625, "lr": 0.00053063798435943, "uptime": 111881.601485818, "examples_seen": 60723200.0, "progress": 0.5266289530474322, "epoch": 47.396787460182786, "img/sec/core": 549.4048568594194, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 31.056422244869445, "core_hours": 31.056422244869445} {"step": 59350, "l2_params": 341.67707936368805, "train/loss": 4.34190559387207, "l2_grads": 1.8828125, "lr": 0.0005298739142786326, "uptime": 111974.814212599, "examples_seen": 60774400.0, "progress": 0.5270729909505075, "epoch": 47.43675102465174, "img/sec/core": 549.2812169339603, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 31.08231466897528, "core_hours": 31.08231466897528} {"step": 59400, "l2_params": 341.7004353231058, "train/loss": 2.4013428688049316, "l2_grads": 2.0625, "lr": 0.0005291097741795154, "uptime": 112067.998137669, "examples_seen": 60825600.0, "progress": 0.527517028853583, "epoch": 47.476714589120704, "img/sec/core": 549.4509912684906, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 31.108199092605833, "core_hours": 31.108199092605833} {"step": 59450, "l2_params": 341.700538209263, "train/loss": 2.7383939027786255, "l2_grads": 1.96875, "lr": 0.0005283455658530663, "uptime": 112161.210848549, "examples_seen": 60876800.0, "progress": 0.5279610667566583, "epoch": 47.51667815358966, "img/sec/core": 549.2813106348875, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 31.134091512294724, "core_hours": 31.134091512294724} {"step": 59500, "l2_params": 341.70049248208585, "train/loss": 2.5233523845672607, "l2_grads": 1.9453125, "lr": 0.0005275812910904326, "uptime": 112254.71113003501, "examples_seen": 60928000.0, "progress": 0.5284051046597338, "epoch": 47.556641718058614, "img/sec/core": 547.59193433726, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 31.160063812707502, "core_hours": 31.160063812707502} {"step": 59550, "l2_params": 341.70049819798334, "train/loss": 2.3423649668693542, "l2_grads": 2.09375, "lr": 0.0005268169516829176, "uptime": 112347.991564314, "examples_seen": 60979200.0, "progress": 0.5288491425628091, "epoch": 47.59660528252757, "img/sec/core": 548.8825217823012, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 31.185975044451663, "core_hours": 31.185975044451663} {"step": 59600, "l2_params": 341.7004353231058, "train/loss": 3.0586531162261963, "l2_grads": 2.046875, "lr": 0.0005260525494219763, "uptime": 112441.441593031, "examples_seen": 61030400.0, "progress": 0.5292931804658846, "epoch": 47.636568846996525, "img/sec/core": 547.8864019940237, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 31.211933385761945, "core_hours": 31.211933385761945} {"step": 59650, "l2_params": 341.7003667323171, "train/loss": 2.8528804183006287, "l2_grads": 1.9375, "lr": 0.0005252880860992101, "uptime": 112536.326619281, "examples_seen": 61081600.0, "progress": 0.5297372183689599, "epoch": 47.67653241146549, "img/sec/core": 539.6004198292026, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 31.238290337498054, "core_hours": 31.238290337498054} {"step": 59700, "l2_params": 341.7237839706947, "train/loss": 3.670093595981598, "l2_grads": 1.8359375, "lr": 0.0005245235635063641, "uptime": 112629.463240651, "examples_seen": 61132800.0, "progress": 0.5301812562720354, "epoch": 47.71649597593444, "img/sec/core": 549.7300551261649, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 31.264161621211944, "core_hours": 31.264161621211944} {"step": 59750, "l2_params": 341.72369823806486, "train/loss": 3.233803153038025, "l2_grads": 1.8203125, "lr": 0.0005237589834353221, "uptime": 112723.76244299501, "examples_seen": 61184000.0, "progress": 0.5306252941751108, "epoch": 47.7564595404034, "img/sec/core": 542.9526308528383, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 31.29035584408528, "core_hours": 31.29035584408528} {"step": 59800, "l2_params": 341.72380111721804, "train/loss": 2.322053372859955, "l2_grads": 2.09375, "lr": 0.0005229943476781026, "uptime": 112816.95419348, "examples_seen": 61235200.0, "progress": 0.5310693320781862, "epoch": 47.79642310487235, "img/sec/core": 549.4048532572813, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 31.316242441442224, "core_hours": 31.316242441442224} {"step": 59850, "l2_params": 341.72370395357416, "train/loss": 2.3502122163772583, "l2_grads": 1.984375, "lr": 0.0005222296580268554, "uptime": 112910.198589663, "examples_seen": 61286400.0, "progress": 0.5315133699812616, "epoch": 47.83638666934131, "img/sec/core": 549.0946597961337, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 31.342143662604165, "core_hours": 31.342143662604165} {"step": 59900, "l2_params": 341.72364679847664, "train/loss": 4.452456474304199, "l2_grads": 1.890625, "lr": 0.0005214649162738554, "uptime": 113004.50665989901, "examples_seen": 61337600.0, "progress": 0.531957407884337, "epoch": 47.87635023381027, "img/sec/core": 542.9015764173107, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 31.368340348780837, "core_hours": 31.368340348780837} {"step": 59950, "l2_params": 341.72367537602656, "train/loss": 4.76478898525238, "l2_grads": 2.015625, "lr": 0.0005207001242115007, "uptime": 113097.7941363, "examples_seen": 61388800.0, "progress": 0.5324014457874124, "epoch": 47.916313798279226, "img/sec/core": 548.8410875209022, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 31.39425353667, "core_hours": 31.39425353667} {"step": 60000, "l2_params": 341.72370395357416, "train/loss": 3.1083951592445374, "l2_grads": 1.890625, "lr": 0.0005199352836323064, "uptime": 113191.118760279, "examples_seen": 61440000.0, "progress": 0.5328454836904878, "epoch": 47.95627736274818, "img/sec/core": 548.622623023049, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 31.420177043330835, "core_hours": 31.420177043330835, "val/acc@1": 0.6485172193877551, "val/loss": 1.4649667630390244, "z/secs/eval/val": 31.865614077993087} {"step": 60050, "l2_params": 341.72371824234705, "train/loss": 2.4421769976615906, "l2_grads": 2.046875, "lr": 0.0005191703963289016, "uptime": 113316.124575987, "examples_seen": 61491200.0, "progress": 0.5332895215935632, "epoch": 47.99624092721714, "img/sec/core": 409.5809439746012, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 31.454900881027502, "core_hours": 31.454900881027502} {"step": 60100, "l2_params": 341.7237296733649, "train/loss": 4.331510543823242, "l2_grads": 1.9453125, "lr": 0.0005184054640940257, "uptime": 113409.28083621101, "examples_seen": 61542400.0, "progress": 0.5337335594966386, "epoch": 48.03620449168609, "img/sec/core": 549.6141630942018, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 31.48077761997861, "core_hours": 31.48077761997861} {"step": 60150, "l2_params": 341.72371252683797, "train/loss": 2.298756182193756, "l2_grads": 2.046875, "lr": 0.0005176404887205218, "uptime": 113503.873638691, "examples_seen": 61593600.0, "progress": 0.534177597399714, "epoch": 48.076168056155055, "img/sec/core": 541.2673972824573, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 31.50705339844528, "core_hours": 31.50705339844528} {"step": 60200, "l2_params": 341.72367823378147, "train/loss": 2.4212117791175842, "l2_grads": 2.0625, "lr": 0.0005168754720013362, "uptime": 113597.109233482, "examples_seen": 61644800.0, "progress": 0.5346216353027895, "epoch": 48.11613162062401, "img/sec/core": 549.1464940484757, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 31.53295217477611, "core_hours": 31.53295217477611} {"step": 60250, "l2_params": 341.7236810915363, "train/loss": 3.22855281829834, "l2_grads": 1.90625, "lr": 0.0005161104157295096, "uptime": 113691.18211373601, "examples_seen": 61696000.0, "progress": 0.5350656732058648, "epoch": 48.156095185092965, "img/sec/core": 544.2588752651395, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 31.559083530402226, "core_hours": 31.559083530402226} {"step": 60300, "l2_params": 341.72371538459254, "train/loss": 2.1881709694862366, "l2_grads": 2.09375, "lr": 0.0005153453216981775, "uptime": 113784.498163679, "examples_seen": 61747200.0, "progress": 0.5355097111089403, "epoch": 48.19605874956192, "img/sec/core": 548.6730313946805, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 31.58500465538639, "core_hours": 31.58500465538639} {"step": 60350, "l2_params": 341.72366680276184, "train/loss": 3.474120855331421, "l2_grads": 1.8125, "lr": 0.0005145801917005631, "uptime": 113878.127417751, "examples_seen": 61798400.0, "progress": 0.5359537490120156, "epoch": 48.236022314030876, "img/sec/core": 546.8376364573661, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 31.611012781517502, "core_hours": 31.611012781517502} {"step": 60400, "l2_params": 341.72371824234705, "train/loss": 2.2770241498947144, "l2_grads": 2.109375, "lr": 0.0005138150275299745, "uptime": 113971.817904945, "examples_seen": 61849600.0, "progress": 0.5363977869150911, "epoch": 48.27598587849984, "img/sec/core": 546.4802407739381, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 31.637037916849167, "core_hours": 31.637037916849167} {"step": 60450, "l2_params": 341.7353833971908, "train/loss": 3.0785031914711, "l2_grads": 1.9296875, "lr": 0.0005130498309797987, "uptime": 114067.072948265, "examples_seen": 61900800.0, "progress": 0.5368418248181664, "epoch": 48.315949442968794, "img/sec/core": 537.504348488867, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 31.663497651104723, "core_hours": 31.663497651104723} {"step": 60500, "l2_params": 341.7354519809512, "train/loss": 2.278236746788025, "l2_grads": 2.125, "lr": 0.0005122846038434993, "uptime": 114160.329624715, "examples_seen": 61952000.0, "progress": 0.5372858627212419, "epoch": 48.35591300743775, "img/sec/core": 549.0223536698173, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 31.689402283451944, "core_hours": 31.689402283451944} {"step": 60550, "l2_params": 341.7354634115766, "train/loss": 2.148639738559723, "l2_grads": 2.046875, "lr": 0.0005115193479146117, "uptime": 114254.68451222501, "examples_seen": 62003200.0, "progress": 0.5377299006243172, "epoch": 48.395876571906705, "img/sec/core": 542.6321979830508, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 31.71561197442695, "core_hours": 31.71561197442695} {"step": 60600, "l2_params": 341.7354748422016, "train/loss": 2.4297555088996887, "l2_grads": 2.140625, "lr": 0.000510754064986739, "uptime": 114347.985539538, "examples_seen": 62054400.0, "progress": 0.5381739385273927, "epoch": 48.43584013637567, "img/sec/core": 548.7613746014019, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 31.741528926458333, "core_hours": 31.741528926458333} {"step": 60650, "l2_params": 341.7471567410986, "train/loss": 2.3131402730941772, "l2_grads": 2.21875, "lr": 0.0005099887568535463, "uptime": 114442.55137277501, "examples_seen": 62105600.0, "progress": 0.5386179764304682, "epoch": 48.47580370084462, "img/sec/core": 541.4217614059289, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 31.76779721346861, "core_hours": 31.76779721346861} {"step": 60700, "l2_params": 341.77058220299625, "train/loss": 2.5758586525917053, "l2_grads": 2.109375, "lr": 0.000509223425308759, "uptime": 114535.873210125, "examples_seen": 62156800.0, "progress": 0.5390620143335435, "epoch": 48.51576726531358, "img/sec/core": 548.639005123497, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 31.793719946065835, "core_hours": 31.793719946065835} {"step": 60750, "l2_params": 341.8173083177986, "train/loss": 2.501448333263397, "l2_grads": 2.078125, "lr": 0.0005084580721461579, "uptime": 114629.471535239, "examples_seen": 62208000.0, "progress": 0.539506052236619, "epoch": 48.55573082978253, "img/sec/core": 547.0183353990641, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 31.819719480819725, "core_hours": 31.819719480819725} {"step": 60800, "l2_params": 341.8173626002635, "train/loss": 2.182374119758606, "l2_grads": 2.125, "lr": 0.0005076926991595728, "uptime": 114724.05104658501, "examples_seen": 62259200.0, "progress": 0.5399500901396943, "epoch": 48.59569439425149, "img/sec/core": 541.3434608759266, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 31.845991567304726, "core_hours": 31.845991567304726} {"step": 60850, "l2_params": 341.8173454584334, "train/loss": 2.4001351594924927, "l2_grads": 2.125, "lr": 0.0005069273081428801, "uptime": 114817.406646474, "examples_seen": 62310400.0, "progress": 0.5403941280427698, "epoch": 48.63565795872045, "img/sec/core": 548.4405869694006, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 31.871923678385, "core_hours": 31.871923678385} {"step": 60900, "l2_params": 341.8173454584334, "train/loss": 3.1046422123908997, "l2_grads": 1.90625, "lr": 0.0005061619008900007, "uptime": 114911.978854422, "examples_seen": 62361600.0, "progress": 0.5408381659458451, "epoch": 48.675621523189406, "img/sec/core": 541.3852664638007, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 31.898193736148336, "core_hours": 31.898193736148336} {"step": 60950, "l2_params": 341.8173568863202, "train/loss": 3.6701443791389465, "l2_grads": 1.7890625, "lr": 0.0005053964791948911, "uptime": 115005.328169044, "examples_seen": 62412800.0, "progress": 0.5412822038489206, "epoch": 48.71558508765836, "img/sec/core": 548.4775138127696, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 31.924124101321112, "core_hours": 31.924124101321112} {"step": 61000, "l2_params": 341.84080039179054, "train/loss": 2.485040843486786, "l2_grads": 2.0625, "lr": 0.0005046310448515427, "uptime": 115100.052461763, "examples_seen": 62464000.0, "progress": 0.5417262417519959, "epoch": 48.75554865212732, "img/sec/core": 540.5160443043682, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 31.950436404854166, "core_hours": 31.950436404854166} {"step": 61050, "l2_params": 341.8408175324445, "train/loss": 2.341675817966461, "l2_grads": 2.25, "lr": 0.0005038655996539759, "uptime": 115193.732198105, "examples_seen": 62515200.0, "progress": 0.5421702796550714, "epoch": 48.79551221659627, "img/sec/core": 546.5429558114872, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 31.976458553838054, "core_hours": 31.976458553838054} {"step": 61100, "l2_params": 341.8409203763499, "train/loss": 4.972247123718262, "l2_grads": 2.078125, "lr": 0.0005031001453962377, "uptime": 115288.417660923, "examples_seen": 62566400.0, "progress": 0.5426143175581467, "epoch": 48.835475781065234, "img/sec/core": 540.737706467294, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 32.0027600712875, "core_hours": 32.0027600712875} {"step": 61150, "l2_params": 341.8642365764515, "train/loss": 4.521738052368164, "l2_grads": 1.84375, "lr": 0.000502334683872395, "uptime": 115381.683231983, "examples_seen": 62617600.0, "progress": 0.5430583554612222, "epoch": 48.87543934553419, "img/sec/core": 548.9699941585646, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 32.02866717435972, "core_hours": 32.02866717435972} {"step": 61200, "l2_params": 341.8642365764515, "train/loss": 2.3524290919303894, "l2_grads": 2.09375, "lr": 0.0005015692168765335, "uptime": 115476.254828661, "examples_seen": 62668800.0, "progress": 0.5435023933642976, "epoch": 48.915402910003145, "img/sec/core": 541.3887657446318, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 32.054937062325834, "core_hours": 32.054937062325834} {"step": 61251, "l2_params": 341.864285138306, "train/loss": 2.8218749165534973, "l2_grads": 1.984375, "lr": 0.0005008037462027497, "uptime": 115570.040272875, "examples_seen": 62720000.0, "progress": 0.543946431267373, "epoch": 48.9553664744721, "img/sec/core": 545.9269338551818, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 32.0809885746075, "core_hours": 32.0809885746075} {"step": 61300, "l2_params": 341.86427085540834, "train/loss": 2.7559831738471985, "l2_grads": 1.9296875, "lr": 0.0005000382736451501, "uptime": 115663.763413582, "examples_seen": 62771200.0, "progress": 0.5443904691704484, "epoch": 48.995330038941056, "img/sec/core": 546.2898448961205, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 32.10702278035944, "core_hours": 32.10702278035944} {"step": 61350, "l2_params": 341.86425942908977, "train/loss": 4.538031339645386, "l2_grads": 1.8515625, "lr": 0.0004992728009978449, "uptime": 115757.98422674701, "examples_seen": 62822400.0, "progress": 0.5448345070735238, "epoch": 49.03529360341002, "img/sec/core": 543.404352818863, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 32.133195228460835, "core_hours": 32.133195228460835} {"step": 61400, "l2_params": 341.8876740109608, "train/loss": 4.0424376130104065, "l2_grads": 1.9140625, "lr": 0.0004985073300549449, "uptime": 115851.534390204, "examples_seen": 62873600.0, "progress": 0.5452785449765992, "epoch": 49.07525716787897, "img/sec/core": 547.2999523248974, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 32.15918138497667, "core_hours": 32.15918138497667} {"step": 61450, "l2_params": 341.8876454471191, "train/loss": 3.3187222480773926, "l2_grads": 1.96875, "lr": 0.0004977418626105569, "uptime": 115945.974865333, "examples_seen": 62924800.0, "progress": 0.5457225828796746, "epoch": 49.11522073234793, "img/sec/core": 542.1404321617896, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 32.18541485029028, "core_hours": 32.18541485029028} {"step": 61500, "l2_params": 341.91104985891434, "train/loss": 2.98317813873291, "l2_grads": 1.7734375, "lr": 0.0004969764004587793, "uptime": 116040.269785076, "examples_seen": 62976000.0, "progress": 0.54616662078275, "epoch": 49.155184296816884, "img/sec/core": 542.9772901821833, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 32.21160788355222, "core_hours": 32.21160788355222} {"step": 61550, "l2_params": 341.91104414653677, "train/loss": 3.2856736183166504, "l2_grads": 1.7734375, "lr": 0.0004962109453936971, "uptime": 116134.06754907001, "examples_seen": 63027200.0, "progress": 0.5466106586858254, "epoch": 49.19514786128585, "img/sec/core": 545.8552295902402, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 32.237662817995, "core_hours": 32.237662817995} {"step": 61600, "l2_params": 341.91106413985784, "train/loss": 2.518454670906067, "l2_grads": 2.0, "lr": 0.0004954454992093808, "uptime": 116228.435395554, "examples_seen": 63078400.0, "progress": 0.5470546965889008, "epoch": 49.2351114257548, "img/sec/core": 542.55768153707, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 32.263876108685004, "core_hours": 32.263876108685004} {"step": 61650, "l2_params": 341.9228142980518, "train/loss": 2.7551023364067078, "l2_grads": 1.84375, "lr": 0.0004946800636998787, "uptime": 116322.752881416, "examples_seen": 63129600.0, "progress": 0.5474987344919763, "epoch": 49.27507499022376, "img/sec/core": 542.8473790629948, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 32.290075410313335, "core_hours": 32.290075410313335} {"step": 61700, "l2_params": 341.9227743127825, "train/loss": 2.239854574203491, "l2_grads": 2.046875, "lr": 0.0004939146406592148, "uptime": 116415.89470454301, "examples_seen": 63180800.0, "progress": 0.5479427723950516, "epoch": 49.31503855469271, "img/sec/core": 549.6993539645902, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 32.315948138959726, "core_hours": 32.315948138959726} {"step": 61750, "l2_params": 341.92279716150836, "train/loss": 2.3368053436279297, "l2_grads": 2.09375, "lr": 0.0004931492318813837, "uptime": 116509.180847084, "examples_seen": 63232000.0, "progress": 0.5483868102981271, "epoch": 49.35500211916167, "img/sec/core": 548.8489351727736, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 32.341860956332226, "core_hours": 32.341860956332226} {"step": 61800, "l2_params": 341.92270576659575, "train/loss": 4.036749601364136, "l2_grads": 1.8984375, "lr": 0.0004923838391603458, "uptime": 116602.48418109301, "examples_seen": 63283200.0, "progress": 0.5488308482012024, "epoch": 49.39496568363063, "img/sec/core": 548.7478078228049, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 32.3677785491125, "core_hours": 32.3677785491125} {"step": 61850, "l2_params": 341.92274289578194, "train/loss": 2.177886188030243, "l2_grads": 2.09375, "lr": 0.0004916184642900242, "uptime": 116696.230202964, "examples_seen": 63334400.0, "progress": 0.5492748861042779, "epoch": 49.434929248099586, "img/sec/core": 546.1565085978796, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 32.39381911074333, "core_hours": 32.39381911074333} {"step": 61900, "l2_params": 341.92278002496414, "train/loss": 2.356680691242218, "l2_grads": 2.046875, "lr": 0.000490853109064301, "uptime": 116790.20143643, "examples_seen": 63385600.0, "progress": 0.5497189240073532, "epoch": 49.47489281256854, "img/sec/core": 544.8475891137995, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 32.41992223115055, "core_hours": 32.41992223115055} {"step": 61950, "l2_params": 341.9228200102327, "train/loss": 4.425592660903931, "l2_grads": 1.984375, "lr": 0.0004900877752770113, "uptime": 116884.08582841301, "examples_seen": 63436800.0, "progress": 0.5501629619104287, "epoch": 49.514856377037496, "img/sec/core": 545.3515639667263, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 32.44600122892361, "core_hours": 32.44600122892361} {"step": 62001, "l2_params": 341.9228714198569, "train/loss": 2.288738787174225, "l2_grads": 2.109375, "lr": 0.0004893224647219407, "uptime": 116977.641400302, "examples_seen": 63488000.0, "progress": 0.550606999813504, "epoch": 49.55481994150645, "img/sec/core": 547.2683130059775, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 32.47198888778167, "core_hours": 32.47198888778167} {"step": 62050, "l2_params": 341.922848571136, "train/loss": 3.9380733966827393, "l2_grads": 1.84375, "lr": 0.0004885571791928197, "uptime": 117071.082005, "examples_seen": 63539200.0, "progress": 0.5510510377165795, "epoch": 49.594783505975414, "img/sec/core": 547.9416594689027, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 32.49794461130889, "core_hours": 32.49794461130889} {"step": 62100, "l2_params": 341.9287092180181, "train/loss": 2.7537102699279785, "l2_grads": 1.953125, "lr": 0.0004877919204833206, "uptime": 117165.094360773, "examples_seen": 63590400.0, "progress": 0.5514950756196549, "epoch": 49.63474707044437, "img/sec/core": 544.6092652292228, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 32.52405915457917, "core_hours": 32.52405915457917} {"step": 62151, "l2_params": 341.93452406857074, "train/loss": 2.88679438829422, "l2_grads": 2.015625, "lr": 0.0004870266903870524, "uptime": 117258.263834639, "examples_seen": 63641600.0, "progress": 0.5519391135227303, "epoch": 49.674710634913325, "img/sec/core": 549.5362147653365, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 32.549939563986385, "core_hours": 32.549939563986385} {"step": 62200, "l2_params": 341.9404130747783, "train/loss": 4.5673863887786865, "l2_grads": 1.9609375, "lr": 0.00048626149069755706, "uptime": 117353.06600514, "examples_seen": 63692800.0, "progress": 0.5523831514258057, "epoch": 49.71467419938228, "img/sec/core": 540.0720229233376, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 32.57627350023667, "core_hours": 32.57627350023667} {"step": 62250, "l2_params": 341.9404416342121, "train/loss": 2.4631490111351013, "l2_grads": 2.0, "lr": 0.00048549632320830574, "uptime": 117446.262043971, "examples_seen": 63744000.0, "progress": 0.5528271893288811, "epoch": 49.754637763851235, "img/sec/core": 549.3795728040245, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 32.60216128880083, "core_hours": 32.60216128880083} {"step": 62300, "l2_params": 341.94036737967923, "train/loss": 2.3922234773635864, "l2_grads": 2.125, "lr": 0.0004847311897126943, "uptime": 117539.557576504, "examples_seen": 63795200.0, "progress": 0.5532712272319565, "epoch": 49.7946013283202, "img/sec/core": 548.7936947237168, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 32.628076714504445, "core_hours": 32.628076714504445} {"step": 62350, "l2_params": 341.94619059966874, "train/loss": 3.6503689885139465, "l2_grads": 2.03125, "lr": 0.0004839660920040378, "uptime": 117632.84660759, "examples_seen": 63846400.0, "progress": 0.5537152651350319, "epoch": 49.83456489278915, "img/sec/core": 548.831940947005, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 32.65399033425056, "core_hours": 32.65399033425056} {"step": 62400, "l2_params": 341.9578681559323, "train/loss": 2.4383875727653503, "l2_grads": 2.1875, "lr": 0.00048320103187556826, "uptime": 117727.062226457, "examples_seen": 63897600.0, "progress": 0.5541593030381073, "epoch": 49.87452845725811, "img/sec/core": 543.4343118021853, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 32.680161339491384, "core_hours": 32.680161339491384} {"step": 62450, "l2_params": 341.95791099289545, "train/loss": 2.36009818315506, "l2_grads": 2.109375, "lr": 0.00048243601112042976, "uptime": 117820.417290868, "examples_seen": 63948800.0, "progress": 0.5546033409411827, "epoch": 49.914492021727064, "img/sec/core": 548.443732785461, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 32.70609330182778, "core_hours": 32.70609330182778} {"step": 62500, "l2_params": 341.98129060666463, "train/loss": 4.2069478034973145, "l2_grads": 1.8984375, "lr": 0.0004816710315316735, "uptime": 117914.21179346301, "examples_seen": 64000000.0, "progress": 0.5550473788442581, "epoch": 49.954455586196026, "img/sec/core": 545.87420993187, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 32.73214733032639, "core_hours": 32.73214733032639, "val/acc@1": 0.6509287308673469, "val/loss": 1.4403992632822114, "z/secs/eval/val": 31.71503464100533} {"step": 62551, "l2_params": 341.98131345148084, "train/loss": 2.668458044528961, "l2_grads": 2.046875, "lr": 0.00048090609490225497, "uptime": 118038.913947078, "examples_seen": 64051200.0, "progress": 0.5554914167473336, "epoch": 49.99441915066498, "img/sec/core": 410.5783141329956, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 32.76678681744167, "core_hours": 32.76678681744167} {"step": 62600, "l2_params": 341.9812763286537, "train/loss": 3.540153443813324, "l2_grads": 1.8125, "lr": 0.0004801412030250284, "uptime": 118132.128606984, "examples_seen": 64102400.0, "progress": 0.5559354546504089, "epoch": 50.03438271513394, "img/sec/core": 549.269825708054, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 32.79267977852667, "core_hours": 32.79267977852667} {"step": 62650, "l2_params": 341.98131630708275, "train/loss": 2.2580453753471375, "l2_grads": 2.265625, "lr": 0.00047937635769274267, "uptime": 118225.387908938, "examples_seen": 64153600.0, "progress": 0.5563794925534844, "epoch": 50.07434627960289, "img/sec/core": 549.0068971913423, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 32.81858514018056, "core_hours": 32.81858514018056} {"step": 62700, "l2_params": 341.98130488467496, "train/loss": 2.234683573246002, "l2_grads": 2.09375, "lr": 0.00047861156069803877, "uptime": 118320.108080269, "examples_seen": 64204800.0, "progress": 0.5568235304565597, "epoch": 50.11430984407185, "img/sec/core": 540.5395628042736, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 32.84489629888361, "core_hours": 32.84489629888361} {"step": 62750, "l2_params": 341.9812706174492, "train/loss": 3.994873285293579, "l2_grads": 1.8125, "lr": 0.0004778468138334433, "uptime": 118413.28563927801, "examples_seen": 64256000.0, "progress": 0.5572675683596352, "epoch": 50.15427340854081, "img/sec/core": 549.4885307635989, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 32.87077895416389, "core_hours": 32.87077895416389} {"step": 62800, "l2_params": 341.9812706174492, "train/loss": 2.553517699241638, "l2_grads": 1.921875, "lr": 0.0004770821188913667, "uptime": 118506.57184633, "examples_seen": 64307200.0, "progress": 0.5577116062627105, "epoch": 50.194236973009765, "img/sec/core": 548.84855562264, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 32.89669178945611, "core_hours": 32.89669178945611} {"step": 62850, "l2_params": 341.9812591950398, "train/loss": 2.6913090348243713, "l2_grads": 1.9375, "lr": 0.000476317477664096, "uptime": 118600.891099817, "examples_seen": 64358400.0, "progress": 0.558155644165786, "epoch": 50.23420053747872, "img/sec/core": 542.8372056300803, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 32.92289158209139, "core_hours": 32.92289158209139} {"step": 62900, "l2_params": 341.98123635021994, "train/loss": 2.1456997394561768, "l2_grads": 2.078125, "lr": 0.000475552891943793, "uptime": 118695.038623397, "examples_seen": 64409600.0, "progress": 0.5585996820688613, "epoch": 50.274164101947676, "img/sec/core": 543.8273685073872, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 32.94904367197473, "core_hours": 32.94904367197473} {"step": 62950, "l2_params": 341.9812192166041, "train/loss": 2.176910936832428, "l2_grads": 2.125, "lr": 0.00047478836352249024, "uptime": 118788.286331491, "examples_seen": 64460800.0, "progress": 0.5590437199719368, "epoch": 50.31412766641663, "img/sec/core": 549.0751574117677, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 32.974945813111944, "core_hours": 32.974945813111944} {"step": 63000, "l2_params": 341.98123635021994, "train/loss": 4.862104773521423, "l2_grads": 1.96875, "lr": 0.00047402389419208535, "uptime": 118883.175034951, "examples_seen": 64512000.0, "progress": 0.5594877578750123, "epoch": 50.354091230885594, "img/sec/core": 539.5795087619514, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 33.001303786295274, "core_hours": 33.001303786295274} {"step": 63050, "l2_params": 341.9812220722068, "train/loss": 2.2539929151535034, "l2_grads": 2.078125, "lr": 0.00047325948574433713, "uptime": 118976.677179064, "examples_seen": 64563200.0, "progress": 0.5599317957780876, "epoch": 50.39405479535455, "img/sec/core": 547.5810259294027, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 33.02727660410444, "core_hours": 33.02727660410444} {"step": 63100, "l2_params": 341.9812220722068, "train/loss": 2.2770944833755493, "l2_grads": 2.328125, "lr": 0.000472495139970862, "uptime": 119071.420390314, "examples_seen": 64614400.0, "progress": 0.5603758336811631, "epoch": 50.434018359823504, "img/sec/core": 540.4081128820977, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 33.053594162785, "core_hours": 33.053594162785} {"step": 63150, "l2_params": 341.98131916268466, "train/loss": 2.2062580585479736, "l2_grads": 2.09375, "lr": 0.0004717308586631294, "uptime": 119164.743129137, "examples_seen": 64665600.0, "progress": 0.5608198715842384, "epoch": 50.47398192429246, "img/sec/core": 548.6337054156521, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 33.07951714579139, "core_hours": 33.07951714579139} {"step": 63200, "l2_params": 342.03976833841995, "train/loss": 2.65756094455719, "l2_grads": 2.046875, "lr": 0.0004709666436124575, "uptime": 119259.226493858, "examples_seen": 64716800.0, "progress": 0.5612639094873139, "epoch": 50.513945488761415, "img/sec/core": 541.8943340045801, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 33.105762524880554, "core_hours": 33.105762524880554} {"step": 63250, "l2_params": 342.039785469103, "train/loss": 2.1504536867141724, "l2_grads": 2.03125, "lr": 0.0004702024966100105, "uptime": 119353.62133394, "examples_seen": 64768000.0, "progress": 0.5617079473903892, "epoch": 50.55390905323038, "img/sec/core": 542.4025291586538, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 33.13198331379222, "core_hours": 33.13198331379222} {"step": 63300, "l2_params": 342.0397340770513, "train/loss": 2.2042062878608704, "l2_grads": 2.046875, "lr": 0.00046943841944679113, "uptime": 119447.998898829, "examples_seen": 64819200.0, "progress": 0.5621519852934647, "epoch": 50.59387261769933, "img/sec/core": 542.5018123768867, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 33.158199304039165, "core_hours": 33.158199304039165} {"step": 63350, "l2_params": 342.0398654122791, "train/loss": 2.2636444568634033, "l2_grads": 2.078125, "lr": 0.00046867441391363924, "uptime": 119542.18297034, "examples_seen": 64870400.0, "progress": 0.56259602319654, "epoch": 50.63383618216829, "img/sec/core": 543.616337440027, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 33.18436154612555, "core_hours": 33.18436154612555} {"step": 63400, "l2_params": 342.0398340060336, "train/loss": 2.66814923286438, "l2_grads": 2.140625, "lr": 0.0004679104818012266, "uptime": 119635.50347272301, "examples_seen": 64921600.0, "progress": 0.5630400610996155, "epoch": 50.67379974663724, "img/sec/core": 548.6468535056046, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 33.210283907898614, "core_hours": 33.210283907898614} {"step": 63450, "l2_params": 342.0398768327313, "train/loss": 3.2059910893440247, "l2_grads": 1.9140625, "lr": 0.0004671466249000537, "uptime": 119730.129471444, "examples_seen": 64972800.0, "progress": 0.5634840990026909, "epoch": 50.713763311106206, "img/sec/core": 541.0775124388886, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 33.23656890754333, "core_hours": 33.23656890754333} {"step": 63500, "l2_params": 342.0398482816001, "train/loss": 3.3712443113327026, "l2_grads": 1.859375, "lr": 0.00046638284500044483, "uptime": 119824.652153346, "examples_seen": 65024000.0, "progress": 0.5639281369057663, "epoch": 50.75372687557516, "img/sec/core": 541.6689303534797, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 33.26282520807167, "core_hours": 33.26282520807167} {"step": 63550, "l2_params": 342.03985970205287, "train/loss": 3.4293468594551086, "l2_grads": 1.8671875, "lr": 0.0004656191438925422, "uptime": 119918.813058856, "examples_seen": 65075200.0, "progress": 0.5643721748088417, "epoch": 50.79369044004412, "img/sec/core": 543.750081020234, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 33.28898101515777, "core_hours": 33.28898101515777} {"step": 63600, "l2_params": 342.0398311509202, "train/loss": 3.8791893124580383, "l2_grads": 1.875, "lr": 0.0004648555233663048, "uptime": 120012.690065457, "examples_seen": 65126400.0, "progress": 0.5648162127119171, "epoch": 50.83365400451307, "img/sec/core": 545.3944672267866, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 33.31505796143583, "core_hours": 33.31505796143583} {"step": 63650, "l2_params": 342.0398425713735, "train/loss": 2.2084845304489136, "l2_grads": 2.0625, "lr": 0.0004640919852115021, "uptime": 120106.613629229, "examples_seen": 65177600.0, "progress": 0.5652602506149925, "epoch": 50.87361756898203, "img/sec/core": 545.1241194838989, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 33.34114784026139, "core_hours": 33.34114784026139} {"step": 63700, "l2_params": 342.0398140202395, "train/loss": 3.0967302918434143, "l2_grads": 2.0625, "lr": 0.0004633285312177111, "uptime": 120201.375560261, "examples_seen": 65228800.0, "progress": 0.5657042885180679, "epoch": 50.91358113345099, "img/sec/core": 540.3013577542024, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 33.36747059888139, "core_hours": 33.36747059888139} {"step": 63750, "l2_params": 342.03979688955786, "train/loss": 2.4817798733711243, "l2_grads": 2.078125, "lr": 0.0004625651631743107, "uptime": 120295.848074316, "examples_seen": 65280000.0, "progress": 0.5661483264211433, "epoch": 50.953544697919945, "img/sec/core": 541.9565734240166, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 33.39371296389667, "core_hours": 33.39371296389667} {"step": 63800, "l2_params": 342.039816875353, "train/loss": 2.433400273323059, "l2_grads": 2.140625, "lr": 0.00046180188287047943, "uptime": 120389.16434215, "examples_seen": 65331200.0, "progress": 0.5665923643242187, "epoch": 50.9935082623889, "img/sec/core": 548.6717502577233, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 33.419634149406114, "core_hours": 33.419634149406114} {"step": 63850, "l2_params": 342.0398739776183, "train/loss": 3.2587008476257324, "l2_grads": 1.8671875, "lr": 0.0004610386920951889, "uptime": 120483.887061759, "examples_seen": 65382400.0, "progress": 0.5670364022272941, "epoch": 51.033471826857856, "img/sec/core": 540.5250209384596, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 33.44594601596417, "core_hours": 33.44594601596417} {"step": 63900, "l2_params": 342.0398340060336, "train/loss": 3.7014458179473877, "l2_grads": 1.890625, "lr": 0.0004602755926372017, "uptime": 120577.211669546, "examples_seen": 65433600.0, "progress": 0.5674804401303696, "epoch": 51.07343539132681, "img/sec/core": 548.6227182101553, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 33.47186951812722, "core_hours": 33.47186951812722} {"step": 63950, "l2_params": 342.0398511367133, "train/loss": 2.301235616207123, "l2_grads": 2.28125, "lr": 0.0004595125862850661, "uptime": 120671.536665914, "examples_seen": 65484800.0, "progress": 0.5679244780334449, "epoch": 51.11339895579577, "img/sec/core": 542.8041555416397, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 33.49807090600722, "core_hours": 33.49807090600722} {"step": 64000, "l2_params": 342.0398511367133, "train/loss": 4.7908759117126465, "l2_grads": 2.09375, "lr": 0.00045874967482711205, "uptime": 120764.928784489, "examples_seen": 65536000.0, "progress": 0.5683685159365204, "epoch": 51.15336252026473, "img/sec/core": 548.2261327959787, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 33.52401316116695, "core_hours": 33.52401316116695} {"step": 64050, "l2_params": 342.0398482816001, "train/loss": 3.5628653168678284, "l2_grads": 1.921875, "lr": 0.0004579868600514482, "uptime": 120858.580191219, "examples_seen": 65587200.0, "progress": 0.5688125538395957, "epoch": 51.193326084733684, "img/sec/core": 546.7082854143399, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 33.55002744081417, "core_hours": 33.55002744081417} {"step": 64100, "l2_params": 342.0631937458706, "train/loss": 2.2209659814834595, "l2_grads": 2.28125, "lr": 0.0004572241437459551, "uptime": 120951.955101803, "examples_seen": 65638400.0, "progress": 0.5692565917426712, "epoch": 51.23328964920264, "img/sec/core": 548.3271649716082, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 33.57596491597639, "core_hours": 33.57596491597639} {"step": 64150, "l2_params": 342.06321087538043, "train/loss": 4.600641250610352, "l2_grads": 1.890625, "lr": 0.0004564615276982831, "uptime": 121045.798125475, "examples_seen": 65689600.0, "progress": 0.5697006296457465, "epoch": 51.273253213671595, "img/sec/core": 545.5919683380342, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 33.60203242255194, "core_hours": 33.60203242255194} {"step": 64201, "l2_params": 342.06320516554393, "train/loss": 3.3294451236724854, "l2_grads": 2.03125, "lr": 0.00045569901369584795, "uptime": 121139.01146674, "examples_seen": 65740800.0, "progress": 0.570144667548822, "epoch": 51.31321677814056, "img/sec/core": 549.2775959445698, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 33.62792501734778, "core_hours": 33.62792501734778} {"step": 64250, "l2_params": 342.06904627848894, "train/loss": 3.3232781887054443, "l2_grads": 1.828125, "lr": 0.00045493660352582537, "uptime": 121233.562676965, "examples_seen": 65792000.0, "progress": 0.5705887054518973, "epoch": 51.35318034260951, "img/sec/core": 541.5054961027517, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 33.654189242410276, "core_hours": 33.654189242410276} {"step": 64300, "l2_params": 342.0690634077057, "train/loss": 2.218291401863098, "l2_grads": 2.140625, "lr": 0.00045417429897514846, "uptime": 121327.265224457, "examples_seen": 65843200.0, "progress": 0.5710327433549728, "epoch": 51.39314390707847, "img/sec/core": 546.4099042170304, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 33.680217727824726, "core_hours": 33.680217727824726} {"step": 64350, "l2_params": 342.092466826405, "train/loss": 4.748225808143616, "l2_grads": 2.25, "lr": 0.0004534121018305025, "uptime": 121420.578600162, "examples_seen": 65894400.0, "progress": 0.5714767812580482, "epoch": 51.43310747154742, "img/sec/core": 548.6887556384861, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 33.706138109964996, "core_hours": 33.706138109964996} {"step": 64400, "l2_params": 342.0924554077085, "train/loss": 4.537981748580933, "l2_grads": 1.9609375, "lr": 0.0004526500138783212, "uptime": 121515.064837178, "examples_seen": 65945600.0, "progress": 0.5719208191611236, "epoch": 51.473071036016385, "img/sec/core": 541.877860913558, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 33.73238428691389, "core_hours": 33.73238428691389} {"step": 64450, "l2_params": 342.09248395444905, "train/loss": 4.603744626045227, "l2_grads": 1.90625, "lr": 0.0004518880369047819, "uptime": 121608.390047933, "examples_seen": 65996800.0, "progress": 0.572364857064199, "epoch": 51.51303460048534, "img/sec/core": 548.6191735950949, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 33.75830795656806, "core_hours": 33.75830795656806} {"step": 64500, "l2_params": 342.092466826405, "train/loss": 4.867883086204529, "l2_grads": 1.9609375, "lr": 0.00045112617269580274, "uptime": 121702.670583792, "examples_seen": 66048000.0, "progress": 0.5728088949672744, "epoch": 51.552998164954296, "img/sec/core": 543.0601293629978, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 33.78449699430667, "core_hours": 33.78449699430667} {"step": 64550, "l2_params": 342.09246111705676, "train/loss": 2.9035568833351135, "l2_grads": 1.953125, "lr": 0.00045036442303703604, "uptime": 121796.250128313, "examples_seen": 66099200.0, "progress": 0.5732529328703498, "epoch": 51.59296172942325, "img/sec/core": 547.1281171764304, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 33.81049131222917, "core_hours": 33.81049131222917} {"step": 64600, "l2_params": 342.11582297246207, "train/loss": 4.411445498466492, "l2_grads": 1.953125, "lr": 0.00044960278971386717, "uptime": 121890.392605738, "examples_seen": 66150400.0, "progress": 0.5736969707734252, "epoch": 51.63292529389221, "img/sec/core": 543.8565183371853, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 33.836642000402776, "core_hours": 33.836642000402776} {"step": 64650, "l2_params": 342.1158686441262, "train/loss": 2.2640982270240784, "l2_grads": 2.296875, "lr": 0.00044884127451140775, "uptime": 121984.987003869, "examples_seen": 66201600.0, "progress": 0.5741410086765006, "epoch": 51.67288885836117, "img/sec/core": 541.2582669969162, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 33.86291822210583, "core_hours": 33.86291822210583} {"step": 64700, "l2_params": 342.1158400993368, "train/loss": 4.238696336746216, "l2_grads": 1.9375, "lr": 0.0004480798792144932, "uptime": 122078.167205752, "examples_seen": 66252800.0, "progress": 0.574585046579576, "epoch": 51.712852422830125, "img/sec/core": 549.4729455972326, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 33.88880161151778, "core_hours": 33.88880161151778} {"step": 64750, "l2_params": 342.11588006204124, "train/loss": 2.2665818333625793, "l2_grads": 2.203125, "lr": 0.00044731860560767825, "uptime": 122172.41564266001, "examples_seen": 66304000.0, "progress": 0.5750290844826514, "epoch": 51.75281598729908, "img/sec/core": 543.2450837351917, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 33.91498173288111, "core_hours": 33.91498173288111} {"step": 64800, "l2_params": 342.1158686441262, "train/loss": 3.6218472719192505, "l2_grads": 1.875, "lr": 0.0004465574554752308, "uptime": 122266.15321125, "examples_seen": 66355200.0, "progress": 0.5754731223857269, "epoch": 51.792779551768035, "img/sec/core": 546.205761149513, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 33.94101994637833, "core_hours": 33.94101994637833} {"step": 64850, "l2_params": 342.1159028978703, "train/loss": 2.197308301925659, "l2_grads": 2.171875, "lr": 0.000445796430601131, "uptime": 122359.94196582, "examples_seen": 66406400.0, "progress": 0.5759171602888022, "epoch": 51.83274311623699, "img/sec/core": 545.9076648872943, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 33.96707237820333, "core_hours": 33.96707237820333} {"step": 64900, "l2_params": 342.1159028978703, "train/loss": 3.589724123477936, "l2_grads": 1.9453125, "lr": 0.0004450355327690654, "uptime": 122453.13763410601, "examples_seen": 66457600.0, "progress": 0.5763611981918777, "epoch": 51.87270668070595, "img/sec/core": 549.3817571314025, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 33.99296006383834, "core_hours": 33.99296006383834} {"step": 64950, "l2_params": 342.11589718891315, "train/loss": 4.452842116355896, "l2_grads": 1.921875, "lr": 0.00044427476376242145, "uptime": 122547.368218018, "examples_seen": 66508800.0, "progress": 0.576805236094953, "epoch": 51.91267024517491, "img/sec/core": 543.3480073499028, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 34.01913522603611, "core_hours": 34.01913522603611} {"step": 65000, "l2_params": 342.11589718891315, "train/loss": 2.916839599609375, "l2_grads": 1.9296875, "lr": 0.0004435141253642857, "uptime": 122640.71204348201, "examples_seen": 66560000.0, "progress": 0.5772492739980285, "epoch": 51.952633809643864, "img/sec/core": 548.5097674697627, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 34.045064066442784, "core_hours": 34.045064066442784, "val/acc@1": 0.6534797512755102, "val/loss": 1.4301267558214616, "z/secs/eval/val": 31.825043151999125} {"step": 65050, "l2_params": 342.11581726350363, "train/loss": 2.3096887469291687, "l2_grads": 2.21875, "lr": 0.0004427536193574383, "uptime": 122765.65222960501, "examples_seen": 66611200.0, "progress": 0.5776933119011038, "epoch": 51.99259737411282, "img/sec/core": 409.7960919443095, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 34.07976967369917, "core_hours": 34.07976967369917} {"step": 65100, "l2_params": 342.1158629351685, "train/loss": 2.38356351852417, "l2_grads": 2.0625, "lr": 0.0004419932475243492, "uptime": 122858.817701401, "examples_seen": 66662400.0, "progress": 0.5781373498041793, "epoch": 52.032560938581774, "img/sec/core": 549.559820961522, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 34.10564897142028, "core_hours": 34.10564897142028} {"step": 65150, "l2_params": 342.1158572262107, "train/loss": 4.3084716796875, "l2_grads": 1.8828125, "lr": 0.00044123301164717397, "uptime": 122953.029764423, "examples_seen": 66713600.0, "progress": 0.5785813877072546, "epoch": 52.07252450305074, "img/sec/core": 543.4548226381919, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 34.13181898892639, "core_hours": 34.13181898892639} {"step": 65200, "l2_params": 342.1158115545451, "train/loss": 2.174705535173416, "l2_grads": 2.109375, "lr": 0.0004404729135077492, "uptime": 123046.32971797501, "examples_seen": 66764800.0, "progress": 0.5790254256103301, "epoch": 52.11248806751969, "img/sec/core": 548.7676901303112, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 34.15773564269083, "core_hours": 34.15773564269083} {"step": 65250, "l2_params": 342.11584580829486, "train/loss": 4.507139682769775, "l2_grads": 1.8046875, "lr": 0.00043971295488758825, "uptime": 123141.28200109, "examples_seen": 66816000.0, "progress": 0.5794694635134056, "epoch": 52.15245163198865, "img/sec/core": 539.2182085605301, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 34.184111276889446, "core_hours": 34.184111276889446} {"step": 65300, "l2_params": 342.11576588287335, "train/loss": 2.1840202808380127, "l2_grads": 2.171875, "lr": 0.0004389531375678787, "uptime": 123234.43712502401, "examples_seen": 66867200.0, "progress": 0.5799135014164809, "epoch": 52.1924151964576, "img/sec/core": 549.6208671921542, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 34.209987700204444, "core_hours": 34.209987700204444} {"step": 65350, "l2_params": 342.12740054419055, "train/loss": 3.8983025550842285, "l2_grads": 1.921875, "lr": 0.00043819346332947594, "uptime": 123328.976174539, "examples_seen": 66918400.0, "progress": 0.5803575393195564, "epoch": 52.23237876092656, "img/sec/core": 541.5751508257025, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 34.23624854729194, "core_hours": 34.23624854729194} {"step": 65401, "l2_params": 342.1274890300398, "train/loss": 2.1316543221473694, "l2_grads": 2.140625, "lr": 0.0004374339339529008, "uptime": 123422.198266256, "examples_seen": 66969600.0, "progress": 0.5808015772226317, "epoch": 52.27234232539552, "img/sec/core": 549.2260370581266, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 34.26214357276889, "core_hours": 34.26214357276889} {"step": 65450, "l2_params": 342.1274091073383, "train/loss": 4.3442299365997314, "l2_grads": 1.8671875, "lr": 0.0004366745512183338, "uptime": 123516.22031407601, "examples_seen": 67020800.0, "progress": 0.5812456151257072, "epoch": 52.312305889864476, "img/sec/core": 544.553125433049, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 34.288260808274444, "core_hours": 34.288260808274444} {"step": 65500, "l2_params": 342.1274519230735, "train/loss": 2.792426288127899, "l2_grads": 2.140625, "lr": 0.0004359153169056123, "uptime": 123609.986407218, "examples_seen": 67072000.0, "progress": 0.5816896530287825, "epoch": 52.35226945433343, "img/sec/core": 546.0396000765926, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 34.31430694525833, "core_hours": 34.31430694525833} {"step": 65550, "l2_params": 342.12745763183784, "train/loss": 4.102423071861267, "l2_grads": 1.9609375, "lr": 0.00043515623279422527, "uptime": 123703.195027717, "examples_seen": 67123200.0, "progress": 0.582133690931858, "epoch": 52.392233018802386, "img/sec/core": 549.305415377913, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 34.34019822873028, "core_hours": 34.34019822873028} {"step": 65600, "l2_params": 342.1274804668941, "train/loss": 2.1664584279060364, "l2_grads": 2.28125, "lr": 0.00043439730066331027, "uptime": 123798.380962268, "examples_seen": 67174400.0, "progress": 0.5825777288349333, "epoch": 52.43219658327135, "img/sec/core": 537.8945979940587, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 34.36663876610555, "core_hours": 34.36663876610555} {"step": 65650, "l2_params": 342.12748332127603, "train/loss": 2.310885429382324, "l2_grads": 2.09375, "lr": 0.0004336385222916484, "uptime": 123891.48495270501, "examples_seen": 67225600.0, "progress": 0.5830217667380088, "epoch": 52.472160147740304, "img/sec/core": 549.9227236091307, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 34.39250098567139, "core_hours": 34.39250098567139} {"step": 65700, "l2_params": 342.12746048621995, "train/loss": 3.3225268721580505, "l2_grads": 1.859375, "lr": 0.00043287989945765994, "uptime": 123985.813117672, "examples_seen": 67276800.0, "progress": 0.5834658046410842, "epoch": 52.51212371220926, "img/sec/core": 542.7859220829167, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 34.41870325371778, "core_hours": 34.41870325371778} {"step": 65750, "l2_params": 342.12746048621995, "train/loss": 2.2786723375320435, "l2_grads": 2.1875, "lr": 0.00043212143393940106, "uptime": 124079.618231663, "examples_seen": 67328000.0, "progress": 0.5839098425441596, "epoch": 52.552087276678215, "img/sec/core": 545.812459701452, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 34.44476022982639, "core_hours": 34.44476022982639} {"step": 65800, "l2_params": 342.12751186509394, "train/loss": 2.2091394662857056, "l2_grads": 2.109375, "lr": 0.00043136312751455906, "uptime": 124173.20630779701, "examples_seen": 67379200.0, "progress": 0.584353880447235, "epoch": 52.59205084114717, "img/sec/core": 547.0782402523887, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 34.470756917641395, "core_hours": 34.470756917641395} {"step": 65850, "l2_params": 342.12752899138354, "train/loss": 4.698309540748596, "l2_grads": 2.0625, "lr": 0.00043060498196044895, "uptime": 124266.820654204, "examples_seen": 67430400.0, "progress": 0.5847979183503104, "epoch": 52.63201440561613, "img/sec/core": 546.9247178996162, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 34.496760902754446, "core_hours": 34.496760902754446} {"step": 65900, "l2_params": 342.12738627227725, "train/loss": 4.69272243976593, "l2_grads": 2.1875, "lr": 0.0004298469990540078, "uptime": 124360.35608928201, "examples_seen": 67481600.0, "progress": 0.5852419562533858, "epoch": 52.67197797008509, "img/sec/core": 547.386131868612, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 34.52274296805389, "core_hours": 34.52274296805389} {"step": 65950, "l2_params": 342.12746048621995, "train/loss": 2.2780995965003967, "l2_grads": 2.203125, "lr": 0.000429089180571792, "uptime": 124453.842590346, "examples_seen": 67532800.0, "progress": 0.5856859941564612, "epoch": 52.71194153455404, "img/sec/core": 547.67265238597, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 34.548711440571665, "core_hours": 34.548711440571665} {"step": 66000, "l2_params": 342.12748332127603, "train/loss": 4.089780807495117, "l2_grads": 1.7890625, "lr": 0.00042833152828997264, "uptime": 124547.31680050101, "examples_seen": 67584000.0, "progress": 0.5861300320595366, "epoch": 52.751905099023, "img/sec/core": 547.7446657756783, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 34.57467649894806, "core_hours": 34.57467649894806} {"step": 66050, "l2_params": 342.1274661949841, "train/loss": 2.2193177342414856, "l2_grads": 2.125, "lr": 0.00042757404398433073, "uptime": 124641.72524830101, "examples_seen": 67635200.0, "progress": 0.586574069962612, "epoch": 52.791868663491954, "img/sec/core": 542.3243490716492, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 34.600901067781386, "core_hours": 34.600901067781386} {"step": 66100, "l2_params": 342.12747761251217, "train/loss": 2.6214576959609985, "l2_grads": 2.1875, "lr": 0.0004268167294302539, "uptime": 124735.049059214, "examples_seen": 67686400.0, "progress": 0.5870181078656874, "epoch": 52.831832227960916, "img/sec/core": 548.6274027936632, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 34.62682434859055, "core_hours": 34.62682434859055} {"step": 66150, "l2_params": 342.1391661069732, "train/loss": 2.4303587675094604, "l2_grads": 1.953125, "lr": 0.0004260595864027321, "uptime": 124829.31782594901, "examples_seen": 67737600.0, "progress": 0.5874621457687628, "epoch": 52.87179579242987, "img/sec/core": 543.1279285102236, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 34.653010117128055, "core_hours": 34.653010117128055} {"step": 66200, "l2_params": 342.13917181554206, "train/loss": 2.80750435590744, "l2_grads": 1.96875, "lr": 0.00042530261667635274, "uptime": 124923.585629848, "examples_seen": 67788800.0, "progress": 0.5879061836718382, "epoch": 52.91175935689883, "img/sec/core": 543.1334759305265, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 34.67919561821111, "core_hours": 34.67919561821111} {"step": 66250, "l2_params": 342.1391661069732, "train/loss": 4.089340329170227, "l2_grads": 1.8828125, "lr": 0.00042454582202529773, "uptime": 125016.77900398901, "examples_seen": 67840000.0, "progress": 0.5883502215749137, "epoch": 52.95172292136778, "img/sec/core": 549.395281283985, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 34.705082666583614, "core_hours": 34.705082666583614} {"step": 66300, "l2_params": 342.139188941248, "train/loss": 2.568770408630371, "l2_grads": 1.953125, "lr": 0.00042378920422333816, "uptime": 125111.289263599, "examples_seen": 67891200.0, "progress": 0.588794259477989, "epoch": 52.99168648583674, "img/sec/core": 541.740126535302, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 34.731335516475276, "core_hours": 34.731335516475276} {"step": 66351, "l2_params": 342.15087988981554, "train/loss": 2.2522002458572388, "l2_grads": 2.1875, "lr": 0.0004230327650438306, "uptime": 125204.462184673, "examples_seen": 67942400.0, "progress": 0.5892382973810645, "epoch": 53.0316500503057, "img/sec/core": 549.5158830464817, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 34.75721688344028, "core_hours": 34.75721688344028} {"step": 66400, "l2_params": 342.1508627646948, "train/loss": 3.449886441230774, "l2_grads": 1.9296875, "lr": 0.0004222765062597134, "uptime": 125297.719031247, "examples_seen": 67993600.0, "progress": 0.5896823352841398, "epoch": 53.071613614774655, "img/sec/core": 549.0213521145618, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 34.78312156304416, "core_hours": 34.78312156304416} {"step": 66450, "l2_params": 342.1508513479471, "train/loss": 2.0972741842269897, "l2_grads": 2.21875, "lr": 0.00042152042964350197, "uptime": 125392.107801246, "examples_seen": 68044800.0, "progress": 0.5901263731872153, "epoch": 53.11157717924361, "img/sec/core": 542.437410727377, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 34.809340665821665, "core_hours": 34.809340665821665} {"step": 66500, "l2_params": 342.1508913065623, "train/loss": 2.191623866558075, "l2_grads": 2.1875, "lr": 0.00042076453696728407, "uptime": 125485.3132965, "examples_seen": 68096000.0, "progress": 0.5905704110902906, "epoch": 53.151540743712566, "img/sec/core": 549.3238339700533, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 34.83523108117, "core_hours": 34.83523108117} {"step": 66550, "l2_params": 342.15092555680013, "train/loss": 2.1895188093185425, "l2_grads": 2.140625, "lr": 0.0004200088300027172, "uptime": 125579.77365415101, "examples_seen": 68147200.0, "progress": 0.5910144489933661, "epoch": 53.19150430818153, "img/sec/core": 542.0263195398895, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 34.861470069406394, "core_hours": 34.861470069406394} {"step": 66600, "l2_params": 342.15090843168167, "train/loss": 3.4763075709342957, "l2_grads": 2.015625, "lr": 0.00041925331052102287, "uptime": 125673.281178766, "examples_seen": 68198400.0, "progress": 0.5914584868964414, "epoch": 53.231467872650484, "img/sec/core": 547.5495176544355, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 34.88744438179945, "core_hours": 34.88744438179945} {"step": 66650, "l2_params": 342.1626075420866, "train/loss": 2.266411542892456, "l2_grads": 2.078125, "lr": 0.0004184979802929841, "uptime": 125766.613438267, "examples_seen": 68249600.0, "progress": 0.5919025247995169, "epoch": 53.27143143711944, "img/sec/core": 548.5777401483963, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 34.91337000943861, "core_hours": 34.91337000943861} {"step": 66701, "l2_params": 342.16256758483973, "train/loss": 2.9924283623695374, "l2_grads": 1.8984375, "lr": 0.00041774284108893984, "uptime": 125860.909303744, "examples_seen": 68300800.0, "progress": 0.5923465627025923, "epoch": 53.311395001588394, "img/sec/core": 542.9718444281725, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 34.93956330540445, "core_hours": 34.93956330540445} {"step": 66750, "l2_params": 342.1509027233086, "train/loss": 4.790957093238831, "l2_grads": 2.015625, "lr": 0.000416987894678781, "uptime": 125954.206227645, "examples_seen": 68352000.0, "progress": 0.5927906006056677, "epoch": 53.35135856605735, "img/sec/core": 548.7855103811441, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 34.965479117599166, "core_hours": 34.965479117599166} {"step": 66800, "l2_params": 342.1626018339088, "train/loss": 3.050676643848419, "l2_grads": 1.90625, "lr": 0.0004162331428319469, "uptime": 126048.234359678, "examples_seen": 68403200.0, "progress": 0.5932346385087431, "epoch": 53.39132213052631, "img/sec/core": 544.5178894124274, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 34.99159804316389, "core_hours": 34.99159804316389} {"step": 66850, "l2_params": 342.1625847093747, "train/loss": 4.585168480873108, "l2_grads": 2.03125, "lr": 0.0004154785873174209, "uptime": 126141.46791334401, "examples_seen": 68454400.0, "progress": 0.5936786764118185, "epoch": 53.43128569499527, "img/sec/core": 549.1585162935364, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 35.017496252515556, "core_hours": 35.017496252515556} {"step": 66901, "l2_params": 342.16245342125137, "train/loss": 2.1865638494491577, "l2_grads": 2.125, "lr": 0.00041472422990372604, "uptime": 126235.569642121, "examples_seen": 68505600.0, "progress": 0.5941227143148939, "epoch": 53.47124925946422, "img/sec/core": 544.0920232330263, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 35.043635621620275, "core_hours": 35.043635621620275} {"step": 66950, "l2_params": 342.16245342125137, "train/loss": 2.1920087337493896, "l2_grads": 2.15625, "lr": 0.00041397007235892126, "uptime": 126328.796429209, "examples_seen": 68556800.0, "progress": 0.5945667522179693, "epoch": 53.51121282393318, "img/sec/core": 549.1983752659982, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 35.06953195136694, "core_hours": 35.06953195136694} {"step": 67000, "l2_params": 342.16244771307095, "train/loss": 3.504334330558777, "l2_grads": 1.890625, "lr": 0.0004132161164505971, "uptime": 126423.228133088, "examples_seen": 68608000.0, "progress": 0.5950107901210447, "epoch": 53.55117638840213, "img/sec/core": 542.1907886529651, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 35.095762980222226, "core_hours": 35.095762980222226} {"step": 67050, "l2_params": 342.1624420048904, "train/loss": 3.4758511185646057, "l2_grads": 1.9765625, "lr": 0.00041246236394587105, "uptime": 126516.862762779, "examples_seen": 68659200.0, "progress": 0.5954548280241201, "epoch": 53.591139952871096, "img/sec/core": 546.8062421880484, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 35.12177259958083, "core_hours": 35.12177259958083} {"step": 67100, "l2_params": 342.18578766694856, "train/loss": 2.261996805667877, "l2_grads": 2.21875, "lr": 0.00041170881661138436, "uptime": 126611.153652026, "examples_seen": 68710400.0, "progress": 0.5958988659271955, "epoch": 53.63110351734005, "img/sec/core": 543.0004999303658, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 35.147964513260554, "core_hours": 35.147964513260554} {"step": 67150, "l2_params": 342.18581620590294, "train/loss": 2.15329247713089, "l2_grads": 2.1875, "lr": 0.0004109554762132973, "uptime": 126705.331333893, "examples_seen": 68761600.0, "progress": 0.596342903830271, "epoch": 53.67106708180901, "img/sec/core": 543.6532200092122, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 35.17412498044583, "core_hours": 35.17412498044583} {"step": 67200, "l2_params": 342.1858333292745, "train/loss": 2.2856668829917908, "l2_grads": 2.109375, "lr": 0.0004102023445172849, "uptime": 126798.55502137801, "examples_seen": 68812800.0, "progress": 0.5967869417333463, "epoch": 53.71103064627796, "img/sec/core": 549.2166356135074, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 35.20002044919167, "core_hours": 35.20002044919167} {"step": 67250, "l2_params": 342.18584189095986, "train/loss": 3.043447196483612, "l2_grads": 2.015625, "lr": 0.0004094494232885333, "uptime": 126892.821882917, "examples_seen": 68864000.0, "progress": 0.5972309796364218, "epoch": 53.75099421074692, "img/sec/core": 543.138905487225, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 35.22620568850805, "core_hours": 35.22620568850805} {"step": 67300, "l2_params": 342.1858247675888, "train/loss": 2.2397298216819763, "l2_grads": 2.15625, "lr": 0.00040869671429173487, "uptime": 126986.91553053801, "examples_seen": 68915200.0, "progress": 0.5976750175394971, "epoch": 53.79095777521588, "img/sec/core": 544.1387521314747, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 35.252342812847225, "core_hours": 35.252342812847225} {"step": 67350, "l2_params": 342.18584189095986, "train/loss": 3.812985897064209, "l2_grads": 1.84375, "lr": 0.0004079442192910856, "uptime": 127080.194377028, "examples_seen": 68966400.0, "progress": 0.5981190554425726, "epoch": 53.830921339684835, "img/sec/core": 548.8918648398238, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 35.27825360353889, "core_hours": 35.27825360353889} {"step": 67400, "l2_params": 342.18583047537925, "train/loss": 2.285180628299713, "l2_grads": 2.140625, "lr": 0.00040719194005027856, "uptime": 127174.91330227401, "examples_seen": 69017600.0, "progress": 0.598563093345648, "epoch": 53.87088490415379, "img/sec/core": 540.5466739304838, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 35.304564416107226, "core_hours": 35.304564416107226} {"step": 67450, "l2_params": 342.185844744855, "train/loss": 2.306501805782318, "l2_grads": 2.203125, "lr": 0.00040643987833250176, "uptime": 127268.232656356, "examples_seen": 69068800.0, "progress": 0.5990071312487234, "epoch": 53.910848468622746, "img/sec/core": 548.6536046425564, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 35.33048645890778, "core_hours": 35.33048645890778} {"step": 67500, "l2_params": 342.18582191369353, "train/loss": 2.1944337487220764, "l2_grads": 2.15625, "lr": 0.00040568803590043374, "uptime": 127362.78476637299, "examples_seen": 69120000.0, "progress": 0.5994511691517987, "epoch": 53.95081203309171, "img/sec/core": 541.5003429410717, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 35.3567509339125, "core_hours": 35.3567509339125, "val/acc@1": 0.656867825255102, "val/loss": 1.4320069326429952, "z/secs/eval/val": 31.72886970199761} {"step": 67550, "l2_params": 342.18582762148407, "train/loss": 2.237284302711487, "l2_grads": 2.203125, "lr": 0.00040493641451623877, "uptime": 127487.487382108, "examples_seen": 69171200.0, "progress": 0.5998952070548742, "epoch": 53.99077559756066, "img/sec/core": 410.5767926215833, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 35.391390549394444, "core_hours": 35.391390549394444} {"step": 67600, "l2_params": 342.18582191369353, "train/loss": 2.2165114283561707, "l2_grads": 2.171875, "lr": 0.00040418501594156246, "uptime": 127580.70493446101, "examples_seen": 69222400.0, "progress": 0.6003392449579497, "epoch": 54.03073916202962, "img/sec/core": 549.2527824170339, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 35.41728431393695, "core_hours": 35.41728431393695} {"step": 67650, "l2_params": 342.1858247675888, "train/loss": 2.1819682121276855, "l2_grads": 2.125, "lr": 0.0004034338419375295, "uptime": 127673.987928733, "examples_seen": 69273600.0, "progress": 0.600783282861025, "epoch": 54.070702726498574, "img/sec/core": 548.8674586357835, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 35.44319625679028, "core_hours": 35.44319625679028} {"step": 67700, "l2_params": 342.1858247675888, "train/loss": 2.320738673210144, "l2_grads": 2.125, "lr": 0.0004026828942647367, "uptime": 127767.247563426, "examples_seen": 69324800.0, "progress": 0.6012273207641005, "epoch": 54.11066629096753, "img/sec/core": 549.0049384017029, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 35.46910171087167, "core_hours": 35.46910171087167} {"step": 67750, "l2_params": 342.18581335200764, "train/loss": 2.196956515312195, "l2_grads": 2.109375, "lr": 0.00040193217468325194, "uptime": 127860.553993832, "examples_seen": 69376000.0, "progress": 0.6016713586671758, "epoch": 54.15062985543649, "img/sec/core": 548.729597490959, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 35.49502016376222, "core_hours": 35.49502016376222} {"step": 67800, "l2_params": 342.1858361831696, "train/loss": 2.5947152972221375, "l2_grads": 2.171875, "lr": 0.000401181684952607, "uptime": 127953.879944007, "examples_seen": 69427200.0, "progress": 0.6021153965702513, "epoch": 54.19059341990545, "img/sec/core": 548.6148268942611, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 35.52094403881083, "core_hours": 35.52094403881083} {"step": 67850, "l2_params": 342.18587328380465, "train/loss": 2.2763167023658752, "l2_grads": 2.09375, "lr": 0.000400431426831796, "uptime": 128047.18909275299, "examples_seen": 69478400.0, "progress": 0.6025594344733266, "epoch": 54.2305569843744, "img/sec/core": 548.7136115599868, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 35.54686324679583, "core_hours": 35.54686324679583} {"step": 67900, "l2_params": 342.18588469938385, "train/loss": 2.3084400296211243, "l2_grads": 2.109375, "lr": 0.00039968140207927014, "uptime": 128141.63087145201, "examples_seen": 69529600.0, "progress": 0.6030034723764021, "epoch": 54.27052054884336, "img/sec/core": 542.132949053928, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 35.57309707421223, "core_hours": 35.57309707421223} {"step": 67950, "l2_params": 342.1859703162156, "train/loss": 2.308559477329254, "l2_grads": 2.09375, "lr": 0.0003989316124529332, "uptime": 128235.293701208, "examples_seen": 69580800.0, "progress": 0.6034475102794774, "epoch": 54.31048411331231, "img/sec/core": 546.6416094131627, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 35.59911452692222, "core_hours": 35.59911452692222} {"step": 68000, "l2_params": 342.18601597851716, "train/loss": 4.44524872303009, "l2_grads": 1.8984375, "lr": 0.0003981820597101377, "uptime": 128328.548423542, "examples_seen": 69632000.0, "progress": 0.6038915481825529, "epoch": 54.350447677781276, "img/sec/core": 549.033858217049, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 35.62501861645944, "core_hours": 35.62501861645944} {"step": 68050, "l2_params": 342.1860273940916, "train/loss": 2.2831488847732544, "l2_grads": 2.15625, "lr": 0.0003974327456076817, "uptime": 128422.035351781, "examples_seen": 69683200.0, "progress": 0.6043355860856283, "epoch": 54.39041124225023, "img/sec/core": 547.6701498749358, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 35.650987207636945, "core_hours": 35.650987207636945} {"step": 68100, "l2_params": 342.18595890063926, "train/loss": 4.643216848373413, "l2_grads": 2.046875, "lr": 0.0003966836719018034, "uptime": 128515.24286723402, "examples_seen": 69734400.0, "progress": 0.6047796239887037, "epoch": 54.430374806719186, "img/sec/core": 549.311927811315, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 35.67687818415167, "core_hours": 35.67687818415167} {"step": 68150, "l2_params": 342.1859646084275, "train/loss": 3.650056004524231, "l2_grads": 1.9453125, "lr": 0.0003959348403481776, "uptime": 128608.46893497501, "examples_seen": 69785600.0, "progress": 0.6052236618917791, "epoch": 54.47033837118814, "img/sec/core": 549.2026129670808, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 35.702774314079726, "core_hours": 35.702774314079726} {"step": 68200, "l2_params": 342.18598173179157, "train/loss": 4.596729636192322, "l2_grads": 2.140625, "lr": 0.000395186252701912, "uptime": 128701.68438806501, "examples_seen": 69836800.0, "progress": 0.6056676997948545, "epoch": 54.5103019356571, "img/sec/core": 549.2651518902748, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 35.72866749549361, "core_hours": 35.72866749549361} {"step": 68250, "l2_params": 342.18597602400365, "train/loss": 3.0132683515548706, "l2_grads": 2.046875, "lr": 0.00039443791071754226, "uptime": 128794.87311881999, "examples_seen": 69888000.0, "progress": 0.6061117376979299, "epoch": 54.55026550012606, "img/sec/core": 549.4226564220653, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 35.75455325403666, "core_hours": 35.75455325403666} {"step": 68300, "l2_params": 342.1859703162156, "train/loss": 4.398979663848877, "l2_grads": 1.9453125, "lr": 0.0003936898161490278, "uptime": 128888.26237997902, "examples_seen": 69939200.0, "progress": 0.6065557756010053, "epoch": 54.590229064595015, "img/sec/core": 548.2429067814816, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 35.78049471546972, "core_hours": 35.78049471546972} {"step": 68350, "l2_params": 342.1859703162156, "train/loss": 2.193723440170288, "l2_grads": 2.15625, "lr": 0.00039294197074974904, "uptime": 128981.448608556, "examples_seen": 69990400.0, "progress": 0.6069998135040807, "epoch": 54.63019262906397, "img/sec/core": 549.4374091736007, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 35.80637977896333, "core_hours": 35.80637977896333} {"step": 68400, "l2_params": 342.18595890063926, "train/loss": 2.21409147977829, "l2_grads": 2.15625, "lr": 0.000392194376272502, "uptime": 129074.55007940001, "examples_seen": 70041600.0, "progress": 0.6074438514071561, "epoch": 54.670156193532925, "img/sec/core": 549.9376060963353, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 35.832241298642224, "core_hours": 35.832241298642224} {"step": 68450, "l2_params": 342.18596746232157, "train/loss": 2.3196184635162354, "l2_grads": 2.171875, "lr": 0.00039144703446949465, "uptime": 129167.77859792102, "examples_seen": 70092800.0, "progress": 0.6078878893102315, "epoch": 54.71011975800189, "img/sec/core": 549.1881755952594, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 35.8581381093425, "core_hours": 35.8581381093425} {"step": 68500, "l2_params": 342.18595890063926, "train/loss": 3.6412554383277893, "l2_grads": 1.9453125, "lr": 0.0003906999470923425, "uptime": 129261.013100543, "examples_seen": 70144000.0, "progress": 0.608331927213307, "epoch": 54.75008332247084, "img/sec/core": 549.1529268685894, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 35.88403658229306, "core_hours": 35.88403658229306} {"step": 68550, "l2_params": 342.18597602400365, "train/loss": 3.3118863701820374, "l2_grads": 1.9609375, "lr": 0.000389953115892065, "uptime": 129354.21048455001, "examples_seen": 70195200.0, "progress": 0.6087759651163823, "epoch": 54.7900468869398, "img/sec/core": 549.3716432657291, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 35.90992474451722, "core_hours": 35.90992474451722} {"step": 68600, "l2_params": 342.18597602400365, "train/loss": 2.718969762325287, "l2_grads": 2.0625, "lr": 0.0003892065426190808, "uptime": 129447.409422295, "examples_seen": 70246400.0, "progress": 0.6092200030194578, "epoch": 54.830010451408754, "img/sec/core": 549.3624845821628, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 35.93581333833527, "core_hours": 35.93581333833527} {"step": 68650, "l2_params": 342.18603310187865, "train/loss": 2.163155108690262, "l2_grads": 2.15625, "lr": 0.0003884602290232045, "uptime": 129540.530726976, "examples_seen": 70297600.0, "progress": 0.6096640409225331, "epoch": 54.86997401587771, "img/sec/core": 549.8204752971654, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 35.96168036741333, "core_hours": 35.96168036741333} {"step": 68700, "l2_params": 342.18598173179157, "train/loss": 2.3754783868789673, "l2_grads": 2.3125, "lr": 0.0003877141768536419, "uptime": 129633.73542750801, "examples_seen": 70348800.0, "progress": 0.6101080788256086, "epoch": 54.90993758034667, "img/sec/core": 549.3285178509904, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 35.98757056200556, "core_hours": 35.98757056200556} {"step": 68750, "l2_params": 342.18597602400365, "train/loss": 2.2138383984565735, "l2_grads": 2.15625, "lr": 0.00038696838785898637, "uptime": 129726.93984776901, "examples_seen": 70400000.0, "progress": 0.6105521167286839, "epoch": 54.94990114481563, "img/sec/core": 549.3301697132612, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 36.01346067874473, "core_hours": 36.01346067874473} {"step": 68800, "l2_params": 342.1859931473671, "train/loss": 2.2195976972579956, "l2_grads": 2.1875, "lr": 0.00038622286378721377, "uptime": 129820.16477192802, "examples_seen": 70451200.0, "progress": 0.6109961546317594, "epoch": 54.98986470928458, "img/sec/core": 549.2093499874973, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 36.03935649101111, "core_hours": 36.03935649101111} {"step": 68850, "l2_params": 342.18594748506257, "train/loss": 4.821352601051331, "l2_grads": 2.015625, "lr": 0.00038547760638567947, "uptime": 129913.45279493701, "examples_seen": 70502400.0, "progress": 0.6114401925348347, "epoch": 55.02982827375354, "img/sec/core": 548.8378716640154, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 36.065269830735836, "core_hours": 36.065269830735836} {"step": 68900, "l2_params": 342.1859703162156, "train/loss": 2.1468129754066467, "l2_grads": 2.203125, "lr": 0.00038473261740111384, "uptime": 130006.70821629901, "examples_seen": 70553600.0, "progress": 0.6118842304379102, "epoch": 55.06979183822249, "img/sec/core": 549.0297427454639, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 36.091174114447504, "core_hours": 36.091174114447504} {"step": 68950, "l2_params": 342.18598173179157, "train/loss": 2.1715680956840515, "l2_grads": 2.265625, "lr": 0.00038398789857961775, "uptime": 130099.955355829, "examples_seen": 70604800.0, "progress": 0.6123282683409856, "epoch": 55.109755402691455, "img/sec/core": 549.0785053361416, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 36.117076097650276, "core_hours": 36.117076097650276} {"step": 69000, "l2_params": 342.1859417772741, "train/loss": 3.8711900115013123, "l2_grads": 2.09375, "lr": 0.00038324345166665944, "uptime": 130193.20607982401, "examples_seen": 70656000.0, "progress": 0.612772306244061, "epoch": 55.14971896716041, "img/sec/core": 549.0573993049294, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 36.142979076537785, "core_hours": 36.142979076537785} {"step": 69050, "l2_params": 342.1859988551548, "train/loss": 2.2978506684303284, "l2_grads": 2.171875, "lr": 0.0003824992784070699, "uptime": 130286.65637800001, "examples_seen": 70707200.0, "progress": 0.6132163441471364, "epoch": 55.189682531629366, "img/sec/core": 547.8848221925567, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 36.16893749269778, "core_hours": 36.16893749269778} {"step": 69100, "l2_params": 342.18590753054104, "train/loss": 3.4060736894607544, "l2_grads": 1.9453125, "lr": 0.00038175538054503765, "uptime": 130379.881135287, "examples_seen": 70758400.0, "progress": 0.6136603820502118, "epoch": 55.22964609609832, "img/sec/core": 549.2103330705015, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 36.194833258610835, "core_hours": 36.194833258610835} {"step": 69150, "l2_params": 342.1859931473671, "train/loss": 4.518410325050354, "l2_grads": 1.8515625, "lr": 0.00038101175982410685, "uptime": 130473.143647917, "examples_seen": 70809600.0, "progress": 0.6141044199532872, "epoch": 55.269609660567276, "img/sec/core": 548.9879969578676, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 36.22073951211917, "core_hours": 36.22073951211917} {"step": 69200, "l2_params": 342.1859931473671, "train/loss": 3.345633327960968, "l2_grads": 1.9296875, "lr": 0.0003802684179871713, "uptime": 130566.367427674, "examples_seen": 70860800.0, "progress": 0.6145484578563626, "epoch": 55.30957322503624, "img/sec/core": 549.2160920041293, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 36.24663500649611, "core_hours": 36.24663500649611} {"step": 69250, "l2_params": 342.18598173179157, "train/loss": 2.217877209186554, "l2_grads": 2.234375, "lr": 0.00037952535677647275, "uptime": 130659.569373618, "examples_seen": 70912000.0, "progress": 0.614992495759438, "epoch": 55.349536789505194, "img/sec/core": 549.3447532819583, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 36.272524435925, "core_hours": 36.272524435925} {"step": 69300, "l2_params": 342.18597602400365, "train/loss": 2.1220136880874634, "l2_grads": 2.203125, "lr": 0.00037878257793359327, "uptime": 130752.792586972, "examples_seen": 70963200.0, "progress": 0.6154365336625134, "epoch": 55.38950035397415, "img/sec/core": 549.2194289159639, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 36.29841977296778, "core_hours": 36.29841977296778} {"step": 69350, "l2_params": 342.18595890063926, "train/loss": 2.2624886631965637, "l2_grads": 2.234375, "lr": 0.0003780400831994539, "uptime": 130845.945995858, "examples_seen": 71014400.0, "progress": 0.6158805715655888, "epoch": 55.429463918443105, "img/sec/core": 549.6309862654894, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 36.32429571988055, "core_hours": 36.32429571988055} {"step": 69400, "l2_params": 342.1859703162156, "train/loss": 2.137821316719055, "l2_grads": 2.140625, "lr": 0.0003772978743143094, "uptime": 130939.13136431799, "examples_seen": 71065600.0, "progress": 0.6163246094686643, "epoch": 55.46942748291207, "img/sec/core": 549.4424805755011, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 36.350180544452776, "core_hours": 36.350180544452776} {"step": 69450, "l2_params": 342.18597602400365, "train/loss": 3.287795305252075, "l2_grads": 1.96875, "lr": 0.0003765559530177456, "uptime": 131032.35172321601, "examples_seen": 71116800.0, "progress": 0.6167686473717396, "epoch": 55.50939104738102, "img/sec/core": 549.2362463012137, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 36.376075088591115, "core_hours": 36.376075088591115} {"step": 69500, "l2_params": 342.1859189461191, "train/loss": 2.484284222126007, "l2_grads": 2.171875, "lr": 0.00037581432104867325, "uptime": 131125.605151736, "examples_seen": 71168000.0, "progress": 0.6172126852748151, "epoch": 55.54935461184998, "img/sec/core": 549.0414756066818, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 36.40197881873556, "core_hours": 36.40197881873556} {"step": 69550, "l2_params": 342.2093200805612, "train/loss": 2.3883712887763977, "l2_grads": 2.125, "lr": 0.00037507298014532607, "uptime": 131218.867623762, "examples_seen": 71219200.0, "progress": 0.6176567231778904, "epoch": 55.58931817631893, "img/sec/core": 548.9882359726726, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 36.427885060965, "core_hours": 36.427885060965} {"step": 69600, "l2_params": 342.20931437316256, "train/loss": 2.192826807498932, "l2_grads": 2.203125, "lr": 0.0003743319320452542, "uptime": 131312.390345104, "examples_seen": 71270400.0, "progress": 0.6181007610809659, "epoch": 55.62928174078789, "img/sec/core": 547.4605450450952, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 36.45386359467111, "core_hours": 36.45386359467111} {"step": 69650, "l2_params": 342.2093600323492, "train/loss": 2.3562276363372803, "l2_grads": 2.078125, "lr": 0.00037359117848532195, "uptime": 131405.591814911, "examples_seen": 71321600.0, "progress": 0.6185447989840412, "epoch": 55.66924530525685, "img/sec/core": 549.3475597115927, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 36.479752891839716, "core_hours": 36.479752891839716} {"step": 69700, "l2_params": 342.2093372027566, "train/loss": 4.674843907356262, "l2_grads": 2.078125, "lr": 0.00037285072120170424, "uptime": 131498.822572405, "examples_seen": 71372800.0, "progress": 0.6189888368871167, "epoch": 55.709208869725806, "img/sec/core": 549.1749866269594, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 36.505650324476946, "core_hours": 36.505650324476946} {"step": 69750, "l2_params": 342.20933149535824, "train/loss": 2.2742421627044678, "l2_grads": 2.15625, "lr": 0.0003721105619298805, "uptime": 131592.117428295, "examples_seen": 71424000.0, "progress": 0.619432874790192, "epoch": 55.74917243419476, "img/sec/core": 548.7976749798332, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 36.531565562224166, "core_hours": 36.531565562224166} {"step": 69800, "l2_params": 342.2093229342605, "train/loss": 2.4111730456352234, "l2_grads": 2.34375, "lr": 0.00037137070240463184, "uptime": 131685.429108225, "examples_seen": 71475200.0, "progress": 0.6198769126932675, "epoch": 55.78913599866372, "img/sec/core": 548.6987270875268, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 36.557485473315836, "core_hours": 36.557485473315836} {"step": 69850, "l2_params": 342.20933149535824, "train/loss": 2.2576982975006104, "l2_grads": 2.171875, "lr": 0.0003706311443600378, "uptime": 131779.939819803, "examples_seen": 71526400.0, "progress": 0.620320950596343, "epoch": 55.82909956313267, "img/sec/core": 541.7375358321553, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 36.58373844875416, "core_hours": 36.58373844875416} {"step": 69900, "l2_params": 342.20935717865024, "train/loss": 2.309596359729767, "l2_grads": 2.125, "lr": 0.00036989188952946974, "uptime": 131873.22138105, "examples_seen": 71577600.0, "progress": 0.6207649884994183, "epoch": 55.869063127601635, "img/sec/core": 548.8758905355312, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 36.609649993545, "core_hours": 36.609649993545} {"step": 69950, "l2_params": 342.20938286194024, "train/loss": 4.620411515235901, "l2_grads": 2.015625, "lr": 0.0003691529396455893, "uptime": 131966.517720895, "examples_seen": 71628800.0, "progress": 0.6212090264024938, "epoch": 55.90902669207059, "img/sec/core": 548.7889459014759, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 36.63556564350195, "core_hours": 36.63556564350195} {"step": 70000, "l2_params": 342.2327567104368, "train/loss": 2.9909916520118713, "l2_grads": 2.0, "lr": 0.0003684142964403433, "uptime": 132059.836185208, "examples_seen": 71680000.0, "progress": 0.6216530643055691, "epoch": 55.948990256539545, "img/sec/core": 548.6588359220463, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 36.661487439144445, "core_hours": 36.661487439144445, "val/acc@1": 0.6576849489795918, "val/loss": 1.4142553867125998, "z/secs/eval/val": 31.75059388601221} {"step": 70050, "l2_params": 342.2326996403544, "train/loss": 2.312730312347412, "l2_grads": 2.28125, "lr": 0.00036767596164495966, "uptime": 132184.76671459302, "examples_seen": 71731200.0, "progress": 0.6220971022086446, "epoch": 55.9889538210085, "img/sec/core": 409.82776789657544, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 36.696190363973614, "core_hours": 36.696190363973614} {"step": 70101, "l2_params": 342.23267681231874, "train/loss": 3.7156063318252563, "l2_grads": 1.8671875, "lr": 0.00036693793698994355, "uptime": 132278.040781699, "examples_seen": 71782400.0, "progress": 0.6225411401117199, "epoch": 56.028917385477456, "img/sec/core": 548.9199901814234, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 36.722099827058614, "core_hours": 36.722099827058614} {"step": 70150, "l2_params": 342.23267681231874, "train/loss": 2.196609616279602, "l2_grads": 2.234375, "lr": 0.0003662002242050735, "uptime": 132371.358125793, "examples_seen": 71833600.0, "progress": 0.6229851780147954, "epoch": 56.06888094994642, "img/sec/core": 548.6654222438324, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 36.748021311529165, "core_hours": 36.748021311529165} {"step": 70200, "l2_params": 342.23266539830036, "train/loss": 4.567290782928467, "l2_grads": 1.9765625, "lr": 0.00036546282501939605, "uptime": 132464.607318101, "examples_seen": 71884800.0, "progress": 0.6234292159178707, "epoch": 56.108844514415374, "img/sec/core": 549.0664179789861, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 36.77392386494806, "core_hours": 36.77392386494806} {"step": 70250, "l2_params": 342.2326825193278, "train/loss": 4.4232337474823, "l2_grads": 1.9375, "lr": 0.00036472574116122423, "uptime": 132557.865074237, "examples_seen": 71936000.0, "progress": 0.6238732538209462, "epoch": 56.14880807888433, "img/sec/core": 549.0159973969899, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 36.79982879720806, "core_hours": 36.79982879720806} {"step": 70300, "l2_params": 342.2326996403544, "train/loss": 4.2215012311935425, "l2_grads": 1.875, "lr": 0.0003639889743581306, "uptime": 132651.110650705, "examples_seen": 71987200.0, "progress": 0.6243172917240216, "epoch": 56.188771643353284, "img/sec/core": 549.0877094589886, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 36.82573034622694, "core_hours": 36.82573034622694} {"step": 70350, "l2_params": 342.2326739588142, "train/loss": 3.825348734855652, "l2_grads": 1.953125, "lr": 0.0003632525263369456, "uptime": 132744.403778097, "examples_seen": 72038400.0, "progress": 0.624761329627097, "epoch": 56.22873520782224, "img/sec/core": 548.8078428849444, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 36.851645103835835, "core_hours": 36.851645103835835} {"step": 70400, "l2_params": 342.23267966582324, "train/loss": 3.8306546807289124, "l2_grads": 1.9609375, "lr": 0.00036251639882375187, "uptime": 132837.698649529, "examples_seen": 72089600.0, "progress": 0.6252053675301724, "epoch": 56.2686987722912, "img/sec/core": 548.7975835555944, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 36.87756034590028, "core_hours": 36.87756034590028} {"step": 70450, "l2_params": 342.2326625447957, "train/loss": 2.2572620511054993, "l2_grads": 2.359375, "lr": 0.0003617805935438813, "uptime": 132930.934287327, "examples_seen": 72140800.0, "progress": 0.6256494054332478, "epoch": 56.30866233676016, "img/sec/core": 549.1462407424702, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 36.903459134177496, "core_hours": 36.903459134177496} {"step": 70500, "l2_params": 342.23266825180497, "train/loss": 3.488305687904358, "l2_grads": 1.8984375, "lr": 0.00036104511222191004, "uptime": 133024.196756323, "examples_seen": 72192000.0, "progress": 0.6260934433363232, "epoch": 56.34862590122911, "img/sec/core": 548.988253808553, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 36.929365375565276, "core_hours": 36.929365375565276} {"step": 70550, "l2_params": 342.2326853728323, "train/loss": 2.54155832529068, "l2_grads": 2.109375, "lr": 0.0003603099565816554, "uptime": 133117.488600619, "examples_seen": 72243200.0, "progress": 0.6265374812393986, "epoch": 56.38858946569807, "img/sec/core": 548.8153909527468, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 36.95527977675861, "core_hours": 36.95527977675861} {"step": 70600, "l2_params": 342.23266825180497, "train/loss": 2.5313316583633423, "l2_grads": 2.125, "lr": 0.0003595751283461715, "uptime": 133210.69587949102, "examples_seen": 72294400.0, "progress": 0.626981519142474, "epoch": 56.42855303016703, "img/sec/core": 549.3133220882702, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 36.98117068755639, "core_hours": 36.98117068755639} {"step": 70650, "l2_params": 342.2326625447957, "train/loss": 2.9528303146362305, "l2_grads": 2.015625, "lr": 0.00035884062923774456, "uptime": 133303.933909965, "examples_seen": 72345600.0, "progress": 0.6274255570455494, "epoch": 56.468516594635986, "img/sec/core": 549.1321485419134, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 37.007070140465835, "core_hours": 37.007070140465835} {"step": 70700, "l2_params": 342.2326910798412, "train/loss": 2.7571953535079956, "l2_grads": 1.9609375, "lr": 0.0003581064609778893, "uptime": 133397.232155059, "examples_seen": 72396800.0, "progress": 0.6278695949486248, "epoch": 56.50848015910494, "img/sec/core": 548.7777390498712, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 37.032986319658605, "core_hours": 37.032986319658605} {"step": 70750, "l2_params": 342.23257693964496, "train/loss": 2.870854437351227, "l2_grads": 2.109375, "lr": 0.0003573726252873454, "uptime": 133490.496426448, "examples_seen": 72448000.0, "progress": 0.6283136328517002, "epoch": 56.5484437235739, "img/sec/core": 548.9776442518989, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 37.05889306171111, "core_hours": 37.05889306171111} {"step": 70800, "l2_params": 342.24433317989354, "train/loss": 2.103826880455017, "l2_grads": 2.140625, "lr": 0.0003566391238860735, "uptime": 133583.827997081, "examples_seen": 72499200.0, "progress": 0.6287576707547756, "epoch": 56.58840728804285, "img/sec/core": 548.5817891281376, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 37.08481849799806, "core_hours": 37.08481849799806} {"step": 70850, "l2_params": 342.2443503003373, "train/loss": 4.742801904678345, "l2_grads": 1.984375, "lr": 0.0003559059584932502, "uptime": 133677.38235513002, "examples_seen": 72550400.0, "progress": 0.6292017086578511, "epoch": 56.628370852511814, "img/sec/core": 547.2754136496867, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 37.11080581967834, "core_hours": 37.11080581967834} {"step": 70900, "l2_params": 342.24435600715174, "train/loss": 2.2693424820899963, "l2_grads": 2.234375, "lr": 0.0003551731308272641, "uptime": 133770.669476961, "examples_seen": 72601600.0, "progress": 0.6296457465609264, "epoch": 56.66833441698077, "img/sec/core": 548.8431735815464, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 37.13671890907583, "core_hours": 37.13671890907583} {"step": 70950, "l2_params": 342.2442532844781, "train/loss": 3.3320721983909607, "l2_grads": 1.984375, "lr": 0.00035444064260571303, "uptime": 133863.997592489, "examples_seen": 72652800.0, "progress": 0.6300897844640019, "epoch": 56.708297981449725, "img/sec/core": 548.6020982030017, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 37.16264338561139, "core_hours": 37.16264338561139} {"step": 71000, "l2_params": 342.2443503003373, "train/loss": 2.1535271406173706, "l2_grads": 2.265625, "lr": 0.00035370849554539904, "uptime": 133957.324925458, "examples_seen": 72704000.0, "progress": 0.6305338223670772, "epoch": 56.74826154591868, "img/sec/core": 548.6066982864256, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 37.18856764476945, "core_hours": 37.18856764476945} {"step": 71050, "l2_params": 342.2443503003373, "train/loss": 2.4517300724983215, "l2_grads": 2.15625, "lr": 0.00035297669136232423, "uptime": 134050.788730085, "examples_seen": 72755200.0, "progress": 0.6309778602701527, "epoch": 56.788225110387636, "img/sec/core": 547.80564737681, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 37.21452981272139, "core_hours": 37.21452981272139} {"step": 71100, "l2_params": 342.2443503003373, "train/loss": 2.5956472158432007, "l2_grads": 2.0625, "lr": 0.00035224523177168756, "uptime": 134144.03372444402, "examples_seen": 72806400.0, "progress": 0.631421898173228, "epoch": 56.8281886748566, "img/sec/core": 549.0911372987412, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 37.24043120004333, "core_hours": 37.24043120004333} {"step": 71150, "l2_params": 342.2443274730788, "train/loss": 3.1067545413970947, "l2_grads": 1.828125, "lr": 0.0003515141184878798, "uptime": 134237.28628146, "examples_seen": 72857600.0, "progress": 0.6318659360763035, "epoch": 56.86815223932555, "img/sec/core": 549.0466067458873, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 37.266334688103335, "core_hours": 37.266334688103335} {"step": 71200, "l2_params": 342.24433888670825, "train/loss": 3.374411880970001, "l2_grads": 2.0625, "lr": 0.00035078335322448007, "uptime": 134330.621914051, "examples_seen": 72908800.0, "progress": 0.6323099739793788, "epoch": 56.90811580379451, "img/sec/core": 548.557914900012, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 37.292261252711945, "core_hours": 37.292261252711945} {"step": 71250, "l2_params": 342.24435600715174, "train/loss": 2.2383884489536285, "l2_grads": 2.234375, "lr": 0.0003500529376942527, "uptime": 134423.952406425, "examples_seen": 72960000.0, "progress": 0.6327540118824543, "epoch": 56.948079368263464, "img/sec/core": 548.5881269631814, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 37.318186389482506, "core_hours": 37.318186389482506} {"step": 71300, "l2_params": 342.2443274730788, "train/loss": 2.7099488973617554, "l2_grads": 2.265625, "lr": 0.00034932287360914135, "uptime": 134517.25017040301, "examples_seen": 73011200.0, "progress": 0.6331980497855297, "epoch": 56.98804293273242, "img/sec/core": 548.7805689755342, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 37.34410243503194, "core_hours": 37.34410243503194} {"step": 71350, "l2_params": 342.2443503003373, "train/loss": 2.2208524346351624, "l2_grads": 2.40625, "lr": 0.0003485931626802663, "uptime": 134610.6259912, "examples_seen": 73062400.0, "progress": 0.6336420876886051, "epoch": 57.02800649720138, "img/sec/core": 548.3218199635652, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 37.37004016303111, "core_hours": 37.37004016303111} {"step": 71400, "l2_params": 342.24435600715174, "train/loss": 2.1228451132774353, "l2_grads": 2.171875, "lr": 0.00034786380661792, "uptime": 134703.96422270001, "examples_seen": 73113600.0, "progress": 0.6340861255916805, "epoch": 57.06797006167034, "img/sec/core": 548.5426408576968, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 37.39596744955889, "core_hours": 37.39596744955889} {"step": 71450, "l2_params": 342.24435600715174, "train/loss": 2.14079612493515, "l2_grads": 2.25, "lr": 0.00034713480713156333, "uptime": 134797.332164668, "examples_seen": 73164800.0, "progress": 0.6345301634947559, "epoch": 57.10793362613929, "img/sec/core": 548.3680899547852, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 37.42190298899445, "core_hours": 37.42190298899445} {"step": 71500, "l2_params": 342.24437883440834, "train/loss": 2.239999294281006, "l2_grads": 2.21875, "lr": 0.00034640616592982154, "uptime": 134891.998211863, "examples_seen": 73216000.0, "progress": 0.6349742013978313, "epoch": 57.14789719060825, "img/sec/core": 540.8486095815703, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 37.44819911321528, "core_hours": 37.44819911321528} {"step": 71550, "l2_params": 342.24433317989354, "train/loss": 3.478872239589691, "l2_grads": 2.015625, "lr": 0.00034567788472047957, "uptime": 134985.315036176, "examples_seen": 73267200.0, "progress": 0.6354182393009067, "epoch": 57.18786075507721, "img/sec/core": 548.6684783471796, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 37.47412045330223, "core_hours": 37.47412045330223} {"step": 71600, "l2_params": 342.2443503003373, "train/loss": 2.1406443119049072, "l2_grads": 2.203125, "lr": 0.00034494996521047946, "uptime": 135078.70161478702, "examples_seen": 73318400.0, "progress": 0.6358622772039821, "epoch": 57.227824319546166, "img/sec/core": 548.2586551678548, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 37.50006116958306, "core_hours": 37.50006116958306} {"step": 71650, "l2_params": 342.2443731275943, "train/loss": 4.7573630809783936, "l2_grads": 1.9921875, "lr": 0.0003442224091059148, "uptime": 135172.09590831, "examples_seen": 73369600.0, "progress": 0.6363063151070575, "epoch": 57.26778788401512, "img/sec/core": 548.213365813391, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 37.526004028895, "core_hours": 37.526004028895} {"step": 71700, "l2_params": 342.24433317989354, "train/loss": 3.785961151123047, "l2_grads": 1.9140625, "lr": 0.00034349521811202755, "uptime": 135265.46071094, "examples_seen": 73420800.0, "progress": 0.6367503530101329, "epoch": 57.307751448484076, "img/sec/core": 548.3865285175953, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 37.551938696292225, "core_hours": 37.551938696292225} {"step": 71750, "l2_params": 342.24433317989354, "train/loss": 2.1581397652626038, "l2_grads": 2.09375, "lr": 0.00034276839393320406, "uptime": 135358.797507563, "examples_seen": 73472000.0, "progress": 0.6371943909132084, "epoch": 57.34771501295303, "img/sec/core": 548.5510736651037, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 37.57786558424305, "core_hours": 37.57786558424305} {"step": 71800, "l2_params": 342.2442418708458, "train/loss": 4.36127781867981, "l2_grads": 1.96875, "lr": 0.00034204193827297094, "uptime": 135452.183226017, "examples_seen": 73523200.0, "progress": 0.6376384288162837, "epoch": 57.387678577421994, "img/sec/core": 548.2637050677349, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 37.603806061591385, "core_hours": 37.603806061591385} {"step": 71850, "l2_params": 342.2442418708458, "train/loss": 2.288016617298126, "l2_grads": 2.265625, "lr": 0.000341315852833991, "uptime": 135545.54487246, "examples_seen": 73574400.0, "progress": 0.6380824667193592, "epoch": 57.42764214189095, "img/sec/core": 548.4050672911632, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 37.62973985227, "core_hours": 37.62973985227} {"step": 71900, "l2_params": 342.24423616402953, "train/loss": 2.160999894142151, "l2_grads": 2.1875, "lr": 0.00034059013931805974, "uptime": 135638.902740821, "examples_seen": 73625600.0, "progress": 0.6385265046224345, "epoch": 57.467605706359905, "img/sec/core": 548.4272605927555, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 37.65567259348139, "core_hours": 37.65567259348139} {"step": 71950, "l2_params": 342.24423616402953, "train/loss": 2.762095630168915, "l2_grads": 2.109375, "lr": 0.00033986479942610013, "uptime": 135732.169776865, "examples_seen": 73676800.0, "progress": 0.63897054252551, "epoch": 57.50756927082886, "img/sec/core": 548.9613712593626, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 37.68158010349361, "core_hours": 37.68158010349361} {"step": 72000, "l2_params": 342.2442532844781, "train/loss": 2.2792879939079285, "l2_grads": 2.1875, "lr": 0.00033913983485816054, "uptime": 135825.493434822, "examples_seen": 73728000.0, "progress": 0.6394145804285853, "epoch": 57.547532835297815, "img/sec/core": 548.6283019851077, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 37.707503341815006, "core_hours": 37.707503341815006} {"step": 72050, "l2_params": 342.24420762994663, "train/loss": 2.2618733048439026, "l2_grads": 2.265625, "lr": 0.000338415247313408, "uptime": 135919.062210859, "examples_seen": 73779200.0, "progress": 0.6398586183316608, "epoch": 57.58749639976678, "img/sec/core": 547.1910841257434, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 37.73349466849194, "core_hours": 37.73349466849194} {"step": 72100, "l2_params": 342.2442019231297, "train/loss": 2.797356605529785, "l2_grads": 2.140625, "lr": 0.0003376910384901277, "uptime": 136012.36640063, "examples_seen": 73830400.0, "progress": 0.6403026562347361, "epoch": 57.62745996423573, "img/sec/core": 548.7427748492175, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 37.75941249898389, "core_hours": 37.75941249898389} {"step": 72150, "l2_params": 342.24420762994663, "train/loss": 3.3415544629096985, "l2_grads": 2.0, "lr": 0.00033696721008571627, "uptime": 136105.872932211, "examples_seen": 73881600.0, "progress": 0.6407466941378116, "epoch": 57.66742352870469, "img/sec/core": 547.5553325989065, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 37.785386535534165, "core_hours": 37.785386535534165} {"step": 72200, "l2_params": 342.24420762994663, "train/loss": 3.8048835396766663, "l2_grads": 2.046875, "lr": 0.00033624376379667864, "uptime": 136199.24370108, "examples_seen": 73932800.0, "progress": 0.6411907320408871, "epoch": 57.707387093173644, "img/sec/core": 548.3514875178064, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 37.81132286022, "core_hours": 37.81132286022} {"step": 72250, "l2_params": 342.2441962163128, "train/loss": 2.268941879272461, "l2_grads": 2.46875, "lr": 0.0003355207013186243, "uptime": 136292.616095661, "examples_seen": 73984000.0, "progress": 0.6416347699439624, "epoch": 57.7473506576426, "img/sec/core": 548.341940139293, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 37.837259636492504, "core_hours": 37.837259636492504} {"step": 72300, "l2_params": 342.2442019231297, "train/loss": 2.13894921541214, "l2_grads": 2.40625, "lr": 0.0003347980243462632, "uptime": 136386.026837439, "examples_seen": 74035200.0, "progress": 0.6420788078470379, "epoch": 57.78731422211156, "img/sec/core": 548.1168335187846, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 37.86320706476417, "core_hours": 37.86320706476417} {"step": 72350, "l2_params": 342.2441905094957, "train/loss": 2.131053388118744, "l2_grads": 2.15625, "lr": 0.0003340757345734019, "uptime": 136479.402950522, "examples_seen": 74086400.0, "progress": 0.6425228457501132, "epoch": 57.82727778658052, "img/sec/core": 548.3201036061546, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 37.88914487395389, "core_hours": 37.88914487395389} {"step": 72400, "l2_params": 342.24417909586134, "train/loss": 2.721307873725891, "l2_grads": 2.15625, "lr": 0.0003333538336929389, "uptime": 136572.762929436, "examples_seen": 74137600.0, "progress": 0.6429668836531887, "epoch": 57.86724135104947, "img/sec/core": 548.414862509387, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 37.91507820143, "core_hours": 37.91507820143} {"step": 72450, "l2_params": 342.2442304572131, "train/loss": 2.9884414672851562, "l2_grads": 2.015625, "lr": 0.000332632323396862, "uptime": 136666.054877227, "examples_seen": 74188800.0, "progress": 0.643410921556264, "epoch": 57.90720491551843, "img/sec/core": 548.8147821149613, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 37.94099263137194, "core_hours": 37.94099263137194} {"step": 72500, "l2_params": 342.2442190435801, "train/loss": 2.763931691646576, "l2_grads": 2.15625, "lr": 0.00033191120537624325, "uptime": 136759.33706675, "examples_seen": 74240000.0, "progress": 0.6438549594593395, "epoch": 57.94716847998739, "img/sec/core": 548.8721937360559, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 37.96690435068389, "core_hours": 37.96690435068389, "val/acc@1": 0.6608139349489796, "val/loss": 1.406020565604677, "z/secs/eval/val": 31.774380210001254} {"step": 72550, "l2_params": 342.24423616402953, "train/loss": 2.1597060561180115, "l2_grads": 2.171875, "lr": 0.0003311904813212346, "uptime": 136884.102503923, "examples_seen": 74291200.0, "progress": 0.6442989973624148, "epoch": 57.987132044456345, "img/sec/core": 410.37006049208173, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 38.00156141656528, "core_hours": 38.00156141656528} {"step": 72600, "l2_params": 342.24425043107004, "train/loss": 4.053862273693085, "l2_grads": 1.9765625, "lr": 0.0003304701529210657, "uptime": 136977.38056439, "examples_seen": 74342400.0, "progress": 0.6447430352654903, "epoch": 58.0270956089253, "img/sec/core": 548.8964901677738, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 38.02747198891723, "core_hours": 38.02747198891723} {"step": 72650, "l2_params": 342.24418194926994, "train/loss": 2.2228968739509583, "l2_grads": 2.234375, "lr": 0.0003297502218640381, "uptime": 137070.756048414, "examples_seen": 74393600.0, "progress": 0.6451870731685657, "epoch": 58.067059173394256, "img/sec/core": 548.3237975702518, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 38.05340962336834, "core_hours": 38.05340962336834} {"step": 72700, "l2_params": 342.24418765608715, "train/loss": 2.281442880630493, "l2_grads": 2.234375, "lr": 0.0003290306898375224, "uptime": 137164.161855221, "examples_seen": 74444800.0, "progress": 0.6456311110716411, "epoch": 58.10702273786321, "img/sec/core": 548.1457925394263, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 38.07935568081472, "core_hours": 38.07935568081472} {"step": 72750, "l2_params": 342.24418194926994, "train/loss": 2.230642318725586, "l2_grads": 2.28125, "lr": 0.0003283115585279539, "uptime": 137257.417753579, "examples_seen": 74496000.0, "progress": 0.6460751489747165, "epoch": 58.146986302332174, "img/sec/core": 549.0269345049174, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 38.10526009702528, "core_hours": 38.10526009702528} {"step": 72800, "l2_params": 342.2441962163128, "train/loss": 3.6489030718803406, "l2_grads": 1.8828125, "lr": 0.000327592829620829, "uptime": 137350.727537153, "examples_seen": 74547200.0, "progress": 0.6465191868777919, "epoch": 58.18694986680113, "img/sec/core": 548.7098784169932, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 38.13117948135139, "core_hours": 38.13117948135139} {"step": 72850, "l2_params": 342.24417338904397, "train/loss": 2.326537609100342, "l2_grads": 2.28125, "lr": 0.00032687450480069994, "uptime": 137444.023574624, "examples_seen": 74598400.0, "progress": 0.6469632247808673, "epoch": 58.226913431270084, "img/sec/core": 548.7907245354326, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 38.15709504731556, "core_hours": 38.15709504731556} {"step": 72900, "l2_params": 342.2442704049258, "train/loss": 4.6726847887039185, "l2_grads": 2.0625, "lr": 0.00032615658575117307, "uptime": 137537.371549099, "examples_seen": 74649600.0, "progress": 0.6474072626839427, "epoch": 58.26687699573904, "img/sec/core": 548.4853880113704, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 38.18302504022528, "core_hours": 38.18302504022528} {"step": 72950, "l2_params": 342.24417338904397, "train/loss": 2.587092638015747, "l2_grads": 2.25, "lr": 0.0003254390741549035, "uptime": 137630.726529387, "examples_seen": 74700800.0, "progress": 0.6478513005870181, "epoch": 58.306840560207995, "img/sec/core": 548.4442269930933, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 38.20895697919416, "core_hours": 38.20895697919416} {"step": 73000, "l2_params": 342.24418480267855, "train/loss": 2.751080274581909, "l2_grads": 2.0625, "lr": 0.00032472197169359, "uptime": 137724.002717825, "examples_seen": 74752000.0, "progress": 0.6482953384900935, "epoch": 58.34680412467696, "img/sec/core": 548.9075063785589, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 38.23486703153806, "core_hours": 38.23486703153806} {"step": 73051, "l2_params": 342.244161975409, "train/loss": 2.2671412229537964, "l2_grads": 2.234375, "lr": 0.00032400528004797454, "uptime": 137817.540608023, "examples_seen": 74803200.0, "progress": 0.6487393763931689, "epoch": 58.38676768914591, "img/sec/core": 547.3717644434812, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 38.26084977881528, "core_hours": 38.26084977881528} {"step": 73100, "l2_params": 342.24417909586134, "train/loss": 4.808195352554321, "l2_grads": 2.125, "lr": 0.0003232890008978343, "uptime": 137910.813820882, "examples_seen": 74854400.0, "progress": 0.6491834142962444, "epoch": 58.42673125361487, "img/sec/core": 548.9250174902696, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 38.28675900460944, "core_hours": 38.28675900460944} {"step": 73150, "l2_params": 342.24418480267855, "train/loss": 2.8776628971099854, "l2_grads": 2.046875, "lr": 0.00032257313592198096, "uptime": 138004.089010221, "examples_seen": 74905600.0, "progress": 0.6496274521993197, "epoch": 58.46669481808382, "img/sec/core": 548.9133858942233, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 38.312668779425834, "core_hours": 38.312668779425834} {"step": 73200, "l2_params": 342.24417909586134, "train/loss": 2.1965587735176086, "l2_grads": 2.21875, "lr": 0.00032185768679825503, "uptime": 138097.34255019302, "examples_seen": 74956800.0, "progress": 0.6500714901023952, "epoch": 58.50665838255278, "img/sec/core": 549.0408194195003, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 38.33857254052917, "core_hours": 38.33857254052917} {"step": 73250, "l2_params": 342.24417909586134, "train/loss": 2.897850751876831, "l2_grads": 2.109375, "lr": 0.0003211426552035218, "uptime": 138190.619431803, "examples_seen": 75008000.0, "progress": 0.6505155280054705, "epoch": 58.54662194702174, "img/sec/core": 548.9034272616498, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 38.36448278542083, "core_hours": 38.36448278542083} {"step": 73300, "l2_params": 342.2441905094957, "train/loss": 2.6143460273742676, "l2_grads": 2.203125, "lr": 0.0003204280428136689, "uptime": 138283.944523427, "examples_seen": 75059200.0, "progress": 0.650959565908546, "epoch": 58.586585511490696, "img/sec/core": 548.6198739164956, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 38.39040642198305, "core_hours": 38.39040642198305} {"step": 73350, "l2_params": 342.24417909586134, "train/loss": 2.1879855394363403, "l2_grads": 2.3125, "lr": 0.0003197138513036011, "uptime": 138377.240656362, "examples_seen": 75110400.0, "progress": 0.6514036038116213, "epoch": 58.62654907595965, "img/sec/core": 548.7901629927934, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 38.416322014464996, "core_hours": 38.416322014464996} {"step": 73400, "l2_params": 342.24417338904397, "train/loss": 2.274429678916931, "l2_grads": 2.15625, "lr": 0.0003190000823472359, "uptime": 138470.615366544, "examples_seen": 75161600.0, "progress": 0.6518476417146968, "epoch": 58.66651264042861, "img/sec/core": 548.3283417984351, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 38.44225943396, "core_hours": 38.44225943396} {"step": 73450, "l2_params": 342.24418480267855, "train/loss": 3.208728849887848, "l2_grads": 2.046875, "lr": 0.0003182867376175022, "uptime": 138563.903108599, "examples_seen": 75212800.0, "progress": 0.6522916796177721, "epoch": 58.70647620489757, "img/sec/core": 548.839524594798, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 38.46817269564195, "core_hours": 38.46817269564195} {"step": 73500, "l2_params": 342.24418480267855, "train/loss": 4.09929621219635, "l2_grads": 1.984375, "lr": 0.000317573818786333, "uptime": 138657.115403013, "examples_seen": 75264000.0, "progress": 0.6527357175208476, "epoch": 58.746439769366525, "img/sec/core": 549.2837647853294, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 38.494064999645836, "core_hours": 38.494064999645836} {"step": 73550, "l2_params": 342.24418480267855, "train/loss": 3.5491310358047485, "l2_grads": 1.953125, "lr": 0.00031686132752466325, "uptime": 138750.369526809, "examples_seen": 75315200.0, "progress": 0.653179755423923, "epoch": 58.78640333383548, "img/sec/core": 549.0373821109928, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 38.5199689229225, "core_hours": 38.5199689229225} {"step": 73600, "l2_params": 342.24417053563525, "train/loss": 4.592372536659241, "l2_grads": 2.0625, "lr": 0.00031614926550242663, "uptime": 138844.687203794, "examples_seen": 75366400.0, "progress": 0.6536237933269984, "epoch": 58.826366898304435, "img/sec/core": 542.8462790505838, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 38.54616827764055, "core_hours": 38.54616827764055} {"step": 73650, "l2_params": 342.24417338904397, "train/loss": 2.205401837825775, "l2_grads": 2.1875, "lr": 0.00031543763438855, "uptime": 138937.876933777, "examples_seen": 75417600.0, "progress": 0.6540678312300738, "epoch": 58.86633046277339, "img/sec/core": 549.4167652307954, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 38.57205431374694, "core_hours": 38.57205431374694} {"step": 73700, "l2_params": 342.24416768222653, "train/loss": 4.513331055641174, "l2_grads": 1.953125, "lr": 0.0003147264358509509, "uptime": 139031.171531311, "examples_seen": 75468800.0, "progress": 0.6545118691331492, "epoch": 58.90629402724235, "img/sec/core": 548.79919473732, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 38.59796947972861, "core_hours": 38.59796947972861} {"step": 73750, "l2_params": 342.24416768222653, "train/loss": 2.360186517238617, "l2_grads": 2.21875, "lr": 0.0003140156715565325, "uptime": 139124.52109680302, "examples_seen": 75520000.0, "progress": 0.6549559070362246, "epoch": 58.94625759171131, "img/sec/core": 548.4760398202544, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 38.623899914587504, "core_hours": 38.623899914587504} {"step": 73800, "l2_params": 342.244161975409, "train/loss": 2.3214500546455383, "l2_grads": 2.171875, "lr": 0.0003133053431711799, "uptime": 139217.861283392, "examples_seen": 75571200.0, "progress": 0.6553999449393, "epoch": 58.986221156180264, "img/sec/core": 548.531151169129, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 38.649827744195555, "core_hours": 38.649827744195555} {"step": 73850, "l2_params": 342.244161975409, "train/loss": 2.6172571182250977, "l2_grads": 2.1875, "lr": 0.0003125954523597573, "uptime": 139311.222889143, "examples_seen": 75622400.0, "progress": 0.6558439828423754, "epoch": 59.02618472064922, "img/sec/core": 548.4053063156231, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 38.675761523570834, "core_hours": 38.675761523570834} {"step": 73900, "l2_params": 342.244161975409, "train/loss": 4.593106985092163, "l2_grads": 2.078125, "lr": 0.0003118860007861026, "uptime": 139404.580462441, "examples_seen": 75673600.0, "progress": 0.6562880207454508, "epoch": 59.066148285118174, "img/sec/core": 548.4289939347367, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 38.701694182820276, "core_hours": 38.701694182820276} {"step": 73950, "l2_params": 342.2441648288178, "train/loss": 2.192857563495636, "l2_grads": 2.171875, "lr": 0.0003111769901130252, "uptime": 139497.868155403, "examples_seen": 75724800.0, "progress": 0.6567320586485262, "epoch": 59.10611184958714, "img/sec/core": 548.8398134237287, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 38.72760743086528, "core_hours": 38.72760743086528} {"step": 74000, "l2_params": 342.24417053563525, "train/loss": 2.025169998407364, "l2_grads": 2.25, "lr": 0.00031046842200229985, "uptime": 139591.177871164, "examples_seen": 75776000.0, "progress": 0.6571760965516017, "epoch": 59.14607541405609, "img/sec/core": 548.7102771928728, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 38.75352679635444, "core_hours": 38.75352679635444} {"step": 74050, "l2_params": 342.2500142668003, "train/loss": 3.4133164286613464, "l2_grads": 1.9375, "lr": 0.00030976029811466524, "uptime": 139685.072656144, "examples_seen": 75827200.0, "progress": 0.657620134454677, "epoch": 59.18603897852505, "img/sec/core": 545.2912002609789, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 38.77960868107111, "core_hours": 38.77960868107111} {"step": 74100, "l2_params": 342.24998573319914, "train/loss": 2.153037816286087, "l2_grads": 2.234375, "lr": 0.00030905262010981764, "uptime": 139779.447459985, "examples_seen": 75878400.0, "progress": 0.6580641723577525, "epoch": 59.226002542994, "img/sec/core": 542.5176839176439, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 38.80582390436028, "core_hours": 38.80582390436028} {"step": 74150, "l2_params": 342.25000856008023, "train/loss": 3.328559696674347, "l2_grads": 2.0625, "lr": 0.00030834538964640977, "uptime": 139872.718748954, "examples_seen": 75929600.0, "progress": 0.6585082102608278, "epoch": 59.26596610746296, "img/sec/core": 548.9363400672682, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 38.831732595740554, "core_hours": 38.831732595740554} {"step": 74200, "l2_params": 342.25000856008023, "train/loss": 4.376598954200745, "l2_grads": 1.9375, "lr": 0.00030763860838204407, "uptime": 139966.67901194, "examples_seen": 75980800.0, "progress": 0.6589522481639033, "epoch": 59.30592967193192, "img/sec/core": 544.9112036610162, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 38.85783266879222, "core_hours": 38.85783266879222} {"step": 74250, "l2_params": 342.2442047765382, "train/loss": 2.283259630203247, "l2_grads": 2.265625, "lr": 0.00030693227797327064, "uptime": 140059.922768183, "examples_seen": 76032000.0, "progress": 0.6593962860669786, "epoch": 59.345893236400876, "img/sec/core": 549.0984282804934, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 38.88373371219305, "core_hours": 38.88373371219305} {"step": 74300, "l2_params": 342.24418765608715, "train/loss": 2.210647940635681, "l2_grads": 2.328125, "lr": 0.000306226400075583, "uptime": 140154.342832122, "examples_seen": 76083200.0, "progress": 0.6598403239700541, "epoch": 59.38585680086983, "img/sec/core": 542.2576289831331, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 38.909961507731666, "core_hours": 38.909961507731666} {"step": 74350, "l2_params": 342.25589213792216, "train/loss": 2.1439013183116913, "l2_grads": 2.265625, "lr": 0.0003055209763434141, "uptime": 140247.691242368, "examples_seen": 76134400.0, "progress": 0.6602843618731294, "epoch": 59.42582036533879, "img/sec/core": 548.4828275605108, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 38.93589162168889, "core_hours": 38.93589162168889} {"step": 74400, "l2_params": 342.2558407783204, "train/loss": 2.429973840713501, "l2_grads": 2.296875, "lr": 0.0003048160084301321, "uptime": 140342.039505672, "examples_seen": 76185600.0, "progress": 0.6607283997762049, "epoch": 59.46578392980775, "img/sec/core": 542.6702962726739, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 38.96209947260666, "core_hours": 38.96209947260666} {"step": 74450, "l2_params": 342.25000856008023, "train/loss": 2.1803559064865112, "l2_grads": 2.296875, "lr": 0.0003041114979880368, "uptime": 140435.44399866, "examples_seen": 76236800.0, "progress": 0.6611724376792804, "epoch": 59.505747494276704, "img/sec/core": 548.1535027076669, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 38.98804516510333, "core_hours": 38.98804516510333} {"step": 74500, "l2_params": 342.2558521915659, "train/loss": 2.462563157081604, "l2_grads": 2.234375, "lr": 0.0003034074466683564, "uptime": 140528.8916076, "examples_seen": 76288000.0, "progress": 0.6616164755823557, "epoch": 59.54571105874566, "img/sec/core": 547.900589226069, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 39.01400283425333, "core_hours": 39.01400283425333} {"step": 74550, "l2_params": 342.2558350716975, "train/loss": 2.189504623413086, "l2_grads": 2.265625, "lr": 0.0003027038561212423, "uptime": 140623.562915776, "examples_seen": 76339200.0, "progress": 0.6620605134854312, "epoch": 59.585674623214615, "img/sec/core": 540.818554073538, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 39.04030041985778, "core_hours": 39.04030041985778} {"step": 74600, "l2_params": 342.25584648494316, "train/loss": 2.386276960372925, "l2_grads": 2.265625, "lr": 0.00030200072799576623, "uptime": 140716.89335493, "examples_seen": 76390400.0, "progress": 0.6625045513885065, "epoch": 59.62563818768357, "img/sec/core": 548.5884397856214, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 39.06622554184501, "core_hours": 39.06622554184501} {"step": 74650, "l2_params": 342.25584648494316, "train/loss": 4.301434636116028, "l2_grads": 2.0, "lr": 0.0003012980639399164, "uptime": 140810.54700348902, "examples_seen": 76441600.0, "progress": 0.662948589291582, "epoch": 59.66560175215253, "img/sec/core": 546.6951986151694, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 39.092240444222504, "core_hours": 39.092240444222504} {"step": 74700, "l2_params": 342.2675334487994, "train/loss": 3.1413604021072388, "l2_grads": 2.046875, "lr": 0.00030059586560059263, "uptime": 140903.909920847, "examples_seen": 76492800.0, "progress": 0.6633926271946573, "epoch": 59.70556531662149, "img/sec/core": 548.397602055161, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 39.118174587933055, "core_hours": 39.118174587933055} {"step": 74750, "l2_params": 342.2675163295153, "train/loss": 3.1437399983406067, "l2_grads": 2.078125, "lr": 0.0002998941346236038, "uptime": 140998.587430509, "examples_seen": 76544000.0, "progress": 0.6638366650977328, "epoch": 59.74552888109044, "img/sec/core": 540.7831298350206, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 39.1444738961725, "core_hours": 39.1444738961725} {"step": 74800, "l2_params": 342.26751062308705, "train/loss": 2.4556758403778076, "l2_grads": 2.078125, "lr": 0.00029919287265366324, "uptime": 141093.586448387, "examples_seen": 76595200.0, "progress": 0.6642807030008081, "epoch": 59.7854924455594, "img/sec/core": 538.9529401846322, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 39.17086251224973, "core_hours": 39.17086251224973} {"step": 74850, "l2_params": 342.2675134763012, "train/loss": 2.2464877367019653, "l2_grads": 2.265625, "lr": 0.00029849208133438473, "uptime": 141186.753621362, "examples_seen": 76646400.0, "progress": 0.6647247409038836, "epoch": 59.825456010028354, "img/sec/core": 549.5497863152073, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 39.19674228252055, "core_hours": 39.19674228252055} {"step": 74900, "l2_params": 342.2675705405787, "train/loss": 2.269317924976349, "l2_grads": 2.140625, "lr": 0.0002977917623082793, "uptime": 141280.06380886902, "examples_seen": 76697600.0, "progress": 0.665168778806959, "epoch": 59.86541957449732, "img/sec/core": 548.7075030917898, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 39.222661779050284, "core_hours": 39.222661779050284} {"step": 74950, "l2_params": 342.2675705405787, "train/loss": 2.2937192916870117, "l2_grads": 2.328125, "lr": 0.00029709191721675137, "uptime": 141375.179142765, "examples_seen": 76748800.0, "progress": 0.6656128167100344, "epoch": 59.90538313896627, "img/sec/core": 538.2938576022951, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 39.2490827051325, "core_hours": 39.2490827051325} {"step": 75000, "l2_params": 342.2675591277239, "train/loss": 2.23869389295578, "l2_grads": 2.375, "lr": 0.0002963925477000936, "uptime": 141468.49066807202, "examples_seen": 76800000.0, "progress": 0.6660568546131098, "epoch": 59.94534670343523, "img/sec/core": 548.6996363154682, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 39.27500257327334, "core_hours": 39.27500257327334, "val/acc@1": 0.6611128826530612, "val/loss": 1.401102740545662, "z/secs/eval/val": 31.771039348997874} {"step": 75050, "l2_params": 342.2675220359434, "train/loss": 2.3361615538597107, "l2_grads": 2.28125, "lr": 0.0002956936553974843, "uptime": 141593.53933045702, "examples_seen": 76851200.0, "progress": 0.6665008925161852, "epoch": 59.98531026790418, "img/sec/core": 409.4406051490973, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 39.30973831282473, "core_hours": 39.30973831282473} {"step": 75100, "l2_params": 342.2675591277239, "train/loss": 2.4064360857009888, "l2_grads": 2.140625, "lr": 0.0002949952419469839, "uptime": 141687.651920421, "examples_seen": 76902400.0, "progress": 0.6669449304192606, "epoch": 60.02527383237314, "img/sec/core": 544.0292315788923, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 39.335880698925834, "core_hours": 39.335880698925834} {"step": 75150, "l2_params": 342.26751918272936, "train/loss": 2.3423666954040527, "l2_grads": 2.140625, "lr": 0.00029429730898552993, "uptime": 141781.122942796, "examples_seen": 76953600.0, "progress": 0.667388968322336, "epoch": 60.0652373968421, "img/sec/core": 547.7633463190374, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 39.361844871807776, "core_hours": 39.361844871807776} {"step": 75200, "l2_params": 342.26751918272936, "train/loss": 4.852719664573669, "l2_grads": 2.15625, "lr": 0.00029359985814893393, "uptime": 141875.359733657, "examples_seen": 77004800.0, "progress": 0.6678330062254114, "epoch": 60.105200961311056, "img/sec/core": 543.3122194867472, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 39.38802175815806, "core_hours": 39.38802175815806} {"step": 75250, "l2_params": 342.2675220359434, "train/loss": 2.1482053995132446, "l2_grads": 2.078125, "lr": 0.0002929028910718774, "uptime": 141969.796774188, "examples_seen": 77056000.0, "progress": 0.6682770441284868, "epoch": 60.14516452578001, "img/sec/core": 542.1601493663802, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 39.414254269416666, "core_hours": 39.414254269416666} {"step": 75300, "l2_params": 342.2675220359434, "train/loss": 3.196113169193268, "l2_grads": 2.0, "lr": 0.0002922064093879079, "uptime": 142063.547952285, "examples_seen": 77107200.0, "progress": 0.6687210820315622, "epoch": 60.185128090248966, "img/sec/core": 546.1264705070782, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 39.4402962633325, "core_hours": 39.4402962633325} {"step": 75350, "l2_params": 342.2675220359434, "train/loss": 3.679912567138672, "l2_grads": 2.140625, "lr": 0.0002915104147294353, "uptime": 142158.35343262, "examples_seen": 77158400.0, "progress": 0.6691651199346377, "epoch": 60.22509165471793, "img/sec/core": 540.0531680139676, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 39.46663111898111, "core_hours": 39.46663111898111} {"step": 75400, "l2_params": 342.2675163295153, "train/loss": 3.655310332775116, "l2_grads": 1.90625, "lr": 0.0002908149087277285, "uptime": 142251.963165297, "examples_seen": 77209600.0, "progress": 0.669609157837713, "epoch": 60.265055219186884, "img/sec/core": 546.951674102816, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 39.4926338225025, "core_hours": 39.4926338225025} {"step": 75450, "l2_params": 342.26751062308705, "train/loss": 4.6786733865737915, "l2_grads": 2.171875, "lr": 0.000290119893012911, "uptime": 142345.954518145, "examples_seen": 77260800.0, "progress": 0.6700531957407885, "epoch": 60.30501878365584, "img/sec/core": 544.730961398051, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 39.51874253162694, "core_hours": 39.51874253162694} {"step": 75500, "l2_params": 342.2675163295153, "train/loss": 2.2126729488372803, "l2_grads": 2.1875, "lr": 0.00028942536921395634, "uptime": 142440.414192814, "examples_seen": 77312000.0, "progress": 0.6704972336438638, "epoch": 60.344982348124795, "img/sec/core": 542.0302386115106, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 39.544981330146115, "core_hours": 39.544981330146115} {"step": 75550, "l2_params": 342.2675163295153, "train/loss": 3.16576224565506, "l2_grads": 2.046875, "lr": 0.00028873133895868574, "uptime": 142534.8053442, "examples_seen": 77363200.0, "progress": 0.6709412715469393, "epoch": 60.38494591259375, "img/sec/core": 542.4237256162735, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 39.57120109442, "core_hours": 39.57120109442} {"step": 75600, "l2_params": 342.2675163295153, "train/loss": 2.1228834986686707, "l2_grads": 2.328125, "lr": 0.0002880378038737637, "uptime": 142629.603366585, "examples_seen": 77414400.0, "progress": 0.6713853094500146, "epoch": 60.42490947706271, "img/sec/core": 540.095655076578, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 39.59753387841583, "core_hours": 39.59753387841583} {"step": 75650, "l2_params": 342.2675163295153, "train/loss": 4.200791001319885, "l2_grads": 2.078125, "lr": 0.00028734476558469376, "uptime": 142723.022299411, "examples_seen": 77465600.0, "progress": 0.6718293473530901, "epoch": 60.46487304153167, "img/sec/core": 548.068774189125, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 39.62348358197861, "core_hours": 39.62348358197861} {"step": 75700, "l2_params": 342.2675163295153, "train/loss": 3.534627377986908, "l2_grads": 1.953125, "lr": 0.00028665222571581575, "uptime": 142817.455356277, "examples_seen": 77516800.0, "progress": 0.6722733852561654, "epoch": 60.50483660600062, "img/sec/core": 542.1830204295525, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 39.64971498666361, "core_hours": 39.64971498666361} {"step": 75750, "l2_params": 342.2675220359434, "train/loss": 2.1246074438095093, "l2_grads": 2.25, "lr": 0.0002859601858903004, "uptime": 142912.355260535, "examples_seen": 77568000.0, "progress": 0.6727174231592409, "epoch": 60.54480017046958, "img/sec/core": 539.5158235440043, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 39.67607607117972, "core_hours": 39.67607607117972} {"step": 75800, "l2_params": 342.26756198093767, "train/loss": 2.5311811566352844, "l2_grads": 2.140625, "lr": 0.0002852686477301473, "uptime": 143006.131488593, "examples_seen": 77619200.0, "progress": 0.6731614610623162, "epoch": 60.584763734938534, "img/sec/core": 545.9805865547252, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 39.702125023418056, "core_hours": 39.702125023418056} {"step": 75850, "l2_params": 342.26756198093767, "train/loss": 2.0161866545677185, "l2_grads": 2.234375, "lr": 0.0002845776128561796, "uptime": 143100.088442454, "examples_seen": 77670400.0, "progress": 0.6736054989653917, "epoch": 60.624727299407496, "img/sec/core": 544.9303952078801, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 39.72822417726833, "core_hours": 39.72822417726833} {"step": 75900, "l2_params": 342.26756198093767, "train/loss": 2.1948158740997314, "l2_grads": 2.328125, "lr": 0.00028388708288804135, "uptime": 143194.443910177, "examples_seen": 77721600.0, "progress": 0.6740495368684671, "epoch": 60.66469086387645, "img/sec/core": 542.6288612155585, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 39.75443402941361, "core_hours": 39.75443402941361} {"step": 75950, "l2_params": 342.26756198093767, "train/loss": 2.719475269317627, "l2_grads": 2.125, "lr": 0.0002831970594441926, "uptime": 143289.011510431, "examples_seen": 77772800.0, "progress": 0.6744935747715425, "epoch": 60.70465442834541, "img/sec/core": 541.4116448179105, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 39.780702807261946, "core_hours": 39.780702807261946} {"step": 76000, "l2_params": 342.2675591277239, "train/loss": 2.180921256542206, "l2_grads": 2.265625, "lr": 0.0002825075441419067, "uptime": 143382.995361184, "examples_seen": 77824000.0, "progress": 0.6749376126746179, "epoch": 60.74461799281436, "img/sec/core": 544.7744435856655, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 39.80680943247111, "core_hours": 39.80680943247111} {"step": 76050, "l2_params": 342.2675591277239, "train/loss": 2.3743796944618225, "l2_grads": 2.359375, "lr": 0.0002818185385972662, "uptime": 143477.61315921802, "examples_seen": 77875200.0, "progress": 0.6753816505776933, "epoch": 60.78458155728332, "img/sec/core": 541.1244085557134, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 39.83309215414723, "core_hours": 39.83309215414723} {"step": 76100, "l2_params": 342.26751062308705, "train/loss": 2.7294466495513916, "l2_grads": 2.1875, "lr": 0.0002811300444251584, "uptime": 143571.89361591102, "examples_seen": 77926400.0, "progress": 0.6758256884807687, "epoch": 60.82454512175228, "img/sec/core": 543.0605853630954, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 39.85928116989528, "core_hours": 39.85928116989528} {"step": 76150, "l2_params": 342.26751062308705, "train/loss": 2.9139404892921448, "l2_grads": 2.046875, "lr": 0.00028044206323927227, "uptime": 143665.768952075, "examples_seen": 77977600.0, "progress": 0.6762697263838441, "epoch": 60.864508686221235, "img/sec/core": 545.404172087918, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 39.88535765216306, "core_hours": 39.88535765216306} {"step": 76200, "l2_params": 342.2675562745102, "train/loss": 4.3322718143463135, "l2_grads": 1.9296875, "lr": 0.0002797545966520944, "uptime": 143760.027500509, "examples_seen": 78028800.0, "progress": 0.6767137642869195, "epoch": 60.90447225069019, "img/sec/core": 543.1868074635303, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 39.91154058228361, "core_hours": 39.91154058228361} {"step": 76250, "l2_params": 342.26751062308705, "train/loss": 2.407955229282379, "l2_grads": 2.34375, "lr": 0.000279067646274905, "uptime": 143854.38286596801, "examples_seen": 78080000.0, "progress": 0.6771578021899949, "epoch": 60.944435815159146, "img/sec/core": 542.6294493261879, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 39.937750406022225, "core_hours": 39.937750406022225} {"step": 76300, "l2_params": 342.26751062308705, "train/loss": 2.2430025935173035, "l2_grads": 2.25, "lr": 0.0002783812137177752, "uptime": 143948.233332214, "examples_seen": 78131200.0, "progress": 0.6776018400930703, "epoch": 60.9843993796281, "img/sec/core": 545.5487015461487, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 39.96381997997945, "core_hours": 39.96381997997945} {"step": 76350, "l2_params": 342.26755056808264, "train/loss": 4.390437483787537, "l2_grads": 1.8671875, "lr": 0.00027769530058956133, "uptime": 144042.82787051902, "examples_seen": 78182400.0, "progress": 0.6780458779961458, "epoch": 61.024362944097064, "img/sec/core": 541.257464938509, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 39.99009624061973, "core_hours": 39.99009624061973} {"step": 76400, "l2_params": 342.267544861655, "train/loss": 2.1810641288757324, "l2_grads": 2.1875, "lr": 0.0002770099084979035, "uptime": 144136.30230942, "examples_seen": 78233600.0, "progress": 0.6784899158992211, "epoch": 61.06432650856602, "img/sec/core": 547.743325362369, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 40.01606136253666, "core_hours": 40.01606136253666} {"step": 76450, "l2_params": 342.267544861655, "train/loss": 3.1604671478271484, "l2_grads": 2.0625, "lr": 0.0002763250390492193, "uptime": 144230.728946424, "examples_seen": 78284800.0, "progress": 0.6789339538022966, "epoch": 61.104290073034974, "img/sec/core": 542.2198822756335, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 40.04229098392667, "core_hours": 40.04229098392667} {"step": 76500, "l2_params": 342.26751062308705, "train/loss": 2.23871248960495, "l2_grads": 2.265625, "lr": 0.0002756406938487025, "uptime": 144324.380722341, "examples_seen": 78336000.0, "progress": 0.6793779917053719, "epoch": 61.14425363750393, "img/sec/core": 546.7061302219358, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 40.068305366125834, "core_hours": 40.068305366125834} {"step": 76550, "l2_params": 342.2674992102303, "train/loss": 4.583644866943359, "l2_grads": 2.125, "lr": 0.00027495687450031773, "uptime": 144418.66191262202, "examples_seen": 78387200.0, "progress": 0.6798220296084474, "epoch": 61.18421720197289, "img/sec/core": 543.0563598889423, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 40.09449458564834, "core_hours": 40.09449458564834} {"step": 76600, "l2_params": 342.2674992102303, "train/loss": 2.2658233642578125, "l2_grads": 2.328125, "lr": 0.00027427358260679696, "uptime": 144512.890545386, "examples_seen": 78438400.0, "progress": 0.6802660675115227, "epoch": 61.22418076644185, "img/sec/core": 543.3592582016869, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 40.12066920586055, "core_hours": 40.12066920586055} {"step": 76650, "l2_params": 342.2674992102303, "train/loss": 2.2519689798355103, "l2_grads": 2.265625, "lr": 0.00027359081976963606, "uptime": 144606.050701759, "examples_seen": 78489600.0, "progress": 0.6807101054145982, "epoch": 61.2641443309108, "img/sec/core": 549.591177101576, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 40.14654702707528, "core_hours": 40.14654702707528} {"step": 76700, "l2_params": 342.267544861655, "train/loss": 2.2093072533607483, "l2_grads": 2.203125, "lr": 0.00027290858758909065, "uptime": 144700.387813652, "examples_seen": 78540800.0, "progress": 0.6811541433176735, "epoch": 61.30410789537976, "img/sec/core": 542.7344442988257, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 40.17275178037889, "core_hours": 40.17275178037889} {"step": 76750, "l2_params": 342.267544861655, "train/loss": 2.9786601662635803, "l2_grads": 2.078125, "lr": 0.00027222688766417294, "uptime": 144794.861510722, "examples_seen": 78592000.0, "progress": 0.681598181220749, "epoch": 61.34407145984871, "img/sec/core": 541.9497869556407, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 40.19899447400944, "core_hours": 40.19899447400944} {"step": 76800, "l2_params": 342.26751062308705, "train/loss": 3.5501087307929993, "l2_grads": 2.046875, "lr": 0.00027154572159264815, "uptime": 144889.280820199, "examples_seen": 78643200.0, "progress": 0.6820422191238245, "epoch": 61.384035024317676, "img/sec/core": 542.2619619186171, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 40.22522205997528, "core_hours": 40.22522205997528} {"step": 76850, "l2_params": 342.2675562745102, "train/loss": 3.0318292379379272, "l2_grads": 2.125, "lr": 0.0002708650909710289, "uptime": 144983.47817804202, "examples_seen": 78694400.0, "progress": 0.6824862570268998, "epoch": 61.42399858878663, "img/sec/core": 543.5396615404594, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 40.25138799270945, "core_hours": 40.25138799270945} {"step": 76900, "l2_params": 342.26756768736504, "train/loss": 3.340505361557007, "l2_grads": 1.9921875, "lr": 0.0002701849973945738, "uptime": 145076.688246044, "examples_seen": 78745600.0, "progress": 0.6829302949299753, "epoch": 61.463962153255586, "img/sec/core": 549.2968849556546, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 40.27727967826556, "core_hours": 40.27727967826556} {"step": 76950, "l2_params": 342.2675562745102, "train/loss": 2.3067057132720947, "l2_grads": 2.375, "lr": 0.00026950544245728263, "uptime": 145171.015380445, "examples_seen": 78796800.0, "progress": 0.6833743328330506, "epoch": 61.50392571772454, "img/sec/core": 542.7918522611837, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 40.30348166004361, "core_hours": 40.30348166004361} {"step": 77001, "l2_params": 342.26756198093767, "train/loss": 2.353286564350128, "l2_grads": 2.140625, "lr": 0.0002688264277518926, "uptime": 145264.77057938802, "examples_seen": 78848000.0, "progress": 0.6838183707361261, "epoch": 61.5438892821935, "img/sec/core": 546.1030489745564, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 40.32952477086111, "core_hours": 40.32952477086111} {"step": 77050, "l2_params": 342.2675562745102, "train/loss": 2.1550782918930054, "l2_grads": 2.21875, "lr": 0.00026814795486987435, "uptime": 145359.449836824, "examples_seen": 78899200.0, "progress": 0.6842624086392014, "epoch": 61.58385284666246, "img/sec/core": 540.7731470075905, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 40.355824564593334, "core_hours": 40.355824564593334} {"step": 77100, "l2_params": 342.2675562745102, "train/loss": 2.105943977832794, "l2_grads": 2.234375, "lr": 0.0002674700254014294, "uptime": 145453.204741226, "examples_seen": 78950400.0, "progress": 0.6847064465422769, "epoch": 61.623816411131415, "img/sec/core": 546.1047646153962, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 40.381867593593896, "core_hours": 40.381867593593896} {"step": 77150, "l2_params": 342.2675562745102, "train/loss": 2.7126651406288147, "l2_grads": 2.296875, "lr": 0.0002667926409354846, "uptime": 145547.037014747, "examples_seen": 79001600.0, "progress": 0.6851504844453522, "epoch": 61.66377997560037, "img/sec/core": 545.6544755738443, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 40.40793211401639, "core_hours": 40.40793211401639} {"step": 77200, "l2_params": 342.26751062308705, "train/loss": 4.738367557525635, "l2_grads": 2.03125, "lr": 0.0002661158030596906, "uptime": 145641.798128828, "examples_seen": 79052800.0, "progress": 0.6855945223484277, "epoch": 61.703743540069325, "img/sec/core": 540.3060157802797, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 40.43425464570556, "core_hours": 40.43425464570556} {"step": 77250, "l2_params": 342.26751062308705, "train/loss": 4.692117094993591, "l2_grads": 2.140625, "lr": 0.0002654395133604163, "uptime": 145735.614760136, "examples_seen": 79104000.0, "progress": 0.6860385602515031, "epoch": 61.74370710453828, "img/sec/core": 545.7454535103735, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 40.46031482106889, "core_hours": 40.46031482106889} {"step": 77300, "l2_params": 342.2675562745102, "train/loss": 4.741680264472961, "l2_grads": 2.09375, "lr": 0.00026476377342274566, "uptime": 145829.65462886202, "examples_seen": 79155200.0, "progress": 0.6864825981545785, "epoch": 61.78367066900724, "img/sec/core": 544.449930583912, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 40.486437006826115, "core_hours": 40.486437006826115} {"step": 77350, "l2_params": 342.26756768736504, "train/loss": 2.2655996084213257, "l2_grads": 2.40625, "lr": 0.0002640885848304743, "uptime": 145923.524438379, "examples_seen": 79206400.0, "progress": 0.6869266360576539, "epoch": 61.8236342334762, "img/sec/core": 545.4362831185828, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 40.51251195391417, "core_hours": 40.51251195391417} {"step": 77400, "l2_params": 342.26755056808264, "train/loss": 2.3549392223358154, "l2_grads": 2.21875, "lr": 0.0002634139491661055, "uptime": 146018.214565361, "examples_seen": 79257600.0, "progress": 0.6873706739607293, "epoch": 61.863597797945154, "img/sec/core": 540.7110712792287, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 40.53881476696472, "core_hours": 40.53881476696472} {"step": 77450, "l2_params": 342.26755056808264, "train/loss": 2.668576657772064, "l2_grads": 2.1875, "lr": 0.0002627398680108469, "uptime": 146112.02486334, "examples_seen": 79308800.0, "progress": 0.6878147118638047, "epoch": 61.90356136241411, "img/sec/core": 545.7822979250136, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 40.56487318306999, "core_hours": 40.56487318306999} {"step": 77500, "l2_params": 342.2675562745102, "train/loss": 2.213330030441284, "l2_grads": 2.359375, "lr": 0.00026206634294460656, "uptime": 146205.64635735, "examples_seen": 79360000.0, "progress": 0.6882587497668801, "epoch": 61.94352492688307, "img/sec/core": 546.8829625227861, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 40.59087915362833, "core_hours": 40.59087915362833, "val/acc@1": 0.6631257971938775, "val/loss": 1.3786892863560696, "z/secs/eval/val": 31.814825279987417} {"step": 77550, "l2_params": 342.267544861655, "train/loss": 2.0822448432445526, "l2_grads": 2.296875, "lr": 0.0002613933755459883, "uptime": 146330.414801826, "examples_seen": 79411200.0, "progress": 0.6887027876699555, "epoch": 61.98348849135203, "img/sec/core": 410.36016931224145, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 40.625537054871664, "core_hours": 40.625537054871664} {"step": 77600, "l2_params": 342.26755056808264, "train/loss": 2.426100254058838, "l2_grads": 2.078125, "lr": 0.0002607209673922898, "uptime": 146425.185037542, "examples_seen": 79462400.0, "progress": 0.6891468255730309, "epoch": 62.02345205582098, "img/sec/core": 540.2540113273454, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 40.65186212034833, "core_hours": 40.65186212034833} {"step": 77650, "l2_params": 342.2675562745102, "train/loss": 2.3123170733451843, "l2_grads": 2.34375, "lr": 0.00026004912005949754, "uptime": 146518.367945421, "examples_seen": 79513600.0, "progress": 0.6895908634761063, "epoch": 62.06341562028994, "img/sec/core": 549.4569891130943, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 40.67774626142583, "core_hours": 40.67774626142583} {"step": 77700, "l2_params": 342.2675562745102, "train/loss": 2.240897536277771, "l2_grads": 2.15625, "lr": 0.0002593778351222838, "uptime": 146612.90495466, "examples_seen": 79564800.0, "progress": 0.6900349013791818, "epoch": 62.10337918475889, "img/sec/core": 541.5868389759269, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 40.704006541770006, "core_hours": 40.704006541770006} {"step": 77750, "l2_params": 342.26755056808264, "train/loss": 2.913766086101532, "l2_grads": 2.109375, "lr": 0.0002587071141540027, "uptime": 146707.132138129, "examples_seen": 79616000.0, "progress": 0.6904789392822571, "epoch": 62.143342749227855, "img/sec/core": 543.3676155336885, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 40.73018075940028, "core_hours": 40.73018075940028} {"step": 77800, "l2_params": 342.267544861655, "train/loss": 2.8728835582733154, "l2_grads": 2.15625, "lr": 0.0002580369587266861, "uptime": 146800.486885541, "examples_seen": 79667200.0, "progress": 0.6909229771853326, "epoch": 62.18330631369681, "img/sec/core": 548.4455951023158, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 40.75611263368139, "core_hours": 40.75611263368139} {"step": 77850, "l2_params": 342.2675391552272, "train/loss": 2.165088802576065, "l2_grads": 2.203125, "lr": 0.0002573673704110412, "uptime": 146896.574680856, "examples_seen": 79718400.0, "progress": 0.6913670150884079, "epoch": 62.223269878165766, "img/sec/core": 532.8460272416357, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 40.782803687935555, "core_hours": 40.782803687935555} {"step": 77900, "l2_params": 342.267544861655, "train/loss": 2.135894238948822, "l2_grads": 2.296875, "lr": 0.0002566983507764448, "uptime": 146989.85994817, "examples_seen": 79769600.0, "progress": 0.6918110529914834, "epoch": 62.26323344263472, "img/sec/core": 548.8540846183088, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 40.80871626218944, "core_hours": 40.80871626218944} {"step": 77950, "l2_params": 342.267544861655, "train/loss": 2.224395513534546, "l2_grads": 2.3125, "lr": 0.000256029901390942, "uptime": 147084.749211802, "examples_seen": 79820800.0, "progress": 0.6922550908945587, "epoch": 62.30319700710368, "img/sec/core": 539.5763233927005, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 40.83507439097611, "core_hours": 40.83507439097611} {"step": 78000, "l2_params": 342.267544861655, "train/loss": 2.0979813933372498, "l2_grads": 2.25, "lr": 0.00025536202382124047, "uptime": 147179.233234199, "examples_seen": 79872000.0, "progress": 0.6926991287976342, "epoch": 62.34316057157264, "img/sec/core": 541.890562034628, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 40.86131995275306, "core_hours": 40.86131995275306} {"step": 78050, "l2_params": 342.2675391552272, "train/loss": 2.2509230971336365, "l2_grads": 2.4375, "lr": 0.00025469471963270843, "uptime": 147274.044719904, "examples_seen": 79923200.0, "progress": 0.6931431667007095, "epoch": 62.383124136041594, "img/sec/core": 540.0189609865233, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 40.88765647656, "core_hours": 40.88765647656} {"step": 78100, "l2_params": 342.267544861655, "train/loss": 3.368812620639801, "l2_grads": 2.046875, "lr": 0.00025402799038936984, "uptime": 147367.503879809, "examples_seen": 79974400.0, "progress": 0.693587204603785, "epoch": 62.42308770051055, "img/sec/core": 547.8328721555184, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 40.91361735431139, "core_hours": 40.91361735431139} {"step": 78150, "l2_params": 342.2675391552272, "train/loss": 2.1146676540374756, "l2_grads": 2.3125, "lr": 0.00025336183765390063, "uptime": 147463.292702875, "examples_seen": 80025600.0, "progress": 0.6940312425068604, "epoch": 62.463051264979505, "img/sec/core": 534.5091249812425, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 40.940225360718614, "core_hours": 40.940225360718614} {"step": 78200, "l2_params": 342.2675334487994, "train/loss": 2.2594248056411743, "l2_grads": 2.3125, "lr": 0.00025269626298762685, "uptime": 147556.773726891, "examples_seen": 80076800.0, "progress": 0.6944752804099358, "epoch": 62.50301482944846, "img/sec/core": 547.7047404962578, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 40.96619231183417, "core_hours": 40.96619231183417} {"step": 78250, "l2_params": 342.2675391552272, "train/loss": 2.3768697381019592, "l2_grads": 2.078125, "lr": 0.00025203126795051806, "uptime": 147651.530710756, "examples_seen": 80128000.0, "progress": 0.6949193183130112, "epoch": 62.54297839391742, "img/sec/core": 540.3295663457122, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 40.992513696241105, "core_hours": 40.992513696241105} {"step": 78300, "l2_params": 342.26755056808264, "train/loss": 2.452639162540436, "l2_grads": 2.140625, "lr": 0.0002513668541011862, "uptime": 147745.878578024, "examples_seen": 80179200.0, "progress": 0.6953633562160866, "epoch": 62.58294195838638, "img/sec/core": 542.6725741934604, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 41.01872143714889, "core_hours": 41.01872143714889} {"step": 78350, "l2_params": 342.2675562745102, "train/loss": 2.1844500601291656, "l2_grads": 2.15625, "lr": 0.00025070302299688094, "uptime": 147840.473773094, "examples_seen": 80230400.0, "progress": 0.695807394119162, "epoch": 62.62290552285533, "img/sec/core": 541.2537070420351, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 41.044997880223896, "core_hours": 41.044997880223896} {"step": 78400, "l2_params": 342.2675562745102, "train/loss": 2.6999842524528503, "l2_grads": 2.09375, "lr": 0.0002500397761934863, "uptime": 147933.969883274, "examples_seen": 80281600.0, "progress": 0.6962514320222374, "epoch": 62.66286908732429, "img/sec/core": 547.6163650170798, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 41.07096902194055, "core_hours": 41.07096902194055} {"step": 78450, "l2_params": 342.2675562745102, "train/loss": 4.771874189376831, "l2_grads": 2.28125, "lr": 0.000249377115245516, "uptime": 148027.954755661, "examples_seen": 80332800.0, "progress": 0.6966954699253128, "epoch": 62.70283265179325, "img/sec/core": 544.7685217805857, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 41.097075930936946, "core_hours": 41.097075930936946} {"step": 78500, "l2_params": 342.2675391552272, "train/loss": 3.8767067790031433, "l2_grads": 1.921875, "lr": 0.00024871504170611154, "uptime": 148121.783890819, "examples_seen": 80384000.0, "progress": 0.6971395078283882, "epoch": 62.74279621626221, "img/sec/core": 545.672726427428, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 41.12313957959194, "core_hours": 41.12313957959194} {"step": 78550, "l2_params": 342.267544861655, "train/loss": 2.212772786617279, "l2_grads": 2.28125, "lr": 0.00024805355712703724, "uptime": 148215.58167324, "examples_seen": 80435200.0, "progress": 0.6975835457314636, "epoch": 62.78275978073116, "img/sec/core": 545.8551223545709, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 41.14919451915333, "core_hours": 41.14919451915333} {"step": 78600, "l2_params": 342.2675562745102, "train/loss": 3.964004874229431, "l2_grads": 1.9921875, "lr": 0.0002473926630586772, "uptime": 148309.516096698, "examples_seen": 80486400.0, "progress": 0.6980275836345391, "epoch": 62.82272334520012, "img/sec/core": 545.06109810627, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 41.17528741455833, "core_hours": 41.17528741455833} {"step": 78650, "l2_params": 342.26755056808264, "train/loss": 2.1444538235664368, "l2_grads": 2.359375, "lr": 0.00024673236105003123, "uptime": 148403.459796148, "examples_seen": 80537600.0, "progress": 0.6984716215376144, "epoch": 62.86268690966907, "img/sec/core": 545.0072788250241, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 41.20138288662778, "core_hours": 41.20138288662778} {"step": 78700, "l2_params": 342.2675733937923, "train/loss": 3.593628227710724, "l2_grads": 2.125, "lr": 0.00024607265264871167, "uptime": 148497.45822283102, "examples_seen": 80588800.0, "progress": 0.6989156594406899, "epoch": 62.902650474138035, "img/sec/core": 544.689967765726, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 41.22749356070639, "core_hours": 41.22749356070639} {"step": 78750, "l2_params": 342.26756768736504, "train/loss": 2.508605480194092, "l2_grads": 2.125, "lr": 0.00024541353940093954, "uptime": 148591.389282164, "examples_seen": 80640000.0, "progress": 0.6993596973437652, "epoch": 62.94261403860699, "img/sec/core": 545.0806193774889, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 41.25358552163222, "core_hours": 41.25358552163222} {"step": 78800, "l2_params": 342.26756198093767, "train/loss": 3.859917938709259, "l2_grads": 2.015625, "lr": 0.0002447550228515409, "uptime": 148685.324317461, "examples_seen": 80691200.0, "progress": 0.6998037352468407, "epoch": 62.982577603075946, "img/sec/core": 545.0575478905627, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 41.2796785869925, "core_hours": 41.2796785869925} {"step": 78850, "l2_params": 342.2675791002195, "train/loss": 2.1287894546985626, "l2_grads": 2.375, "lr": 0.00024409710454394347, "uptime": 148780.013924939, "examples_seen": 80742400.0, "progress": 0.700247773149916, "epoch": 63.0225411675449, "img/sec/core": 540.7140378302965, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 41.305981255736384, "core_hours": 41.305981255736384} {"step": 78900, "l2_params": 342.2675791002195, "train/loss": 4.030627489089966, "l2_grads": 1.9140625, "lr": 0.0002434397860201725, "uptime": 148875.087445906, "examples_seen": 80793600.0, "progress": 0.7006918110529915, "epoch": 63.062504732013856, "img/sec/core": 538.5305969447217, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 41.332390567116114, "core_hours": 41.332390567116114} {"step": 78950, "l2_params": 342.26758480664654, "train/loss": 2.4188196659088135, "l2_grads": 2.234375, "lr": 0.00024278306882084724, "uptime": 148968.312789262, "examples_seen": 80844800.0, "progress": 0.7011358489560668, "epoch": 63.10246829648282, "img/sec/core": 549.206880413241, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 41.35828649582611, "core_hours": 41.35828649582611} {"step": 79000, "l2_params": 342.2675733937923, "train/loss": 2.9855727553367615, "l2_grads": 2.125, "lr": 0.00024212695448517824, "uptime": 149064.081239287, "examples_seen": 80896000.0, "progress": 0.7015798868591423, "epoch": 63.142431860951774, "img/sec/core": 534.6228323276883, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 41.38488884305528, "core_hours": 41.38488884305528} {"step": 79050, "l2_params": 342.26758480664654, "train/loss": 2.237687647342682, "l2_grads": 2.234375, "lr": 0.00024147144455096304, "uptime": 149157.459335793, "examples_seen": 80947200.0, "progress": 0.7020239247622178, "epoch": 63.18239542542073, "img/sec/core": 548.3084568629046, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 41.410827203195836, "core_hours": 41.410827203195836} {"step": 79100, "l2_params": 342.2675791002195, "train/loss": 2.2004666328430176, "l2_grads": 2.265625, "lr": 0.0002408165405545818, "uptime": 149252.333770403, "examples_seen": 80998400.0, "progress": 0.7024679626652931, "epoch": 63.222358989889685, "img/sec/core": 539.6606600131626, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 41.43718121280972, "core_hours": 41.43718121280972} {"step": 79150, "l2_params": 342.2675733937923, "train/loss": 2.1286286413669586, "l2_grads": 2.40625, "lr": 0.00024016224403099526, "uptime": 149346.875412749, "examples_seen": 81049600.0, "progress": 0.7029120005683686, "epoch": 63.26232255435864, "img/sec/core": 541.5602979755066, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 41.463442780128055, "core_hours": 41.463442780128055} {"step": 79200, "l2_params": 342.2675791002195, "train/loss": 2.6925230026245117, "l2_grads": 2.0625, "lr": 0.00023950855651373991, "uptime": 149440.04445849, "examples_seen": 81100800.0, "progress": 0.7033560384714439, "epoch": 63.3022861188276, "img/sec/core": 549.5387399623078, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 41.48932307061167, "core_hours": 41.48932307061167} {"step": 79250, "l2_params": 342.2675791002195, "train/loss": 2.1854747533798218, "l2_grads": 2.25, "lr": 0.00023885547953492506, "uptime": 149534.878890952, "examples_seen": 81152000.0, "progress": 0.7038000763745194, "epoch": 63.34224968329656, "img/sec/core": 539.888294481196, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 41.51566596851778, "core_hours": 41.51566596851778} {"step": 79300, "l2_params": 342.26758480664654, "train/loss": 2.138046443462372, "l2_grads": 2.296875, "lr": 0.00023820301462522918, "uptime": 149629.007706443, "examples_seen": 81203200.0, "progress": 0.7042441142775947, "epoch": 63.38221324776551, "img/sec/core": 543.9354541214153, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 41.541812861709715, "core_hours": 41.541812861709715} {"step": 79350, "l2_params": 342.2675791002195, "train/loss": 2.5973334312438965, "l2_grads": 2.171875, "lr": 0.00023755116331389576, "uptime": 149722.32564481001, "examples_seen": 81254400.0, "progress": 0.7046881521806702, "epoch": 63.42217681223447, "img/sec/core": 548.6619281989429, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 41.56773451125612, "core_hours": 41.56773451125612} {"step": 79400, "l2_params": 342.2675791002195, "train/loss": 4.143317341804504, "l2_grads": 2.109375, "lr": 0.00023689992712873064, "uptime": 149816.922241917, "examples_seen": 81305600.0, "progress": 0.7051321900837455, "epoch": 63.46214037670343, "img/sec/core": 541.2456850017192, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 41.59401134378583, "core_hours": 41.59401134378583} {"step": 79450, "l2_params": 342.2675733937923, "train/loss": 2.2084586024284363, "l2_grads": 2.21875, "lr": 0.00023624930759609736, "uptime": 149910.219776029, "examples_seen": 81356800.0, "progress": 0.705576227986821, "epoch": 63.502103941172386, "img/sec/core": 548.7819210584327, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 41.61992732548361, "core_hours": 41.61992732548361} {"step": 79500, "l2_params": 342.2675733937923, "train/loss": 2.088246315717697, "l2_grads": 2.296875, "lr": 0.00023559930624091473, "uptime": 150005.448444063, "examples_seen": 81408000.0, "progress": 0.7060202658898964, "epoch": 63.54206750564134, "img/sec/core": 537.6532199497477, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 41.64637973327083, "core_hours": 41.64637973327083} {"step": 79550, "l2_params": 342.26756768736504, "train/loss": 2.2488420009613037, "l2_grads": 2.25, "lr": 0.00023494992458665244, "uptime": 150100.362441173, "examples_seen": 81459200.0, "progress": 0.7064643037929718, "epoch": 63.5820310701103, "img/sec/core": 539.4357161110546, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 41.672744732468054, "core_hours": 41.672744732468054} {"step": 79600, "l2_params": 342.26756768736504, "train/loss": 4.708610653877258, "l2_grads": 2.1875, "lr": 0.00023430116415532753, "uptime": 150193.686914644, "examples_seen": 81510400.0, "progress": 0.7069083416960472, "epoch": 63.62199463457925, "img/sec/core": 548.623507808043, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 41.69866819732111, "core_hours": 41.69866819732111} {"step": 79650, "l2_params": 342.26756768736504, "train/loss": 2.39142906665802, "l2_grads": 2.203125, "lr": 0.00023365302646750138, "uptime": 150289.05039177, "examples_seen": 81561600.0, "progress": 0.7073523795991226, "epoch": 63.661958199048215, "img/sec/core": 536.8931748614118, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 41.72515805207833, "core_hours": 41.72515805207833} {"step": 79700, "l2_params": 342.26756768736504, "train/loss": 4.697648048400879, "l2_grads": 2.171875, "lr": 0.0002330055130422755, "uptime": 150384.033890585, "examples_seen": 81612800.0, "progress": 0.707796417502198, "epoch": 63.70192176351717, "img/sec/core": 539.0409980550086, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 41.75154235730472, "core_hours": 41.75154235730472} {"step": 79750, "l2_params": 342.2675733937923, "train/loss": 4.005726456642151, "l2_grads": 2.046875, "lr": 0.00023235862539728848, "uptime": 150477.927401862, "examples_seen": 81664000.0, "progress": 0.7082404554052734, "epoch": 63.741885327986125, "img/sec/core": 545.2985973542033, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 41.777623888215, "core_hours": 41.777623888215} {"step": 79800, "l2_params": 342.2675733937923, "train/loss": 2.3063939213752747, "l2_grads": 2.25, "lr": 0.00023171236504871163, "uptime": 150571.438897771, "examples_seen": 81715200.0, "progress": 0.7086844933083488, "epoch": 63.78184889245508, "img/sec/core": 547.5262640415634, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 41.80359930374528, "core_hours": 41.80359930374528} {"step": 79850, "l2_params": 342.2675733937923, "train/loss": 2.358965218067169, "l2_grads": 2.21875, "lr": 0.0002310667335112469, "uptime": 150665.86011198, "examples_seen": 81766400.0, "progress": 0.7091285312114242, "epoch": 63.821812456924036, "img/sec/core": 542.2510230240367, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 41.82982741880333, "core_hours": 41.82982741880333} {"step": 79900, "l2_params": 342.2675733937923, "train/loss": 2.1219030022621155, "l2_grads": 2.1875, "lr": 0.0002304217322981221, "uptime": 150760.95032532502, "examples_seen": 81817600.0, "progress": 0.7095725691144996, "epoch": 63.861776021393, "img/sec/core": 538.4360619134565, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 41.85624136695473, "core_hours": 41.85624136695473} {"step": 79950, "l2_params": 342.26756768736504, "train/loss": 2.4114148020744324, "l2_grads": 2.234375, "lr": 0.00022977736292108738, "uptime": 150854.890697905, "examples_seen": 81868800.0, "progress": 0.7100166070175751, "epoch": 63.901739585861954, "img/sec/core": 545.0265800936834, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 41.88233591489361, "core_hours": 41.88233591489361} {"step": 80000, "l2_params": 342.267544861655, "train/loss": 4.598052382469177, "l2_grads": 2.109375, "lr": 0.0002291336268904125, "uptime": 150949.824191417, "examples_seen": 81920000.0, "progress": 0.7104606449206504, "epoch": 63.94170315033091, "img/sec/core": 539.3249327070921, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 41.908706329758054, "core_hours": 41.908706329758054, "val/acc@1": 0.6635841836734694, "val/loss": 1.3872923321869908, "z/secs/eval/val": 31.670321626996156} {"step": 80050, "l2_params": 342.2675733937923, "train/loss": 2.2485393285751343, "l2_grads": 2.28125, "lr": 0.00022849052571488222, "uptime": 151074.693259722, "examples_seen": 81971200.0, "progress": 0.7109046828237259, "epoch": 63.981666714799864, "img/sec/core": 410.02948684567485, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 41.943392182065004, "core_hours": 41.943392182065004} {"step": 80100, "l2_params": 342.26755056808264, "train/loss": 2.2866976857185364, "l2_grads": 2.28125, "lr": 0.00022784806090179338, "uptime": 151167.997733671, "examples_seen": 82022400.0, "progress": 0.7113487207268012, "epoch": 64.02163027926882, "img/sec/core": 548.7411035399867, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 41.96931009149528, "core_hours": 41.96931009149528} {"step": 80150, "l2_params": 342.26755056808264, "train/loss": 3.171656906604767, "l2_grads": 2.0625, "lr": 0.0002272062339569521, "uptime": 151262.883576951, "examples_seen": 82073600.0, "progress": 0.7117927586298767, "epoch": 64.06159384373778, "img/sec/core": 539.5957735120354, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 41.995667270184164, "core_hours": 41.995667270184164} {"step": 80200, "l2_params": 342.26755056808264, "train/loss": 3.5790520310401917, "l2_grads": 1.875, "lr": 0.0002265650463846686, "uptime": 151356.677215751, "examples_seen": 82124800.0, "progress": 0.712236796532952, "epoch": 64.10155740820673, "img/sec/core": 545.8792371748257, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 42.021721058739715, "core_hours": 42.021721058739715} {"step": 80250, "l2_params": 342.26755056808264, "train/loss": 2.207738995552063, "l2_grads": 2.28125, "lr": 0.00022592449968775468, "uptime": 151450.982112676, "examples_seen": 82176000.0, "progress": 0.7126808344360275, "epoch": 64.14152097267569, "img/sec/core": 542.9198447745748, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 42.0479168634411, "core_hours": 42.0479168634411} {"step": 80300, "l2_params": 342.26755056808264, "train/loss": 3.442346453666687, "l2_grads": 1.96875, "lr": 0.0002252845953675204, "uptime": 151545.211506146, "examples_seen": 82227200.0, "progress": 0.7131248723391028, "epoch": 64.18148453714466, "img/sec/core": 543.3548717077668, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 42.07409169496056, "core_hours": 42.07409169496056} {"step": 80350, "l2_params": 342.26755056808264, "train/loss": 2.175775170326233, "l2_grads": 2.25, "lr": 0.0002246453349237701, "uptime": 151639.86838139, "examples_seen": 82278400.0, "progress": 0.7135689102421783, "epoch": 64.2214481016136, "img/sec/core": 540.9010160965506, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 42.10038527141722, "core_hours": 42.10038527141722} {"step": 80400, "l2_params": 342.26755056808264, "train/loss": 2.235028088092804, "l2_grads": 2.25, "lr": 0.00022400671985479918, "uptime": 151734.681180974, "examples_seen": 82329600.0, "progress": 0.7140129481452537, "epoch": 64.26141166608257, "img/sec/core": 540.0114776131763, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 42.12672216019055, "core_hours": 42.12672216019055} {"step": 80450, "l2_params": 342.26755056808264, "train/loss": 2.2095197439193726, "l2_grads": 2.375, "lr": 0.0002233687516573901, "uptime": 151829.339162999, "examples_seen": 82380800.0, "progress": 0.7144569860483291, "epoch": 64.30137523055151, "img/sec/core": 540.8946916539508, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 42.15301604408639, "core_hours": 42.15301604408639} {"step": 80500, "l2_params": 342.26755056808264, "train/loss": 2.151654601097107, "l2_grads": 2.234375, "lr": 0.00022273143182680884, "uptime": 151923.854449766, "examples_seen": 82432000.0, "progress": 0.7149010239514045, "epoch": 64.34133879502048, "img/sec/core": 541.711312014832, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 42.17927029041055, "core_hours": 42.17927029041055} {"step": 80550, "l2_params": 342.2675733937923, "train/loss": 2.149315357208252, "l2_grads": 2.203125, "lr": 0.00022209476185680246, "uptime": 152017.114660816, "examples_seen": 82483200.0, "progress": 0.7153450618544799, "epoch": 64.38130235948944, "img/sec/core": 549.0015454987694, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 42.20517590459111, "core_hours": 42.20517590459111} {"step": 80600, "l2_params": 342.26756768736504, "train/loss": 2.115815371274948, "l2_grads": 2.25, "lr": 0.00022145874323959466, "uptime": 152111.839247387, "examples_seen": 82534400.0, "progress": 0.7157890997575553, "epoch": 64.42126592395839, "img/sec/core": 540.514367530459, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 42.23148828974971, "core_hours": 42.23148828974971} {"step": 80650, "l2_params": 342.26756768736504, "train/loss": 3.106166958808899, "l2_grads": 2.09375, "lr": 0.00022082337746588262, "uptime": 152206.601760828, "examples_seen": 82585600.0, "progress": 0.7162331376606307, "epoch": 64.46122948842735, "img/sec/core": 540.2980370700607, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 42.257811210149995, "core_hours": 42.257811210149995} {"step": 80700, "l2_params": 342.2675733937923, "train/loss": 4.019327402114868, "l2_grads": 1.9453125, "lr": 0.00022018866602483293, "uptime": 152300.996915602, "examples_seen": 82636800.0, "progress": 0.7166771755637061, "epoch": 64.5011930528963, "img/sec/core": 542.4007209117328, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 42.28403208647612, "core_hours": 42.28403208647612} {"step": 80750, "l2_params": 342.2675733937923, "train/loss": 2.274304211139679, "l2_grads": 2.28125, "lr": 0.00021955461040407874, "uptime": 152395.417876654, "examples_seen": 82688000.0, "progress": 0.7171212134667815, "epoch": 64.54115661736526, "img/sec/core": 542.2524768816992, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 42.31026013121278, "core_hours": 42.31026013121278} {"step": 80800, "l2_params": 342.26755056808264, "train/loss": 3.1831071376800537, "l2_grads": 2.03125, "lr": 0.0002189212120897165, "uptime": 152488.935301955, "examples_seen": 82739200.0, "progress": 0.7175652513698569, "epoch": 64.58112018183422, "img/sec/core": 547.491548609369, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 42.336237193796386, "core_hours": 42.336237193796386} {"step": 80850, "l2_params": 342.26755056808264, "train/loss": 2.284864902496338, "l2_grads": 2.421875, "lr": 0.0002182884725663018, "uptime": 152583.511382028, "examples_seen": 82790400.0, "progress": 0.7180092892729323, "epoch": 64.62108374630317, "img/sec/core": 541.3631011190694, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 42.362508327149996, "core_hours": 42.362508327149996} {"step": 80900, "l2_params": 342.26755056808264, "train/loss": 3.8321107029914856, "l2_grads": 1.9921875, "lr": 0.00021765639331684593, "uptime": 152677.786767508, "examples_seen": 82841600.0, "progress": 0.7184533271760077, "epoch": 64.66104731077213, "img/sec/core": 543.0897973985384, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 42.388695934227776, "core_hours": 42.388695934227776} {"step": 80950, "l2_params": 342.26755056808264, "train/loss": 2.17686265707016, "l2_grads": 2.390625, "lr": 0.00021702497582281287, "uptime": 152771.75662507, "examples_seen": 82892800.0, "progress": 0.7188973650790832, "epoch": 64.7010108752411, "img/sec/core": 544.8555667567312, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 42.414798672439446, "core_hours": 42.414798672439446} {"step": 81000, "l2_params": 342.26755056808264, "train/loss": 4.202906250953674, "l2_grads": 2.03125, "lr": 0.00021639422156411538, "uptime": 152866.53547193902, "examples_seen": 82944000.0, "progress": 0.7193414029821585, "epoch": 64.74097443971004, "img/sec/core": 540.2049264300523, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 42.44112612990306, "core_hours": 42.44112612990306} {"step": 81050, "l2_params": 342.26755056808264, "train/loss": 2.0917388200759888, "l2_grads": 2.234375, "lr": 0.00021576413201911205, "uptime": 152961.021039248, "examples_seen": 82995200.0, "progress": 0.719785440885234, "epoch": 64.780938004179, "img/sec/core": 541.8817017054381, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 42.467372120822226, "core_hours": 42.467372120822226} {"step": 81100, "l2_params": 342.26755056808264, "train/loss": 3.9998128414154053, "l2_grads": 2.109375, "lr": 0.00021513470866460363, "uptime": 153055.18039474, "examples_seen": 83046400.0, "progress": 0.7202294787883093, "epoch": 64.82090156864795, "img/sec/core": 543.7590320418022, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 42.49352749734778, "core_hours": 42.49352749734778} {"step": 81150, "l2_params": 342.26755056808264, "train/loss": 2.1779565513134003, "l2_grads": 2.34375, "lr": 0.00021450595297582866, "uptime": 153149.483921815, "examples_seen": 83097600.0, "progress": 0.7206735166913848, "epoch": 64.86086513311692, "img/sec/core": 542.9277312106701, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 42.519722921535276, "core_hours": 42.519722921535276} {"step": 81200, "l2_params": 342.26755056808264, "train/loss": 2.3441113233566284, "l2_grads": 2.296875, "lr": 0.0002138778664264616, "uptime": 153243.729974931, "examples_seen": 83148800.0, "progress": 0.7211175545944601, "epoch": 64.90082869758588, "img/sec/core": 543.2588241863897, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 42.54590238073417, "core_hours": 42.54590238073417} {"step": 81250, "l2_params": 342.26755056808264, "train/loss": 4.569891333580017, "l2_grads": 2.078125, "lr": 0.00021325045048860853, "uptime": 153338.55124839, "examples_seen": 83200000.0, "progress": 0.7215615924975356, "epoch": 64.94079226205483, "img/sec/core": 539.9632185085102, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 42.57224162336167, "core_hours": 42.57224162336167} {"step": 81300, "l2_params": 342.267544861655, "train/loss": 2.2059894800186157, "l2_grads": 2.09375, "lr": 0.0002126237066328029, "uptime": 153431.773566641, "examples_seen": 83251200.0, "progress": 0.7220056304006109, "epoch": 64.98075582652379, "img/sec/core": 549.2247024166602, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 42.598136711764724, "core_hours": 42.598136711764724} {"step": 81350, "l2_params": 342.2675733937923, "train/loss": 4.700339078903198, "l2_grads": 2.0, "lr": 0.00021199763632800432, "uptime": 153525.971229782, "examples_seen": 83302400.0, "progress": 0.7224496683036864, "epoch": 65.02071939099274, "img/sec/core": 543.537899909017, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 42.624302729303885, "core_hours": 42.624302729303885} {"step": 81400, "l2_params": 342.267544861655, "train/loss": 2.2515077590942383, "l2_grads": 2.25, "lr": 0.00021137224104159243, "uptime": 153621.054752875, "examples_seen": 83353600.0, "progress": 0.7228937062067619, "epoch": 65.0606829554617, "img/sec/core": 538.4739472676515, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 42.65071481905194, "core_hours": 42.65071481905194} {"step": 81450, "l2_params": 342.267544861655, "train/loss": 4.063801050186157, "l2_grads": 1.96875, "lr": 0.00021074752223936564, "uptime": 153715.581734145, "examples_seen": 83404800.0, "progress": 0.7233377441098372, "epoch": 65.10064651993066, "img/sec/core": 541.6442936409512, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 42.67697231384917, "core_hours": 42.67697231384917} {"step": 81500, "l2_params": 342.267544861655, "train/loss": 4.635900974273682, "l2_grads": 2.140625, "lr": 0.0002101234813855365, "uptime": 153809.212633764, "examples_seen": 83456000.0, "progress": 0.7237817820129127, "epoch": 65.14061008439961, "img/sec/core": 546.8280258797729, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 42.702980897076664, "core_hours": 42.702980897076664} {"step": 81550, "l2_params": 342.267544861655, "train/loss": 4.0177406668663025, "l2_grads": 1.9921875, "lr": 0.0002095001199427287, "uptime": 153903.715868627, "examples_seen": 83507200.0, "progress": 0.724225819915988, "epoch": 65.18057364886857, "img/sec/core": 541.7803959220386, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 42.729231795649724, "core_hours": 42.729231795649724} {"step": 81600, "l2_params": 342.267544861655, "train/loss": 2.4838082790374756, "l2_grads": 2.125, "lr": 0.00020887743937197297, "uptime": 153997.390697045, "examples_seen": 83558400.0, "progress": 0.7246698578190635, "epoch": 65.22053721333752, "img/sec/core": 546.5715909459193, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 42.755252581321386, "core_hours": 42.755252581321386} {"step": 81650, "l2_params": 342.267544861655, "train/loss": 2.208098351955414, "l2_grads": 2.28125, "lr": 0.0002082554411327049, "uptime": 154091.09464679201, "examples_seen": 83609600.0, "progress": 0.7251138957221388, "epoch": 65.26050077780648, "img/sec/core": 546.4017273362111, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 42.781281456251115, "core_hours": 42.781281456251115} {"step": 81700, "l2_params": 342.26755056808264, "train/loss": 4.0776753425598145, "l2_grads": 2.125, "lr": 0.0002076341266827607, "uptime": 154184.853942331, "examples_seen": 83660800.0, "progress": 0.7255579336252143, "epoch": 65.30046434227545, "img/sec/core": 546.0791882624948, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 42.80732570501195, "core_hours": 42.80732570501195} {"step": 81750, "l2_params": 342.26755056808264, "train/loss": 2.2366947531700134, "l2_grads": 2.296875, "lr": 0.00020701349747837415, "uptime": 154278.645295331, "examples_seen": 83712000.0, "progress": 0.7260019715282896, "epoch": 65.3404279067444, "img/sec/core": 545.89254086154, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 42.83337885862306, "core_hours": 42.83337885862306} {"step": 81800, "l2_params": 342.26755056808264, "train/loss": 2.6456207633018494, "l2_grads": 2.171875, "lr": 0.00020639355497417228, "uptime": 154372.331110413, "examples_seen": 83763200.0, "progress": 0.7264460094313651, "epoch": 65.38039147121336, "img/sec/core": 546.507493745729, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 42.859402696145835, "core_hours": 42.859402696145835} {"step": 81850, "l2_params": 342.26755056808264, "train/loss": 2.112944185733795, "l2_grads": 2.1875, "lr": 0.00020577430062317247, "uptime": 154466.665503433, "examples_seen": 83814400.0, "progress": 0.7268900473344405, "epoch": 65.4203550356823, "img/sec/core": 542.7500868018466, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 42.88560669420694, "core_hours": 42.88560669420694} {"step": 81900, "l2_params": 342.26755056808264, "train/loss": 2.23597913980484, "l2_grads": 2.296875, "lr": 0.0002051557358767805, "uptime": 154560.963534235, "examples_seen": 83865600.0, "progress": 0.7273340852375159, "epoch": 65.46031860015127, "img/sec/core": 542.9593764000342, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 42.91180059165195, "core_hours": 42.91180059165195} {"step": 81950, "l2_params": 342.26755056808264, "train/loss": 2.2336851358413696, "l2_grads": 2.453125, "lr": 0.00020453786218478493, "uptime": 154655.115117215, "examples_seen": 83916800.0, "progress": 0.7277781231405913, "epoch": 65.50028216462023, "img/sec/core": 543.8039210755869, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 42.937953809146386, "core_hours": 42.937953809146386} {"step": 82000, "l2_params": 342.26756768736504, "train/loss": 2.585016965866089, "l2_grads": 2.34375, "lr": 0.00020392068099535452, "uptime": 154749.333288393, "examples_seen": 83968000.0, "progress": 0.7282221610436667, "epoch": 65.54024572908918, "img/sec/core": 543.4195905083287, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 42.964125523362505, "core_hours": 42.964125523362505} {"step": 82050, "l2_params": 342.26756768736504, "train/loss": 2.212730288505554, "l2_grads": 2.40625, "lr": 0.00020330419375503563, "uptime": 154844.19501145, "examples_seen": 84019200.0, "progress": 0.7286661989467421, "epoch": 65.58020929355814, "img/sec/core": 539.7329750086687, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 42.99047600198945, "core_hours": 42.99047600198945} {"step": 82100, "l2_params": 342.26756768736504, "train/loss": 2.9255621433258057, "l2_grads": 2.09375, "lr": 0.00020268840190874727, "uptime": 154938.378016835, "examples_seen": 84070400.0, "progress": 0.7291102368498175, "epoch": 65.62017285802709, "img/sec/core": 543.622491029181, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 43.016637947929716, "core_hours": 43.016637947929716} {"step": 82150, "l2_params": 342.2675733937923, "train/loss": 3.917062819004059, "l2_grads": 1.9296875, "lr": 0.00020207330689977934, "uptime": 155031.761039707, "examples_seen": 84121600.0, "progress": 0.7295542747528929, "epoch": 65.66013642249605, "img/sec/core": 548.27953117536, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 43.042577676505275, "core_hours": 43.042577676505275} {"step": 82200, "l2_params": 342.2675733937923, "train/loss": 2.1402339935302734, "l2_grads": 2.28125, "lr": 0.00020145891016978826, "uptime": 155126.628456943, "examples_seen": 84172800.0, "progress": 0.7299983126559683, "epoch": 65.70009998696501, "img/sec/core": 539.7005788892551, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 43.06892973684861, "core_hours": 43.06892973684861} {"step": 82250, "l2_params": 342.2675733937923, "train/loss": 2.1785252690315247, "l2_grads": 2.3125, "lr": 0.00020084521315879346, "uptime": 155220.64757159402, "examples_seen": 84224000.0, "progress": 0.7304423505590437, "epoch": 65.74006355143396, "img/sec/core": 544.5701141735354, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 43.095046157585, "core_hours": 43.095046157585} {"step": 82300, "l2_params": 342.26756198093767, "train/loss": 2.1591707468032837, "l2_grads": 2.328125, "lr": 0.00020023221730517497, "uptime": 155314.92527391, "examples_seen": 84275200.0, "progress": 0.7308863884621192, "epoch": 65.78002711590293, "img/sec/core": 543.0764511888805, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 43.12123440822833, "core_hours": 43.12123440822833} {"step": 82350, "l2_params": 342.26755056808264, "train/loss": 2.407184362411499, "l2_grads": 2.296875, "lr": 0.00019961992404566892, "uptime": 155408.813149835, "examples_seen": 84326400.0, "progress": 0.7313304263651945, "epoch": 65.81999068037187, "img/sec/core": 545.3313273471847, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 43.14731437376306, "core_hours": 43.14731437376306} {"step": 82400, "l2_params": 342.26756768736504, "train/loss": 1.9740053415298462, "l2_grads": 2.140625, "lr": 0.0001990083348153652, "uptime": 155503.215479812, "examples_seen": 84377600.0, "progress": 0.73177446426827, "epoch": 65.85995424484084, "img/sec/core": 542.3594948607664, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 43.17353724320112, "core_hours": 43.17353724320112} {"step": 82450, "l2_params": 342.2675562745102, "train/loss": 4.199591279029846, "l2_grads": 2.046875, "lr": 0.00019839745104770332, "uptime": 155597.139414209, "examples_seen": 84428800.0, "progress": 0.7322185021713453, "epoch": 65.8999178093098, "img/sec/core": 545.1219684174262, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 43.19962722497805, "core_hours": 43.19962722497805} {"step": 82500, "l2_params": 342.26756768736504, "train/loss": 2.485893130302429, "l2_grads": 2.265625, "lr": 0.00019778727417446907, "uptime": 155691.295680285, "examples_seen": 84480000.0, "progress": 0.7326625400744208, "epoch": 65.93988137377875, "img/sec/core": 543.7768736355305, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 43.2257817433325, "core_hours": 43.2257817433325, "val/acc@1": 0.6636240433673469, "val/loss": 1.3784448574392163, "z/secs/eval/val": 31.718936628021766} {"step": 82550, "l2_params": 342.26755056808264, "train/loss": 3.858237326145172, "l2_grads": 1.9296875, "lr": 0.00019717780562579216, "uptime": 155815.859209129, "examples_seen": 84531200.0, "progress": 0.7331065779774961, "epoch": 65.97984493824771, "img/sec/core": 411.0352402115827, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 43.26038272356695, "core_hours": 43.26038272356695} {"step": 82600, "l2_params": 342.26756198093767, "train/loss": 4.652127623558044, "l2_grads": 2.21875, "lr": 0.00019656904683014117, "uptime": 155909.051213094, "examples_seen": 84582400.0, "progress": 0.7335506158805716, "epoch": 66.01980850271666, "img/sec/core": 549.4033588893465, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 43.286269391335004, "core_hours": 43.286269391335004} {"step": 82650, "l2_params": 342.26756768736504, "train/loss": 2.211924374103546, "l2_grads": 2.359375, "lr": 0.00019596099921432227, "uptime": 156003.06791799, "examples_seen": 84633600.0, "progress": 0.7339946537836469, "epoch": 66.05977206718562, "img/sec/core": 544.5840721245988, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 43.312385142695, "core_hours": 43.312385142695} {"step": 82700, "l2_params": 342.26756768736504, "train/loss": 2.0799463391304016, "l2_grads": 2.234375, "lr": 0.00019535366420347355, "uptime": 156097.412021312, "examples_seen": 84684800.0, "progress": 0.7344386916867224, "epoch": 66.09973563165458, "img/sec/core": 542.6942246221795, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 43.33859183806222, "core_hours": 43.33859183806222} {"step": 82750, "l2_params": 342.26756768736504, "train/loss": 3.294049084186554, "l2_grads": 1.9140625, "lr": 0.00019474704322106393, "uptime": 156191.200878393, "examples_seen": 84736000.0, "progress": 0.7348827295897978, "epoch": 66.13969919612353, "img/sec/core": 545.9070682115255, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 43.36464429836249, "core_hours": 43.36464429836249} {"step": 82800, "l2_params": 342.26756768736504, "train/loss": 2.7113521695137024, "l2_grads": 2.3125, "lr": 0.00019414113768888858, "uptime": 156285.907210362, "examples_seen": 84787200.0, "progress": 0.7353267674928732, "epoch": 66.17966276059249, "img/sec/core": 540.6185514264869, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 43.39095161279833, "core_hours": 43.39095161279833} {"step": 82850, "l2_params": 342.26756768736504, "train/loss": 2.1604619324207306, "l2_grads": 2.359375, "lr": 0.00019353594902706518, "uptime": 156379.140858486, "examples_seen": 84838400.0, "progress": 0.7357708053959486, "epoch": 66.21962632506145, "img/sec/core": 549.1579599234542, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 43.41684984838833, "core_hours": 43.41684984838833} {"step": 82900, "l2_params": 342.2675733937923, "train/loss": 4.286426663398743, "l2_grads": 2.046875, "lr": 0.00019293147865403202, "uptime": 156474.599602636, "examples_seen": 84889600.0, "progress": 0.736214843299024, "epoch": 66.2595898895304, "img/sec/core": 536.3573599873057, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 43.443366166207774, "core_hours": 43.443366166207774} {"step": 82950, "l2_params": 342.26756768736504, "train/loss": 4.205936431884766, "l2_grads": 1.9296875, "lr": 0.00019232772798654312, "uptime": 156567.865660833, "examples_seen": 84940800.0, "progress": 0.7366588812020994, "epoch": 66.29955345399937, "img/sec/core": 548.9671268390348, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 43.46927340459583, "core_hours": 43.46927340459583} {"step": 83000, "l2_params": 342.26756768736504, "train/loss": 3.1124156713485718, "l2_grads": 2.171875, "lr": 0.00019172469843966626, "uptime": 156662.35063697302, "examples_seen": 84992000.0, "progress": 0.7371029191051748, "epoch": 66.33951701846831, "img/sec/core": 541.8850921242997, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 43.495519231301394, "core_hours": 43.495519231301394} {"step": 83050, "l2_params": 342.26756768736504, "train/loss": 2.6834296584129333, "l2_grads": 2.015625, "lr": 0.00019112239142677901, "uptime": 156757.200218855, "examples_seen": 85043200.0, "progress": 0.7375469570082502, "epoch": 66.37948058293728, "img/sec/core": 539.8020632680052, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 43.52186633737972, "core_hours": 43.52186633737972} {"step": 83100, "l2_params": 342.26756198093767, "train/loss": 2.1807459592819214, "l2_grads": 2.40625, "lr": 0.00019052080835956506, "uptime": 156850.549020776, "examples_seen": 85094400.0, "progress": 0.7379909949113256, "epoch": 66.41944414740624, "img/sec/core": 548.4805262238611, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 43.54779656013556, "core_hours": 43.54779656013556} {"step": 83150, "l2_params": 342.26756198093767, "train/loss": 3.793718695640564, "l2_grads": 1.9609375, "lr": 0.00018991995064801176, "uptime": 156945.161330814, "examples_seen": 85145600.0, "progress": 0.738435032814401, "epoch": 66.45940771187519, "img/sec/core": 541.1557965283018, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 43.57407775736833, "core_hours": 43.57407775736833} {"step": 83200, "l2_params": 342.2675562745102, "train/loss": 3.37976211309433, "l2_grads": 1.9765625, "lr": 0.00018931981970040583, "uptime": 157039.873564739, "examples_seen": 85196800.0, "progress": 0.7388790707174765, "epoch": 66.49937127634415, "img/sec/core": 540.5848629918383, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 43.600386711236396, "core_hours": 43.600386711236396} {"step": 83250, "l2_params": 342.26756768736504, "train/loss": 4.685526728630066, "l2_grads": 2.078125, "lr": 0.00018872041692333095, "uptime": 157134.755259788, "examples_seen": 85248000.0, "progress": 0.7393231086205518, "epoch": 66.5393348408131, "img/sec/core": 539.619364657837, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 43.62674273763889, "core_hours": 43.62674273763889} {"step": 83300, "l2_params": 342.26756768736504, "train/loss": 2.137360990047455, "l2_grads": 2.3125, "lr": 0.00018812174372166463, "uptime": 157229.195681025, "examples_seen": 85299200.0, "progress": 0.7397671465236273, "epoch": 66.57929840528206, "img/sec/core": 542.1407415317763, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 43.6529761879825, "core_hours": 43.6529761879825} {"step": 83350, "l2_params": 342.26756198093767, "train/loss": 4.4854736328125, "l2_grads": 2.171875, "lr": 0.00018752380149857342, "uptime": 157323.069158807, "examples_seen": 85350400.0, "progress": 0.7402111844267026, "epoch": 66.61926196975102, "img/sec/core": 545.4149692729278, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 43.67905215403305, "core_hours": 43.67905215403305} {"step": 83400, "l2_params": 342.26756768736504, "train/loss": 2.2214440405368805, "l2_grads": 2.375, "lr": 0.0001869265916555113, "uptime": 157418.218260425, "examples_seen": 85401600.0, "progress": 0.7406552223297781, "epoch": 66.65922553421997, "img/sec/core": 538.1028210392461, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 43.705482460038056, "core_hours": 43.705482460038056} {"step": 83450, "l2_params": 342.2675733937923, "train/loss": 3.3810656666755676, "l2_grads": 2.125, "lr": 0.00018633011559221536, "uptime": 157511.399994705, "examples_seen": 85452800.0, "progress": 0.7410992602328534, "epoch": 66.69918909868893, "img/sec/core": 549.4639093768619, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 43.73136627511583, "core_hours": 43.73136627511583} {"step": 83500, "l2_params": 342.2675733937923, "train/loss": 3.6236605644226074, "l2_grads": 2.046875, "lr": 0.000185734374706703, "uptime": 157606.042404574, "examples_seen": 85504000.0, "progress": 0.7415432981359289, "epoch": 66.73915266315788, "img/sec/core": 540.9836887169998, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 43.75765583341277, "core_hours": 43.75765583341277} {"step": 83550, "l2_params": 342.26756768736504, "train/loss": 2.867653250694275, "l2_grads": 2.0, "lr": 0.00018513937039526878, "uptime": 157700.266426974, "examples_seen": 85555200.0, "progress": 0.7419873360390042, "epoch": 66.77911622762684, "img/sec/core": 543.3858446696203, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 43.78382917296833, "core_hours": 43.78382917296833} {"step": 83600, "l2_params": 342.26756198093767, "train/loss": 2.217512369155884, "l2_grads": 2.28125, "lr": 0.00018454510405248005, "uptime": 157793.908571174, "examples_seen": 85606400.0, "progress": 0.7424313739420797, "epoch": 66.8190797920958, "img/sec/core": 546.7623625817018, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 43.809840879690555, "core_hours": 43.809840879690555} {"step": 83650, "l2_params": 342.26756198093767, "train/loss": 4.334179043769836, "l2_grads": 1.9765625, "lr": 0.00018395157707117534, "uptime": 157889.110016158, "examples_seen": 85657600.0, "progress": 0.7428754118451552, "epoch": 66.85904335656475, "img/sec/core": 537.8069629993701, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 43.836285725519446, "core_hours": 43.836285725519446} {"step": 83700, "l2_params": 342.26756198093767, "train/loss": 2.2438803911209106, "l2_grads": 2.421875, "lr": 0.00018335879084245993, "uptime": 157983.18351445, "examples_seen": 85708800.0, "progress": 0.7433194497482305, "epoch": 66.89900692103372, "img/sec/core": 544.2552996282901, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 43.86241725282278, "core_hours": 43.86241725282278} {"step": 83750, "l2_params": 342.26756198093767, "train/loss": 2.2911027669906616, "l2_grads": 2.34375, "lr": 0.00018276674675570337, "uptime": 158077.276912692, "examples_seen": 85760000.0, "progress": 0.743763487651306, "epoch": 66.93897048550267, "img/sec/core": 544.1401942814358, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 43.88855430789, "core_hours": 43.88855430789} {"step": 83800, "l2_params": 342.26756198093767, "train/loss": 3.711134433746338, "l2_grads": 2.0625, "lr": 0.00018217544619853488, "uptime": 158171.64352408302, "examples_seen": 85811200.0, "progress": 0.7442075255543813, "epoch": 66.97893404997163, "img/sec/core": 542.5647826628965, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 43.91476725549862, "core_hours": 43.91476725549862} {"step": 83850, "l2_params": 342.26756198093767, "train/loss": 2.2160173654556274, "l2_grads": 2.171875, "lr": 0.00018158489055684183, "uptime": 158265.530428816, "examples_seen": 85862400.0, "progress": 0.7446515634574568, "epoch": 67.01889761444059, "img/sec/core": 545.3369684047896, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 43.940846951257775, "core_hours": 43.940846951257775} {"step": 83900, "l2_params": 342.26756768736504, "train/loss": 2.154929518699646, "l2_grads": 2.140625, "lr": 0.00018099508121476518, "uptime": 158359.097206507, "examples_seen": 85913600.0, "progress": 0.7450956013605321, "epoch": 67.05886117890954, "img/sec/core": 547.2027707216217, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 43.966837722838605, "core_hours": 43.966837722838605} {"step": 83950, "l2_params": 342.26756198093767, "train/loss": 2.3183756470680237, "l2_grads": 2.28125, "lr": 0.00018040601955469682, "uptime": 158453.712042575, "examples_seen": 85964800.0, "progress": 0.7455396392636076, "epoch": 67.0988247433785, "img/sec/core": 541.1413487330624, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 43.99311962174639, "core_hours": 43.99311962174639} {"step": 84000, "l2_params": 342.26756198093767, "train/loss": 4.768656969070435, "l2_grads": 2.046875, "lr": 0.0001798177069572765, "uptime": 158546.875868396, "examples_seen": 86016000.0, "progress": 0.7459836771666829, "epoch": 67.13878830784745, "img/sec/core": 549.5695303280124, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 44.01899846225221, "core_hours": 44.01899846225221} {"step": 84050, "l2_params": 342.2675562745102, "train/loss": 2.145091086626053, "l2_grads": 2.25, "lr": 0.00017923014480138803, "uptime": 158641.538949517, "examples_seen": 86067200.0, "progress": 0.7464277150697584, "epoch": 67.17875187231641, "img/sec/core": 540.8655559662649, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 44.04529376256361, "core_hours": 44.04529376256361} {"step": 84100, "l2_params": 342.26756198093767, "train/loss": 2.982805550098419, "l2_grads": 2.21875, "lr": 0.00017864333446415654, "uptime": 158736.004828786, "examples_seen": 86118400.0, "progress": 0.7468717529728338, "epoch": 67.21871543678537, "img/sec/core": 541.9946376003351, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 44.07153428458278, "core_hours": 44.07153428458278} {"step": 84150, "l2_params": 342.27924854477374, "train/loss": 2.8369637727737427, "l2_grads": 2.21875, "lr": 0.00017805727732094474, "uptime": 158830.320765156, "examples_seen": 86169600.0, "progress": 0.7473157908759092, "epoch": 67.25867900125432, "img/sec/core": 542.8562973615118, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 44.09773315579667, "core_hours": 44.09773315579667} {"step": 84200, "l2_params": 342.27924854477374, "train/loss": 4.178218245506287, "l2_grads": 1.953125, "lr": 0.0001774719747453501, "uptime": 158923.686104666, "examples_seen": 86220800.0, "progress": 0.7477598287789846, "epoch": 67.29864256572328, "img/sec/core": 548.3833751230311, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 44.12366797232722, "core_hours": 44.12366797232722} {"step": 84250, "l2_params": 342.2792542510063, "train/loss": 2.096850663423538, "l2_grads": 2.1875, "lr": 0.00017688742810920214, "uptime": 159018.605107405, "examples_seen": 86272000.0, "progress": 0.74820386668206, "epoch": 67.33860613019223, "img/sec/core": 539.4072685402457, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 44.15003436197694, "core_hours": 44.15003436197694} {"step": 84300, "l2_params": 342.27924854477374, "train/loss": 2.2050973773002625, "l2_grads": 2.453125, "lr": 0.00017630363878255758, "uptime": 159111.719092814, "examples_seen": 86323200.0, "progress": 0.7486479045851354, "epoch": 67.3785696946612, "img/sec/core": 549.8636942142032, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 44.17589935792388, "core_hours": 44.17589935792388} {"step": 84350, "l2_params": 342.2792542510063, "train/loss": 2.3698644042015076, "l2_grads": 2.3125, "lr": 0.000175720608133699, "uptime": 159206.985926568, "examples_seen": 86374400.0, "progress": 0.7490919424882108, "epoch": 67.41853325913016, "img/sec/core": 537.4378257620806, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 44.202362367300005, "core_hours": 44.202362367300005} {"step": 84400, "l2_params": 342.27924854477374, "train/loss": 2.7348524928092957, "l2_grads": 2.25, "lr": 0.0001751383375291303, "uptime": 159300.54370248, "examples_seen": 86425600.0, "progress": 0.7495359803912862, "epoch": 67.4584968235991, "img/sec/core": 547.2554205239246, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 44.22835063838667, "core_hours": 44.22835063838667} {"step": 84450, "l2_params": 342.27924854477374, "train/loss": 2.157134711742401, "l2_grads": 2.28125, "lr": 0.00017455682833357445, "uptime": 159395.023588273, "examples_seen": 86476800.0, "progress": 0.7499800182943616, "epoch": 67.49846038806807, "img/sec/core": 541.9142875783768, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 44.25459505110694, "core_hours": 44.25459505110694} {"step": 84500, "l2_params": 342.27924854477374, "train/loss": 2.568663239479065, "l2_grads": 2.1875, "lr": 0.00017397608190996902, "uptime": 159489.432184282, "examples_seen": 86528000.0, "progress": 0.750424056197437, "epoch": 67.53842395253702, "img/sec/core": 542.3234976942796, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 44.28081966110945, "core_hours": 44.28081966110945} {"step": 84550, "l2_params": 342.27924854477374, "train/loss": 3.5952083468437195, "l2_grads": 2.015625, "lr": 0.00017339609961946494, "uptime": 159583.414137811, "examples_seen": 86579200.0, "progress": 0.7508680941005125, "epoch": 67.57838751700598, "img/sec/core": 544.785441007042, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 44.306925759311945, "core_hours": 44.306925759311945} {"step": 84600, "l2_params": 342.27924854477374, "train/loss": 4.333750486373901, "l2_grads": 2.09375, "lr": 0.00017281688282142147, "uptime": 159677.50483649402, "examples_seen": 86630400.0, "progress": 0.7513121320035878, "epoch": 67.61835108147494, "img/sec/core": 544.1558062235754, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 44.33306206450167, "core_hours": 44.33306206450167} {"step": 84650, "l2_params": 342.27924854477374, "train/loss": 3.318799614906311, "l2_grads": 2.015625, "lr": 0.00017223843287340345, "uptime": 159771.838767579, "examples_seen": 86681600.0, "progress": 0.7517561699066633, "epoch": 67.65831464594389, "img/sec/core": 542.7527445440028, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 44.359265934247496, "core_hours": 44.359265934247496} {"step": 84700, "l2_params": 342.27924854477374, "train/loss": 3.7057291865348816, "l2_grads": 2.046875, "lr": 0.00017166075113117933, "uptime": 159865.345215165, "examples_seen": 86732800.0, "progress": 0.7522002078097386, "epoch": 67.69827821041285, "img/sec/core": 547.5558244570379, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 44.385239947465834, "core_hours": 44.385239947465834} {"step": 84750, "l2_params": 342.2792542510063, "train/loss": 2.2781689167022705, "l2_grads": 2.296875, "lr": 0.00017108383894871582, "uptime": 159960.031073553, "examples_seen": 86784000.0, "progress": 0.7526442457128141, "epoch": 67.7382417748818, "img/sec/core": 540.7354474223326, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 44.41154157479583, "core_hours": 44.41154157479583} {"step": 84800, "l2_params": 342.2792542510063, "train/loss": 4.4422407150268555, "l2_grads": 2.09375, "lr": 0.00017050769767817703, "uptime": 160053.192241327, "examples_seen": 86835200.0, "progress": 0.7530882836158894, "epoch": 67.77820533935076, "img/sec/core": 549.5852104839018, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 44.43741967695528, "core_hours": 44.43741967695528} {"step": 84850, "l2_params": 342.27924854477374, "train/loss": 2.29905104637146, "l2_grads": 2.265625, "lr": 0.00016993232866991984, "uptime": 160147.924623862, "examples_seen": 86886400.0, "progress": 0.7535323215189649, "epoch": 67.81816890381972, "img/sec/core": 540.4698861139892, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 44.463734227659444, "core_hours": 44.463734227659444} {"step": 84900, "l2_params": 342.27924854477374, "train/loss": 2.870417058467865, "l2_grads": 2.015625, "lr": 0.0001693577332724906, "uptime": 160241.152780722, "examples_seen": 86937600.0, "progress": 0.7539763594220402, "epoch": 67.85813246828867, "img/sec/core": 549.1903060668471, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 44.48963093789834, "core_hours": 44.48963093789834} {"step": 84950, "l2_params": 342.2792428385411, "train/loss": 2.256397545337677, "l2_grads": 2.359375, "lr": 0.00016878391283262344, "uptime": 160335.735170337, "examples_seen": 86988800.0, "progress": 0.7544203973251157, "epoch": 67.89809603275764, "img/sec/core": 541.3269870683218, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 44.5159038239025, "core_hours": 44.5159038239025} {"step": 85000, "l2_params": 342.27924854477374, "train/loss": 2.0681535601615906, "l2_grads": 2.3125, "lr": 0.000168210868695235, "uptime": 160430.063510979, "examples_seen": 87040000.0, "progress": 0.7548644352281911, "epoch": 67.9380595972266, "img/sec/core": 542.7849112104312, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 44.5421061407475, "core_hours": 44.5421061407475, "val/acc@1": 0.6640625, "val/loss": 1.380569151165534, "z/secs/eval/val": 31.71236803100328} {"step": 85051, "l2_params": 342.29094612168024, "train/loss": 3.4367374181747437, "l2_grads": 2.09375, "lr": 0.00016763860220342334, "uptime": 160554.841065351, "examples_seen": 87091200.0, "progress": 0.7553084731312665, "epoch": 67.97802316169555, "img/sec/core": 410.3302092887231, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 44.5767665725175, "core_hours": 44.5767665725175} {"step": 85100, "l2_params": 342.29094612168024, "train/loss": 4.653048515319824, "l2_grads": 2.1875, "lr": 0.00016706711469846372, "uptime": 160648.476019027, "examples_seen": 87142400.0, "progress": 0.7557525110343419, "epoch": 68.01798672616451, "img/sec/core": 546.8043501913522, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 44.60277628187194, "core_hours": 44.60277628187194} {"step": 85150, "l2_params": 342.29094041564264, "train/loss": 2.2633695006370544, "l2_grads": 2.46875, "lr": 0.00016649640751980534, "uptime": 160742.327249575, "examples_seen": 87193600.0, "progress": 0.7561965489374173, "epoch": 68.05795029063346, "img/sec/core": 545.5442587278163, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 44.62884606813528, "core_hours": 44.62884606813528} {"step": 85200, "l2_params": 342.29094041564264, "train/loss": 2.1530054211616516, "l2_grads": 2.21875, "lr": 0.0001659264820050684, "uptime": 160836.367311339, "examples_seen": 87244800.0, "progress": 0.7566405868404927, "epoch": 68.09791385510242, "img/sec/core": 544.4488129801913, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 44.65496830751417, "core_hours": 44.65496830751417} {"step": 85250, "l2_params": 342.29094041564264, "train/loss": 2.127996504306793, "l2_grads": 2.34375, "lr": 0.00016535733949004142, "uptime": 160930.6258155, "examples_seen": 87296000.0, "progress": 0.7570846247435681, "epoch": 68.13787741957138, "img/sec/core": 543.1870625969925, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 44.68115122533667, "core_hours": 44.68115122533667} {"step": 85300, "l2_params": 342.29093470960487, "train/loss": 2.870995342731476, "l2_grads": 2.109375, "lr": 0.00016478898130867754, "uptime": 161024.830275277, "examples_seen": 87347200.0, "progress": 0.7575286626466435, "epoch": 68.17784098404033, "img/sec/core": 543.4986848946229, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 44.70731913083027, "core_hours": 44.70731913083027} {"step": 85350, "l2_params": 342.29094612168024, "train/loss": 2.1833115816116333, "l2_grads": 2.328125, "lr": 0.0001642214087930918, "uptime": 161118.979499021, "examples_seen": 87398400.0, "progress": 0.7579727005497189, "epoch": 68.21780454850929, "img/sec/core": 543.8175479727736, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 44.73347169298139, "core_hours": 44.73347169298139} {"step": 85400, "l2_params": 342.29094612168024, "train/loss": 4.779126405715942, "l2_grads": 2.1875, "lr": 0.00016365462327355769, "uptime": 161213.14185936502, "examples_seen": 87449600.0, "progress": 0.7584167384527943, "epoch": 68.25776811297824, "img/sec/core": 543.7416799338914, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 44.75962790418806, "core_hours": 44.75962790418806} {"step": 85450, "l2_params": 342.29094041564264, "train/loss": 2.500058650970459, "l2_grads": 2.1875, "lr": 0.0001630886260785036, "uptime": 161306.943420849, "examples_seen": 87500800.0, "progress": 0.7588607763558697, "epoch": 68.2977316774472, "img/sec/core": 545.8331310266622, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 44.785683893489164, "core_hours": 44.785683893489164} {"step": 85500, "l2_params": 342.29093470960487, "train/loss": 4.702410101890564, "l2_grads": 2.125, "lr": 0.0001625234185345109, "uptime": 161401.41243891302, "examples_seen": 87552000.0, "progress": 0.7593048142589451, "epoch": 68.33769524191617, "img/sec/core": 541.9766294735065, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 44.81192528739584, "core_hours": 44.81192528739584} {"step": 85550, "l2_params": 342.29094041564264, "train/loss": 2.0820475220680237, "l2_grads": 2.28125, "lr": 0.00016195900196631013, "uptime": 161495.152605565, "examples_seen": 87603200.0, "progress": 0.7597488521620206, "epoch": 68.37765880638511, "img/sec/core": 546.1906227463976, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 44.83796422257694, "core_hours": 44.83796422257694} {"step": 85600, "l2_params": 342.2909518277178, "train/loss": 4.058906257152557, "l2_grads": 2.15625, "lr": 0.00016139537769677744, "uptime": 161589.04782144, "examples_seen": 87654400.0, "progress": 0.7601928900650959, "epoch": 68.41762237085408, "img/sec/core": 545.2886978625107, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 44.86404622698667, "core_hours": 44.86404622698667} {"step": 85650, "l2_params": 342.29094612168024, "train/loss": 4.24003267288208, "l2_grads": 2.140625, "lr": 0.00016083254704693273, "uptime": 161683.144736689, "examples_seen": 87705600.0, "progress": 0.7606369279681714, "epoch": 68.45758593532302, "img/sec/core": 544.1198562622614, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 44.89018425900028, "core_hours": 44.89018425900028} {"step": 85701, "l2_params": 342.29094612168024, "train/loss": 4.245756387710571, "l2_grads": 2.078125, "lr": 0.00016027051133593525, "uptime": 161777.76162945, "examples_seen": 87756800.0, "progress": 0.7610809658712467, "epoch": 68.49754949979199, "img/sec/core": 541.129585911589, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 44.916466729211656, "core_hours": 44.916466729211656} {"step": 85751, "l2_params": 342.29094612168024, "train/loss": 2.7157129049301147, "l2_grads": 2.21875, "lr": 0.00015970927188108127, "uptime": 161872.440495344, "examples_seen": 87808000.0, "progress": 0.7615250037743222, "epoch": 68.53751306426095, "img/sec/core": 540.7753833608339, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 44.942766414182216, "core_hours": 44.942766414182216} {"step": 85800, "l2_params": 342.29094612168024, "train/loss": 2.2167699337005615, "l2_grads": 2.296875, "lr": 0.000159148829997801, "uptime": 161966.164040587, "examples_seen": 87859200.0, "progress": 0.7619690416773975, "epoch": 68.5774766287299, "img/sec/core": 546.2874869623253, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 44.968800732305276, "core_hours": 44.968800732305276} {"step": 85850, "l2_params": 342.29094612168024, "train/loss": 2.250119924545288, "l2_grads": 2.140625, "lr": 0.00015858918699965466, "uptime": 162059.99053376602, "examples_seen": 87910400.0, "progress": 0.762413079580473, "epoch": 68.61744019319886, "img/sec/core": 545.6880915533305, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 44.994863647077224, "core_hours": 44.994863647077224} {"step": 85900, "l2_params": 342.29094612168024, "train/loss": 2.286934196949005, "l2_grads": 2.25, "lr": 0.00015803034419833105, "uptime": 162154.576109991, "examples_seen": 87961600.0, "progress": 0.7628571174835483, "epoch": 68.65740375766781, "img/sec/core": 541.3087496365591, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 45.02113741825084, "core_hours": 45.02113741825084} {"step": 85950, "l2_params": 342.29094041564264, "train/loss": 2.182027816772461, "l2_grads": 2.40625, "lr": 0.00015747230290364233, "uptime": 162249.144426561, "examples_seen": 88012800.0, "progress": 0.7633011553866238, "epoch": 68.69736732213677, "img/sec/core": 541.4075438480261, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 45.04740639507583, "core_hours": 45.04740639507583} {"step": 86000, "l2_params": 342.29094041564264, "train/loss": 2.103682041168213, "l2_grads": 2.3125, "lr": 0.00015691506442352311, "uptime": 162344.512952322, "examples_seen": 88064000.0, "progress": 0.7637451932896993, "epoch": 68.73733088660573, "img/sec/core": 536.8647527204938, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 45.07389765223166, "core_hours": 45.07389765223166} {"step": 86050, "l2_params": 342.29093470960487, "train/loss": 2.9054280519485474, "l2_grads": 2.15625, "lr": 0.00015635863006402596, "uptime": 162437.97374222, "examples_seen": 88115200.0, "progress": 0.7641892311927746, "epoch": 68.77729445107468, "img/sec/core": 547.8233177343819, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 45.09985898275889, "core_hours": 45.09985898275889} {"step": 86100, "l2_params": 342.29093470960487, "train/loss": 2.1087340712547302, "l2_grads": 2.34375, "lr": 0.00015580300112931839, "uptime": 162532.630641476, "examples_seen": 88166400.0, "progress": 0.76463326909585, "epoch": 68.81725801554364, "img/sec/core": 540.9008788839998, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 45.126152565885555, "core_hours": 45.126152565885555} {"step": 86150, "l2_params": 342.29093470960487, "train/loss": 2.951058030128479, "l2_grads": 2.171875, "lr": 0.00015524817892168094, "uptime": 162627.385758452, "examples_seen": 88217600.0, "progress": 0.7650773069989254, "epoch": 68.85722158001259, "img/sec/core": 540.3402120537912, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 45.152473431712224, "core_hours": 45.152473431712224} {"step": 86200, "l2_params": 342.29094041564264, "train/loss": 2.057144343852997, "l2_grads": 2.203125, "lr": 0.0001546941647415024, "uptime": 162722.64314902, "examples_seen": 88268800.0, "progress": 0.7655213449020009, "epoch": 68.89718514448155, "img/sec/core": 537.4911037842107, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 45.17893381798111, "core_hours": 45.17893381798111} {"step": 86250, "l2_params": 342.29094041564264, "train/loss": 2.285588264465332, "l2_grads": 2.21875, "lr": 0.00015414095988727875, "uptime": 162817.881650798, "examples_seen": 88320000.0, "progress": 0.7659653828050762, "epoch": 68.93714870895052, "img/sec/core": 537.5977051734044, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 45.20538895736389, "core_hours": 45.20538895736389} {"step": 86300, "l2_params": 342.29094041564264, "train/loss": 2.92885684967041, "l2_grads": 2.125, "lr": 0.00015358856565560807, "uptime": 162913.084794318, "examples_seen": 88371200.0, "progress": 0.7664094207081517, "epoch": 68.97711227341946, "img/sec/core": 537.7973678908402, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 45.23183427500833, "core_hours": 45.23183427500833} {"step": 86350, "l2_params": 342.29093470960487, "train/loss": 2.7849106788635254, "l2_grads": 2.09375, "lr": 0.00015303698334118919, "uptime": 163007.59228951202, "examples_seen": 88422400.0, "progress": 0.766853458611227, "epoch": 69.01707583788843, "img/sec/core": 541.7559728452975, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 45.25808635700667, "core_hours": 45.25808635700667} {"step": 86400, "l2_params": 342.29093470960487, "train/loss": 2.1072765588760376, "l2_grads": 2.234375, "lr": 0.00015248621423681803, "uptime": 163101.885095223, "examples_seen": 88473600.0, "progress": 0.7672974965143025, "epoch": 69.05703940235738, "img/sec/core": 542.989463659971, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 45.2842788030375, "core_hours": 45.2842788030375} {"step": 86450, "l2_params": 342.29093470960487, "train/loss": 2.195480227470398, "l2_grads": 2.234375, "lr": 0.00015193625963338354, "uptime": 163195.252407169, "examples_seen": 88524800.0, "progress": 0.7677415344173779, "epoch": 69.09700296682634, "img/sec/core": 548.3717902215295, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 45.310214167466945, "core_hours": 45.310214167466945} {"step": 86500, "l2_params": 342.29093470960487, "train/loss": 2.1229672729969025, "l2_grads": 2.265625, "lr": 0.00015138712081986706, "uptime": 163289.861354903, "examples_seen": 88576000.0, "progress": 0.7681855723204533, "epoch": 69.1369665312953, "img/sec/core": 541.175028644785, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 45.33649443072638, "core_hours": 45.33649443072638} {"step": 86550, "l2_params": 342.29093470960487, "train/loss": 2.2230268120765686, "l2_grads": 2.25, "lr": 0.0001508387990833367, "uptime": 163383.75704220802, "examples_seen": 88627200.0, "progress": 0.7686296102235287, "epoch": 69.17693009576425, "img/sec/core": 545.2859600854434, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 45.3625765660889, "core_hours": 45.3625765660889} {"step": 86600, "l2_params": 342.29093470960487, "train/loss": 2.050929844379425, "l2_grads": 2.234375, "lr": 0.00015029129570894617, "uptime": 163477.604998735, "examples_seen": 88678400.0, "progress": 0.7690736481266041, "epoch": 69.21689366023321, "img/sec/core": 545.5632908242632, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 45.38864544290195, "core_hours": 45.38864544290195} {"step": 86651, "l2_params": 342.29093470960487, "train/loss": 2.241633713245392, "l2_grads": 2.328125, "lr": 0.00014974461197993105, "uptime": 163571.407916719, "examples_seen": 88729600.0, "progress": 0.7695176860296795, "epoch": 69.25685722470216, "img/sec/core": 545.8252376406501, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 45.41470180900861, "core_hours": 45.41470180900861} {"step": 86700, "l2_params": 342.29094041564264, "train/loss": 2.0521406531333923, "l2_grads": 2.265625, "lr": 0.0001491987491776056, "uptime": 163665.150239187, "examples_seen": 88780800.0, "progress": 0.7699617239327549, "epoch": 69.29682078917112, "img/sec/core": 546.17806186187, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 45.440741343027504, "core_hours": 45.440741343027504} {"step": 86750, "l2_params": 342.29093470960487, "train/loss": 2.4868927597999573, "l2_grads": 2.328125, "lr": 0.00014865370858136028, "uptime": 163758.951017607, "examples_seen": 88832000.0, "progress": 0.7704057618358303, "epoch": 69.33678435364008, "img/sec/core": 545.8376877294901, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 45.46679711481083, "core_hours": 45.46679711481083} {"step": 86800, "l2_params": 342.29094041564264, "train/loss": 4.577837109565735, "l2_grads": 2.140625, "lr": 0.00014810949146865787, "uptime": 163852.726732305, "examples_seen": 88883200.0, "progress": 0.7708497997389057, "epoch": 69.37674791810903, "img/sec/core": 545.9835754373598, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 45.49284592444916, "core_hours": 45.49284592444916} {"step": 86851, "l2_params": 342.29094612168024, "train/loss": 2.8578761219978333, "l2_grads": 2.109375, "lr": 0.00014756609911503195, "uptime": 163947.255427081, "examples_seen": 88934400.0, "progress": 0.7712938376419811, "epoch": 69.416711482578, "img/sec/core": 541.6344753444905, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 45.519103895220276, "core_hours": 45.519103895220276} {"step": 86900, "l2_params": 342.29094612168024, "train/loss": 2.1047176122665405, "l2_grads": 2.25, "lr": 0.0001470235327940826, "uptime": 164040.505960237, "examples_seen": 88985600.0, "progress": 0.7717378755450566, "epoch": 69.45667504704696, "img/sec/core": 549.0585229613818, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 45.54500682109695, "core_hours": 45.54500682109695} {"step": 86950, "l2_params": 342.29093470960487, "train/loss": 2.271546721458435, "l2_grads": 2.171875, "lr": 0.0001464817937774736, "uptime": 164134.821844098, "examples_seen": 89036800.0, "progress": 0.7721819134481319, "epoch": 69.4966386115159, "img/sec/core": 542.8565995887955, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 45.571205677725, "core_hours": 45.571205677725} {"step": 87000, "l2_params": 342.29094041564264, "train/loss": 2.2391822934150696, "l2_grads": 2.359375, "lr": 0.00014594088333492984, "uptime": 164229.22771364, "examples_seen": 89088000.0, "progress": 0.7726259513512074, "epoch": 69.53660217598487, "img/sec/core": 542.3391601433444, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 45.59742953037555, "core_hours": 45.59742953037555} {"step": 87050, "l2_params": 342.29094041564264, "train/loss": 2.881435453891754, "l2_grads": 2.09375, "lr": 0.00014540080273423443, "uptime": 164324.036754806, "examples_seen": 89139200.0, "progress": 0.7730699892542827, "epoch": 69.57656574045382, "img/sec/core": 540.0328847366977, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 45.62376537514389, "core_hours": 45.62376537514389} {"step": 87100, "l2_params": 342.29094612168024, "train/loss": 3.4743135571479797, "l2_grads": 1.9921875, "lr": 0.0001448615532412254, "uptime": 164417.624277038, "examples_seen": 89190400.0, "progress": 0.7735140271573582, "epoch": 69.61652930492278, "img/sec/core": 547.0814781598294, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 45.64976190909722, "core_hours": 45.64976190909722} {"step": 87150, "l2_params": 342.29094041564264, "train/loss": 2.0848228335380554, "l2_grads": 2.21875, "lr": 0.00014432313611979295, "uptime": 164511.500840163, "examples_seen": 89241600.0, "progress": 0.7739580650604335, "epoch": 69.65649286939174, "img/sec/core": 545.3970436883799, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 45.6758387321875, "core_hours": 45.6758387321875} {"step": 87200, "l2_params": 342.29094041564264, "train/loss": 2.0733836889266968, "l2_grads": 2.234375, "lr": 0.00014378555263187603, "uptime": 164605.414604349, "examples_seen": 89292800.0, "progress": 0.774402102963509, "epoch": 69.69645643386069, "img/sec/core": 545.1810013556317, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 45.70192588890583, "core_hours": 45.70192588890583} {"step": 87250, "l2_params": 342.29094612168024, "train/loss": 2.27316415309906, "l2_grads": 2.40625, "lr": 0.0001432488040374599, "uptime": 164699.493957337, "examples_seen": 89344000.0, "progress": 0.7748461408665843, "epoch": 69.73641999832965, "img/sec/core": 544.2214298235765, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 45.72805904251361, "core_hours": 45.72805904251361} {"step": 87300, "l2_params": 342.29094612168024, "train/loss": 2.2522228956222534, "l2_grads": 2.40625, "lr": 0.00014271289159457313, "uptime": 164793.464542136, "examples_seen": 89395200.0, "progress": 0.7752901787696598, "epoch": 69.7763835627986, "img/sec/core": 544.8513501273696, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 45.75416198273556, "core_hours": 45.75416198273556} {"step": 87350, "l2_params": 342.29094041564264, "train/loss": 2.481394946575165, "l2_grads": 2.34375, "lr": 0.00014217781655928439, "uptime": 164887.56158627602, "examples_seen": 89446400.0, "progress": 0.7757342166727352, "epoch": 69.81634712726756, "img/sec/core": 544.1191109448258, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 45.78030005055223, "core_hours": 45.78030005055223} {"step": 87400, "l2_params": 342.29094041564264, "train/loss": 3.391106903553009, "l2_grads": 2.046875, "lr": 0.00014164358018569953, "uptime": 164981.699632284, "examples_seen": 89497600.0, "progress": 0.7761782545758106, "epoch": 69.85631069173652, "img/sec/core": 543.882119623121, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 45.80644950777666, "core_hours": 45.80644950777666} {"step": 87450, "l2_params": 342.29094612168024, "train/loss": 2.942936599254608, "l2_grads": 2.09375, "lr": 0.00014111018372595923, "uptime": 165075.842516072, "examples_seen": 89548800.0, "progress": 0.776622292478886, "epoch": 69.89627425620547, "img/sec/core": 543.8541708079866, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 45.83260030882889, "core_hours": 45.83260030882889} {"step": 87500, "l2_params": 342.2909518277178, "train/loss": 2.168856203556061, "l2_grads": 2.1875, "lr": 0.0001405776284302347, "uptime": 165171.40076326102, "examples_seen": 89600000.0, "progress": 0.7770663303819614, "epoch": 69.93623782067444, "img/sec/core": 535.7988609683214, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 45.85914426638139, "core_hours": 45.85914426638139, "val/acc@1": 0.6646404655612245, "val/loss": 1.3792164274016205, "z/secs/eval/val": 31.688646596012404} {"step": 87550, "l2_params": 342.29094612168024, "train/loss": 2.044601559638977, "l2_grads": 2.1875, "lr": 0.00014004591554672659, "uptime": 165296.057615213, "examples_seen": 89651200.0, "progress": 0.7775103682850368, "epoch": 69.97620138514338, "img/sec/core": 410.72752278164114, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 45.89377116970139, "core_hours": 45.89377116970139} {"step": 87600, "l2_params": 342.2909575337552, "train/loss": 2.279446542263031, "l2_grads": 2.21875, "lr": 0.00013951504632166078, "uptime": 165390.357358838, "examples_seen": 89702400.0, "progress": 0.7779544061881122, "epoch": 70.01616494961235, "img/sec/core": 542.9495143021129, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 45.919965542930555, "core_hours": 45.919965542930555} {"step": 87650, "l2_params": 342.29094612168024, "train/loss": 3.369343340396881, "l2_grads": 2.0625, "lr": 0.00013898502199928537, "uptime": 165484.588834022, "examples_seen": 89753600.0, "progress": 0.7783984440911876, "epoch": 70.05612851408131, "img/sec/core": 543.342868187341, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 45.946140952703885, "core_hours": 45.946140952703885} {"step": 87700, "l2_params": 342.29094041564264, "train/loss": 2.5458314418792725, "l2_grads": 2.078125, "lr": 0.00013845584382186858, "uptime": 165578.46538704602, "examples_seen": 89804800.0, "progress": 0.778842481994263, "epoch": 70.09609207855026, "img/sec/core": 545.3971023723002, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 45.97221777298834, "core_hours": 45.97221777298834} {"step": 87750, "l2_params": 342.29094612168024, "train/loss": 4.047891557216644, "l2_grads": 2.03125, "lr": 0.0001379275130296953, "uptime": 165673.336167206, "examples_seen": 89856000.0, "progress": 0.7792865198973384, "epoch": 70.13605564301922, "img/sec/core": 539.681447898511, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 45.99857076747722, "core_hours": 45.99857076747722} {"step": 87800, "l2_params": 342.29094612168024, "train/loss": 3.2772698402404785, "l2_grads": 1.9921875, "lr": 0.00013740003086106455, "uptime": 165767.91718531, "examples_seen": 89907200.0, "progress": 0.7797305578004139, "epoch": 70.17601920748817, "img/sec/core": 541.3348368030198, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 46.02484327250612, "core_hours": 46.02484327250612} {"step": 87850, "l2_params": 342.29094041564264, "train/loss": 2.5073734521865845, "l2_grads": 2.15625, "lr": 0.00013687339855228626, "uptime": 165861.227477587, "examples_seen": 89958400.0, "progress": 0.7801745957034892, "epoch": 70.21598277195713, "img/sec/core": 548.7068869960613, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 46.050762798138614, "core_hours": 46.050762798138614} {"step": 87900, "l2_params": 342.29094041564264, "train/loss": 4.6456180810928345, "l2_grads": 2.171875, "lr": 0.00013634761733767803, "uptime": 165955.77841435702, "examples_seen": 90009600.0, "progress": 0.7806186336065647, "epoch": 70.25594633642609, "img/sec/core": 541.5070622149299, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 46.07702694724139, "core_hours": 46.07702694724139} {"step": 87950, "l2_params": 342.29094041564264, "train/loss": 4.416576147079468, "l2_grads": 1.984375, "lr": 0.0001358226884495633, "uptime": 166049.632731318, "examples_seen": 90060800.0, "progress": 0.78106267150964, "epoch": 70.29590990089504, "img/sec/core": 545.52631842476, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 46.10309759084167, "core_hours": 46.10309759084167} {"step": 88000, "l2_params": 342.29094041564264, "train/loss": 4.719003200531006, "l2_grads": 2.109375, "lr": 0.00013529861311826788, "uptime": 166144.949766874, "examples_seen": 90112000.0, "progress": 0.7815067094127155, "epoch": 70.335873465364, "img/sec/core": 537.1547667355576, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 46.129574545162775, "core_hours": 46.129574545162775} {"step": 88050, "l2_params": 342.29094041564264, "train/loss": 2.1327638924121857, "l2_grads": 2.15625, "lr": 0.00013477539257211632, "uptime": 166239.075777086, "examples_seen": 90163200.0, "progress": 0.7819507473157908, "epoch": 70.37583702983295, "img/sec/core": 543.9516652695945, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 46.15572065911055, "core_hours": 46.15572065911055} {"step": 88100, "l2_params": 342.29093470960487, "train/loss": 3.2394394278526306, "l2_grads": 1.9765625, "lr": 0.00013425302803743, "uptime": 166333.948682609, "examples_seen": 90214400.0, "progress": 0.7823947852188663, "epoch": 70.41580059430191, "img/sec/core": 539.6693578397471, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 46.18207424397806, "core_hours": 46.18207424397806} {"step": 88150, "l2_params": 342.29094612168024, "train/loss": 2.2235125303268433, "l2_grads": 2.375, "lr": 0.00013373152073852432, "uptime": 166428.111885343, "examples_seen": 90265600.0, "progress": 0.7828388231219416, "epoch": 70.45576415877088, "img/sec/core": 543.736815586412, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 46.208230689181946, "core_hours": 46.208230689181946} {"step": 88200, "l2_params": 342.29094612168024, "train/loss": 3.6987149715423584, "l2_grads": 2.03125, "lr": 0.00013321087189770525, "uptime": 166522.176139732, "examples_seen": 90316800.0, "progress": 0.7832828610250171, "epoch": 70.49572772323982, "img/sec/core": 544.3087848043152, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 46.23435964873445, "core_hours": 46.23435964873445} {"step": 88250, "l2_params": 342.2909518277178, "train/loss": 4.020836591720581, "l2_grads": 2.046875, "lr": 0.00013269108273526685, "uptime": 166616.642360184, "examples_seen": 90368000.0, "progress": 0.7837268989280926, "epoch": 70.53569128770879, "img/sec/core": 541.9926800821254, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 46.26060026552667, "core_hours": 46.26060026552667} {"step": 88300, "l2_params": 342.29094612168024, "train/loss": 4.754755139350891, "l2_grads": 2.28125, "lr": 0.0001321721544694881, "uptime": 166711.395735711, "examples_seen": 90419200.0, "progress": 0.7841709368311679, "epoch": 70.57565485217773, "img/sec/core": 540.3501428337383, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 46.2869206476175, "core_hours": 46.2869206476175} {"step": 88350, "l2_params": 342.29094612168024, "train/loss": 2.349960505962372, "l2_grads": 2.296875, "lr": 0.00013165408831662993, "uptime": 166806.281246845, "examples_seen": 90470400.0, "progress": 0.7846149747342434, "epoch": 70.6156184166467, "img/sec/core": 539.5976623627702, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 46.31327773404361, "core_hours": 46.31327773404361} {"step": 88400, "l2_params": 342.29094612168024, "train/loss": 2.0095483362674713, "l2_grads": 2.21875, "lr": 0.00013113688549093322, "uptime": 166899.68935901, "examples_seen": 90521600.0, "progress": 0.7850590126373187, "epoch": 70.65558198111566, "img/sec/core": 548.1322640325001, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 46.33922443186722, "core_hours": 46.33922443186722} {"step": 88450, "l2_params": 342.29094612168024, "train/loss": 4.558243036270142, "l2_grads": 2.09375, "lr": 0.00013062054720461527, "uptime": 166993.733375095, "examples_seen": 90572800.0, "progress": 0.7855030505403942, "epoch": 70.69554554558461, "img/sec/core": 544.4259202384254, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 46.36534776966861, "core_hours": 46.36534776966861} {"step": 88500, "l2_params": 342.29094612168024, "train/loss": 2.0149600505828857, "l2_grads": 2.265625, "lr": 0.00013010507466786712, "uptime": 167088.356704451, "examples_seen": 90624000.0, "progress": 0.7859470884434695, "epoch": 70.73550911005357, "img/sec/core": 541.0927764692676, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 46.39163202782306, "core_hours": 46.39163202782306} {"step": 88550, "l2_params": 342.29094612168024, "train/loss": 2.172975778579712, "l2_grads": 2.28125, "lr": 0.00012959046908885024, "uptime": 167183.570038585, "examples_seen": 90675200.0, "progress": 0.786391126346545, "epoch": 70.77547267452252, "img/sec/core": 537.7398078292905, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 46.418080176193605, "core_hours": 46.418080176193605} {"step": 88600, "l2_params": 342.29094041564264, "train/loss": 4.10487425327301, "l2_grads": 2.078125, "lr": 0.00012907673167369423, "uptime": 167277.900518756, "examples_seen": 90726400.0, "progress": 0.7868351642496203, "epoch": 70.81543623899148, "img/sec/core": 542.7726001942953, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 46.444283087352225, "core_hours": 46.444283087352225} {"step": 88650, "l2_params": 342.29094041564264, "train/loss": 2.137860655784607, "l2_grads": 2.265625, "lr": 0.0001285638636264944, "uptime": 167372.381499291, "examples_seen": 90777600.0, "progress": 0.7872792021526958, "epoch": 70.85539980346044, "img/sec/core": 541.9080084699615, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 46.4705278041675, "core_hours": 46.4705278041675} {"step": 88700, "l2_params": 342.29094041564264, "train/loss": 2.5372273921966553, "l2_grads": 2.171875, "lr": 0.00012805186614930813, "uptime": 167467.013018912, "examples_seen": 90828800.0, "progress": 0.7877232400557712, "epoch": 70.89536336792939, "img/sec/core": 541.0459454212884, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 46.496814337395556, "core_hours": 46.496814337395556} {"step": 88750, "l2_params": 342.29093470960487, "train/loss": 2.421104669570923, "l2_grads": 2.234375, "lr": 0.00012754074044215232, "uptime": 167561.640631986, "examples_seen": 90880000.0, "progress": 0.7881672779588466, "epoch": 70.93532693239835, "img/sec/core": 541.0682816226229, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 46.523099785471665, "core_hours": 46.523099785471665} {"step": 88800, "l2_params": 342.29093470960487, "train/loss": 3.1333954334259033, "l2_grads": 2.15625, "lr": 0.00012703048770300042, "uptime": 167656.358153059, "examples_seen": 90931200.0, "progress": 0.788611315861922, "epoch": 70.9752904968673, "img/sec/core": 540.5546874536176, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 46.54941020799195, "core_hours": 46.54941020799195} {"step": 88850, "l2_params": 342.29093470960487, "train/loss": 2.265582859516144, "l2_grads": 2.171875, "lr": 0.00012652110912778023, "uptime": 167749.69293119002, "examples_seen": 90982400.0, "progress": 0.7890553537649974, "epoch": 71.01525406133626, "img/sec/core": 548.562936830793, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 46.575336535250564, "core_hours": 46.575336535250564} {"step": 88900, "l2_params": 342.29093470960487, "train/loss": 2.2333016395568848, "l2_grads": 2.453125, "lr": 0.0001260126059103704, "uptime": 167845.718712311, "examples_seen": 91033600.0, "progress": 0.7894993916680728, "epoch": 71.05521762580523, "img/sec/core": 533.1901433375491, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 46.60201036333972, "core_hours": 46.60201036333972} {"step": 88950, "l2_params": 342.29093470960487, "train/loss": 4.799022793769836, "l2_grads": 2.25, "lr": 0.00012550497924259822, "uptime": 167939.174835802, "examples_seen": 91084800.0, "progress": 0.7899434295711482, "epoch": 71.09518119027418, "img/sec/core": 547.8506713894974, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 46.62797039764278, "core_hours": 46.62797039764278} {"step": 89000, "l2_params": 342.29093470960487, "train/loss": 2.6378952860832214, "l2_grads": 2.203125, "lr": 0.0001249982303142363, "uptime": 168034.925643188, "examples_seen": 91136000.0, "progress": 0.7903874674742236, "epoch": 71.13514475474314, "img/sec/core": 534.7213396707272, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 46.65456784413889, "core_hours": 46.65456784413889} {"step": 89051, "l2_params": 342.29093470960487, "train/loss": 4.268168568611145, "l2_grads": 2.0, "lr": 0.00012449236031299984, "uptime": 168129.15594894902, "examples_seen": 91187200.0, "progress": 0.790831505377299, "epoch": 71.1751083192121, "img/sec/core": 543.3496112158894, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 46.6807429290725, "core_hours": 46.6807429290725} {"step": 89100, "l2_params": 342.29093470960487, "train/loss": 2.814502716064453, "l2_grads": 2.1875, "lr": 0.00012398737042454433, "uptime": 168224.996371023, "examples_seen": 91238400.0, "progress": 0.7912755432803744, "epoch": 71.21507188368105, "img/sec/core": 534.2213534960518, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 46.7073652685375, "core_hours": 46.7073652685375} {"step": 89150, "l2_params": 342.29093470960487, "train/loss": 2.208682656288147, "l2_grads": 2.3125, "lr": 0.00012348326183246237, "uptime": 168320.526059933, "examples_seen": 91289600.0, "progress": 0.7917195811834499, "epoch": 71.25503544815001, "img/sec/core": 535.95903623466, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 46.73390129323472, "core_hours": 46.73390129323472} {"step": 89200, "l2_params": 342.29094041564264, "train/loss": 4.664018869400024, "l2_grads": 2.03125, "lr": 0.000122980035718281, "uptime": 168414.140798279, "examples_seen": 91340800.0, "progress": 0.7921636190865252, "epoch": 71.29499901261896, "img/sec/core": 546.9224280771923, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 46.759905387219725, "core_hours": 46.759905387219725} {"step": 89250, "l2_params": 342.29094041564264, "train/loss": 2.7269753217697144, "l2_grads": 2.265625, "lr": 0.00012247769326145886, "uptime": 168508.835327798, "examples_seen": 91392000.0, "progress": 0.7926076569896007, "epoch": 71.33496257708792, "img/sec/core": 540.6859325461048, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 46.78620942319722, "core_hours": 46.78620942319722} {"step": 89300, "l2_params": 342.29094041564264, "train/loss": 4.538885593414307, "l2_grads": 2.109375, "lr": 0.00012197623563938353, "uptime": 168602.086121721, "examples_seen": 91443200.0, "progress": 0.793051694892676, "epoch": 71.37492614155688, "img/sec/core": 549.056987571456, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 46.81211242150916, "core_hours": 46.81211242150916} {"step": 89350, "l2_params": 342.29094041564264, "train/loss": 4.46789288520813, "l2_grads": 2.125, "lr": 0.00012147566402736844, "uptime": 168696.635419822, "examples_seen": 91494400.0, "progress": 0.7934957327957515, "epoch": 71.41488970602583, "img/sec/core": 541.5164472749166, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 46.83837611542611, "core_hours": 46.83837611542611} {"step": 89400, "l2_params": 342.29094041564264, "train/loss": 4.434023141860962, "l2_grads": 1.96875, "lr": 0.00012097597959865098, "uptime": 168790.333288669, "examples_seen": 91545600.0, "progress": 0.7939397706988268, "epoch": 71.4548532704948, "img/sec/core": 546.4371882737958, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 46.864403301216946, "core_hours": 46.864403301216946} {"step": 89450, "l2_params": 342.29094041564264, "train/loss": 2.4126444458961487, "l2_grads": 2.28125, "lr": 0.0001204771835243885, "uptime": 168885.441889969, "examples_seen": 91596800.0, "progress": 0.7943838086019023, "epoch": 71.49481683496374, "img/sec/core": 538.331962621415, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 46.89082235713361, "core_hours": 46.89082235713361} {"step": 89500, "l2_params": 342.29094041564264, "train/loss": 4.058161199092865, "l2_grads": 1.9765625, "lr": 0.00011997927697365667, "uptime": 168980.77813851502, "examples_seen": 91648000.0, "progress": 0.7948278465049776, "epoch": 71.5347803994327, "img/sec/core": 537.0465146348091, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 46.91730464839639, "core_hours": 46.91730464839639} {"step": 89550, "l2_params": 342.29094041564264, "train/loss": 4.024894952774048, "l2_grads": 1.984375, "lr": 0.0001194822611134464, "uptime": 169073.93155529, "examples_seen": 91699200.0, "progress": 0.7952718844080531, "epoch": 71.57474396390167, "img/sec/core": 549.630939718198, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 46.94318059750056, "core_hours": 46.94318059750056} {"step": 89600, "l2_params": 342.29094041564264, "train/loss": 2.1961089968681335, "l2_grads": 2.359375, "lr": 0.00011898613710866043, "uptime": 169168.499377687, "examples_seen": 91750400.0, "progress": 0.7957159223111285, "epoch": 71.61470752837062, "img/sec/core": 541.4103730237813, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 46.969449437055275, "core_hours": 46.969449437055275} {"step": 89650, "l2_params": 342.29094041564264, "train/loss": 2.3792765140533447, "l2_grads": 2.265625, "lr": 0.00011849090612211183, "uptime": 169262.838028773, "examples_seen": 91801600.0, "progress": 0.7961599602142039, "epoch": 71.65467109283958, "img/sec/core": 542.7255892531851, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 46.99565461791249, "core_hours": 46.99565461791249} {"step": 89700, "l2_params": 342.29094041564264, "train/loss": 2.276910126209259, "l2_grads": 2.1875, "lr": 0.0001179965693145201, "uptime": 169357.326527233, "examples_seen": 91852800.0, "progress": 0.7966039981172793, "epoch": 71.69463465730853, "img/sec/core": 541.8648918595206, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 47.021901423040276, "core_hours": 47.021901423040276} {"step": 89750, "l2_params": 342.29094041564264, "train/loss": 2.310694634914398, "l2_grads": 2.25, "lr": 0.00011750312784450915, "uptime": 169450.702030591, "examples_seen": 91904000.0, "progress": 0.7970480360203547, "epoch": 71.73459822177749, "img/sec/core": 548.3236840363053, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 47.04783906286195, "core_hours": 47.04783906286195} {"step": 89800, "l2_params": 342.29094041564264, "train/loss": 2.3167704939842224, "l2_grads": 2.3125, "lr": 0.00011701058286860469, "uptime": 169545.521637709, "examples_seen": 91955200.0, "progress": 0.7974920739234301, "epoch": 71.77456178624645, "img/sec/core": 539.9727077152271, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 47.07417784261694, "core_hours": 47.07417784261694} {"step": 89850, "l2_params": 342.29094041564264, "train/loss": 2.315218508243561, "l2_grads": 2.21875, "lr": 0.00011651893554123069, "uptime": 169639.942446822, "examples_seen": 92006400.0, "progress": 0.7979361118265055, "epoch": 71.8145253507154, "img/sec/core": 542.2533494573031, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 47.10040584514834, "core_hours": 47.10040584514834} {"step": 89900, "l2_params": 342.29094041564264, "train/loss": 3.49758380651474, "l2_grads": 2.09375, "lr": 0.00011602818701470787, "uptime": 169734.591475949, "examples_seen": 92057600.0, "progress": 0.7983801497295809, "epoch": 71.85448891518436, "img/sec/core": 540.9458551476403, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 47.12669724212806, "core_hours": 47.12669724212806} {"step": 89950, "l2_params": 342.29094041564264, "train/loss": 2.325157582759857, "l2_grads": 2.1875, "lr": 0.00011553833843924952, "uptime": 169829.083659623, "examples_seen": 92108800.0, "progress": 0.7988241876326563, "epoch": 71.89445247965331, "img/sec/core": 541.8437590208644, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 47.152945070926386, "core_hours": 47.152945070926386} {"step": 90000, "l2_params": 342.29094041564264, "train/loss": 2.4048911929130554, "l2_grads": 2.203125, "lr": 0.00011504939096296039, "uptime": 169923.83549325, "examples_seen": 92160000.0, "progress": 0.7992682255357317, "epoch": 71.93441604412227, "img/sec/core": 540.3589359711353, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 47.17926502471166, "core_hours": 47.17926502471166, "val/acc@1": 0.6650589923469388, "val/loss": 1.3766891789071414, "z/secs/eval/val": 31.735286634007934} {"step": 90050, "l2_params": 342.29094041564264, "train/loss": 3.3207985758781433, "l2_grads": 2.09375, "lr": 0.00011456134573183291, "uptime": 170048.893629952, "examples_seen": 92211200.0, "progress": 0.7997122634388072, "epoch": 71.97437960859124, "img/sec/core": 409.4095862150553, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 47.21400339601778, "core_hours": 47.21400339601778} {"step": 90100, "l2_params": 342.2909290035671, "train/loss": 2.263244867324829, "l2_grads": 2.453125, "lr": 0.00011407420388974492, "uptime": 170142.256210934, "examples_seen": 92262400.0, "progress": 0.8001563013418825, "epoch": 72.01434317306018, "img/sec/core": 548.3995778767394, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 47.239937446290554, "core_hours": 47.239937446290554} {"step": 90150, "l2_params": 342.29094041564264, "train/loss": 2.114278554916382, "l2_grads": 2.40625, "lr": 0.00011358796657845665, "uptime": 170236.760498692, "examples_seen": 92313600.0, "progress": 0.800600339244958, "epoch": 72.05430673752915, "img/sec/core": 541.7743598164607, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 47.266188637334444, "core_hours": 47.266188637334444} {"step": 90200, "l2_params": 342.29094041564264, "train/loss": 2.2255162596702576, "l2_grads": 2.3125, "lr": 0.00011310263493760858, "uptime": 170330.30901737, "examples_seen": 92364800.0, "progress": 0.8010443771480333, "epoch": 72.0942703019981, "img/sec/core": 547.3095750049698, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 47.29217433696722, "core_hours": 47.29217433696722} {"step": 90250, "l2_params": 342.29094041564264, "train/loss": 2.4205917716026306, "l2_grads": 2.25, "lr": 0.0001126182101047184, "uptime": 170425.205291043, "examples_seen": 92416000.0, "progress": 0.8014884150511088, "epoch": 72.13423386646706, "img/sec/core": 539.5364645867877, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 47.318534412987496, "core_hours": 47.318534412987496} {"step": 90300, "l2_params": 342.29094041564264, "train/loss": 4.007374584674835, "l2_grads": 2.109375, "lr": 0.0001121346932151785, "uptime": 170519.202067746, "examples_seen": 92467200.0, "progress": 0.8019324529541841, "epoch": 72.17419743093602, "img/sec/core": 544.6995290251501, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 47.34464462873834, "core_hours": 47.34464462873834} {"step": 90350, "l2_params": 342.29094041564264, "train/loss": 2.021597534418106, "l2_grads": 2.296875, "lr": 0.00011165208540225316, "uptime": 170613.253877251, "examples_seen": 92518400.0, "progress": 0.8023764908572596, "epoch": 72.21416099540497, "img/sec/core": 544.3808074450129, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 47.37077013137861, "core_hours": 47.37077013137861} {"step": 90400, "l2_params": 342.29094041564264, "train/loss": 2.0828880071640015, "l2_grads": 2.21875, "lr": 0.00011117038779707575, "uptime": 170707.711945576, "examples_seen": 92569600.0, "progress": 0.8028205287603349, "epoch": 72.25412455987393, "img/sec/core": 542.0394563207872, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 47.39700848369112, "core_hours": 47.39700848369112} {"step": 90450, "l2_params": 342.29094041564264, "train/loss": 2.5420921444892883, "l2_grads": 2.03125, "lr": 0.00011068960152864657, "uptime": 170802.675178826, "examples_seen": 92620800.0, "progress": 0.8032645666634104, "epoch": 72.29408812434288, "img/sec/core": 539.1560317372158, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 47.42338715959389, "core_hours": 47.42338715959389} {"step": 90500, "l2_params": 342.29094041564264, "train/loss": 2.214872419834137, "l2_grads": 2.328125, "lr": 0.00011020972772383015, "uptime": 170897.064501526, "examples_seen": 92672000.0, "progress": 0.8037086045664857, "epoch": 72.33405168881184, "img/sec/core": 542.4342344602461, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 47.449606415899446, "core_hours": 47.449606415899446} {"step": 90550, "l2_params": 342.29094041564264, "train/loss": 2.151147484779358, "l2_grads": 2.46875, "lr": 0.00010973076750735175, "uptime": 170990.350922651, "examples_seen": 92723200.0, "progress": 0.8041526424695612, "epoch": 72.3740152532808, "img/sec/core": 548.8472961289316, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 47.47551931065639, "core_hours": 47.47551931065639} {"step": 90600, "l2_params": 342.2909290035671, "train/loss": 3.181069493293762, "l2_grads": 2.015625, "lr": 0.00010925272200179608, "uptime": 171085.146566846, "examples_seen": 92774400.0, "progress": 0.8045966803726367, "epoch": 72.41397881774975, "img/sec/core": 540.1092047508231, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 47.50185143404389, "core_hours": 47.50185143404389} {"step": 90650, "l2_params": 342.29094041564264, "train/loss": 2.5792535543441772, "l2_grads": 2.21875, "lr": 0.00010877559232760339, "uptime": 171178.587500961, "examples_seen": 92825600.0, "progress": 0.805040718275712, "epoch": 72.45394238221871, "img/sec/core": 547.9397277534249, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 47.527807249075835, "core_hours": 47.527807249075835} {"step": 90700, "l2_params": 342.29094041564264, "train/loss": 2.175998032093048, "l2_grads": 2.40625, "lr": 0.00010829937960306777, "uptime": 171272.514856259, "examples_seen": 92876800.0, "progress": 0.8054847561787875, "epoch": 72.49390594668766, "img/sec/core": 545.1021146881741, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 47.55389818110305, "core_hours": 47.55389818110305} {"step": 90750, "l2_params": 342.29094041564264, "train/loss": 4.62316620349884, "l2_grads": 2.03125, "lr": 0.00010782408494433412, "uptime": 171366.527970516, "examples_seen": 92928000.0, "progress": 0.8059287940818628, "epoch": 72.53386951115662, "img/sec/core": 544.6048714015282, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 47.58001293506334, "core_hours": 47.58001293506334} {"step": 90800, "l2_params": 342.29094041564264, "train/loss": 2.139245867729187, "l2_grads": 2.375, "lr": 0.00010734970946539514, "uptime": 171461.004350581, "examples_seen": 92979200.0, "progress": 0.8063728319849383, "epoch": 72.57383307562559, "img/sec/core": 541.9343963515148, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 47.606256373970275, "core_hours": 47.606256373970275} {"step": 90850, "l2_params": 342.29094041564264, "train/loss": 3.9725899696350098, "l2_grads": 2.015625, "lr": 0.00010687625427808997, "uptime": 171556.592295935, "examples_seen": 93030400.0, "progress": 0.8068168698880136, "epoch": 72.61379664009453, "img/sec/core": 535.6323939215141, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 47.63280858101305, "core_hours": 47.63280858101305} {"step": 90900, "l2_params": 342.29094041564264, "train/loss": 2.331211805343628, "l2_grads": 2.25, "lr": 0.00010640372049209992, "uptime": 171649.918153552, "examples_seen": 93081600.0, "progress": 0.807260907791089, "epoch": 72.6537602045635, "img/sec/core": 548.6153709953046, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 47.6587324303511, "core_hours": 47.6587324303511} {"step": 90950, "l2_params": 342.2909290035671, "train/loss": 2.098683714866638, "l2_grads": 2.359375, "lr": 0.0001059321092149473, "uptime": 171744.689831235, "examples_seen": 93132800.0, "progress": 0.8077049456941644, "epoch": 72.69372376903246, "img/sec/core": 540.2457912715968, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 47.68505789637417, "core_hours": 47.68505789637417} {"step": 91000, "l2_params": 342.2909290035671, "train/loss": 2.1192392110824585, "l2_grads": 2.390625, "lr": 0.00010546142155199233, "uptime": 171838.115845203, "examples_seen": 93184000.0, "progress": 0.8081489835972399, "epoch": 72.73368733350141, "img/sec/core": 548.0272338017796, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 47.71100956692083, "core_hours": 47.71100956692083} {"step": 91050, "l2_params": 342.2909290035671, "train/loss": 4.396859884262085, "l2_grads": 2.125, "lr": 0.00010499165860642971, "uptime": 171933.06822044, "examples_seen": 93235200.0, "progress": 0.8085930215003153, "epoch": 72.77365089797037, "img/sec/core": 539.217685415423, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 47.73738522670889, "core_hours": 47.73738522670889} {"step": 91100, "l2_params": 342.29094041564264, "train/loss": 3.336625039577484, "l2_grads": 2.015625, "lr": 0.00010452282147928775, "uptime": 172026.797484282, "examples_seen": 93286400.0, "progress": 0.8090370594033907, "epoch": 72.81361446243932, "img/sec/core": 546.2541569334624, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 47.76342113333167, "core_hours": 47.76342113333167} {"step": 91150, "l2_params": 342.29094041564264, "train/loss": 2.7406066060066223, "l2_grads": 2.0625, "lr": 0.00010405491126942405, "uptime": 172121.493883501, "examples_seen": 93337600.0, "progress": 0.8094810973064661, "epoch": 72.85357802690828, "img/sec/core": 540.6752571614107, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 47.78972568867028, "core_hours": 47.78972568867028} {"step": 91200, "l2_params": 342.29094041564264, "train/loss": 2.329359471797943, "l2_grads": 2.265625, "lr": 0.00010358792907352435, "uptime": 172214.89583084302, "examples_seen": 93388800.0, "progress": 0.8099251352095415, "epoch": 72.89354159137724, "img/sec/core": 548.1684424900021, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 47.81567067404306, "core_hours": 47.81567067404306} {"step": 91250, "l2_params": 342.29094041564264, "train/loss": 3.2404685020446777, "l2_grads": 2.078125, "lr": 0.00010312187598609862, "uptime": 172309.424832293, "examples_seen": 93440000.0, "progress": 0.8103691731126169, "epoch": 72.93350515584619, "img/sec/core": 541.6327181567262, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 47.84192873000139, "core_hours": 47.84192873000139} {"step": 91300, "l2_params": 342.29094041564264, "train/loss": 2.056648313999176, "l2_grads": 2.171875, "lr": 0.00010265675309947983, "uptime": 172402.906365341, "examples_seen": 93491200.0, "progress": 0.8108132110156923, "epoch": 72.97346872031515, "img/sec/core": 547.7017580970515, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 47.867895822514726, "core_hours": 47.867895822514726} {"step": 91350, "l2_params": 342.29094041564264, "train/loss": 4.284328937530518, "l2_grads": 2.0625, "lr": 0.00010219256150382053, "uptime": 172497.515893357, "examples_seen": 93542400.0, "progress": 0.8112572489187677, "epoch": 73.0134322847841, "img/sec/core": 541.171709379553, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 47.89417624696361, "core_hours": 47.89417624696361} {"step": 91401, "l2_params": 342.29094041564264, "train/loss": 3.468083620071411, "l2_grads": 2.0, "lr": 0.00010172930228709034, "uptime": 172591.692170824, "examples_seen": 93593600.0, "progress": 0.8117012868218431, "epoch": 73.05339584925306, "img/sec/core": 543.6613272161841, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 47.92033632403778, "core_hours": 47.92033632403778} {"step": 91450, "l2_params": 342.29094041564264, "train/loss": 4.175688147544861, "l2_grads": 2.015625, "lr": 0.00010126697653507394, "uptime": 172686.183826712, "examples_seen": 93644800.0, "progress": 0.8121453247249185, "epoch": 73.09335941372203, "img/sec/core": 541.8467855055787, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 47.94658400622889, "core_hours": 47.94658400622889} {"step": 91500, "l2_params": 342.29094041564264, "train/loss": 4.236873149871826, "l2_grads": 1.953125, "lr": 0.0001008055853313676, "uptime": 172780.60253194, "examples_seen": 93696000.0, "progress": 0.812589362627994, "epoch": 73.13332297819098, "img/sec/core": 542.2654322186893, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 47.97281142434778, "core_hours": 47.97281142434778} {"step": 91550, "l2_params": 342.29094041564264, "train/loss": 3.416196823120117, "l2_grads": 2.203125, "lr": 0.0001003451297573777, "uptime": 172874.818243835, "examples_seen": 93747200.0, "progress": 0.8130334005310693, "epoch": 73.17328654265994, "img/sec/core": 543.4337752185281, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 47.998982455429726, "core_hours": 47.998982455429726} {"step": 91600, "l2_params": 342.29094041564264, "train/loss": 4.741888403892517, "l2_grads": 2.265625, "lr": 9.988561089231769e-05, "uptime": 172969.013350953, "examples_seen": 93798400.0, "progress": 0.8134774384341448, "epoch": 73.21325010712889, "img/sec/core": 543.5526490337145, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 48.025147762962504, "core_hours": 48.025147762962504} {"step": 91650, "l2_params": 342.29094041564264, "train/loss": 2.2332960963249207, "l2_grads": 2.3125, "lr": 9.94270298132051e-05, "uptime": 173063.179500673, "examples_seen": 93849600.0, "progress": 0.8139214763372201, "epoch": 73.25321367159785, "img/sec/core": 543.7197990174111, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 48.05130502677361, "core_hours": 48.05130502677361} {"step": 91700, "l2_params": 342.29094041564264, "train/loss": 2.0673897862434387, "l2_grads": 2.296875, "lr": 9.896938759486002e-05, "uptime": 173157.278211753, "examples_seen": 93900800.0, "progress": 0.8143655142402956, "epoch": 73.29317723606681, "img/sec/core": 544.1094719827611, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 48.07744355762917, "core_hours": 48.07744355762917} {"step": 91750, "l2_params": 342.29094041564264, "train/loss": 2.2527629733085632, "l2_grads": 2.390625, "lr": 9.851268530990162e-05, "uptime": 173250.92974828, "examples_seen": 93952000.0, "progress": 0.8148095521433709, "epoch": 73.33314080053576, "img/sec/core": 546.7075277001734, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 48.10345787333111, "core_hours": 48.10345787333111} {"step": 91800, "l2_params": 342.2909290035671, "train/loss": 2.040144443511963, "l2_grads": 2.21875, "lr": 9.80569240287464e-05, "uptime": 173345.191448584, "examples_seen": 94003200.0, "progress": 0.8152535900464464, "epoch": 73.37310436500472, "img/sec/core": 543.1686446868764, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 48.12964167897111, "core_hours": 48.12964167897111} {"step": 91850, "l2_params": 342.2909290035671, "train/loss": 2.443311035633087, "l2_grads": 2.171875, "lr": 9.760210481960528e-05, "uptime": 173438.911791039, "examples_seen": 94054400.0, "progress": 0.8156976279495217, "epoch": 73.41306792947367, "img/sec/core": 546.3061557269316, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 48.15567510743083, "core_hours": 48.15567510743083} {"step": 91900, "l2_params": 342.2909290035671, "train/loss": 2.152082145214081, "l2_grads": 2.375, "lr": 9.714822874848103e-05, "uptime": 173533.344618675, "examples_seen": 94105600.0, "progress": 0.8161416658525972, "epoch": 73.45303149394263, "img/sec/core": 542.1843365460328, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 48.181906448440834, "core_hours": 48.181906448440834} {"step": 91950, "l2_params": 342.29094041564264, "train/loss": 2.082663983106613, "l2_grads": 2.28125, "lr": 9.669529687916576e-05, "uptime": 173627.00576533002, "examples_seen": 94156800.0, "progress": 0.8165857037556726, "epoch": 73.4929950584116, "img/sec/core": 546.6514326222124, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 48.20792343362278, "core_hours": 48.20792343362278} {"step": 92000, "l2_params": 342.29094041564264, "train/loss": 4.72079074382782, "l2_grads": 2.28125, "lr": 9.624331027323879e-05, "uptime": 173722.419285078, "examples_seen": 94208000.0, "progress": 0.817029741658748, "epoch": 73.53295862288054, "img/sec/core": 536.6115843460184, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 48.23442718910834, "core_hours": 48.23442718910834} {"step": 92050, "l2_params": 342.29094041564264, "train/loss": 2.9044255018234253, "l2_grads": 2.203125, "lr": 9.579226999006394e-05, "uptime": 173817.040708623, "examples_seen": 94259200.0, "progress": 0.8174737795618234, "epoch": 73.5729221873495, "img/sec/core": 541.1036748527567, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 48.26071091787084, "core_hours": 48.26071091787084} {"step": 92100, "l2_params": 342.29094041564264, "train/loss": 2.630531668663025, "l2_grads": 2.265625, "lr": 9.534217708678702e-05, "uptime": 173910.33404893, "examples_seen": 94310400.0, "progress": 0.8179178174648988, "epoch": 73.61288575181845, "img/sec/core": 548.8065903902819, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 48.28662573462278, "core_hours": 48.28662573462278} {"step": 92150, "l2_params": 342.29094041564264, "train/loss": 3.5260486602783203, "l2_grads": 2.046875, "lr": 9.48930326183334e-05, "uptime": 174004.682869096, "examples_seen": 94361600.0, "progress": 0.8183618553679742, "epoch": 73.65284931628742, "img/sec/core": 542.6670933448992, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 48.31283374022444, "core_hours": 48.31283374022444} {"step": 92200, "l2_params": 342.29094041564264, "train/loss": 4.567097306251526, "l2_grads": 2.125, "lr": 9.444483763740524e-05, "uptime": 174099.33875887402, "examples_seen": 94412800.0, "progress": 0.8188058932710496, "epoch": 73.69281288075638, "img/sec/core": 540.906647437055, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 48.339127042940554, "core_hours": 48.339127042940554} {"step": 92250, "l2_params": 342.29094041564264, "train/loss": 2.2067896127700806, "l2_grads": 2.328125, "lr": 9.399759319447973e-05, "uptime": 174192.670637005, "examples_seen": 94464000.0, "progress": 0.819249931174125, "epoch": 73.73277644522533, "img/sec/core": 548.5799817307817, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 48.36505256464361, "core_hours": 48.36505256464361} {"step": 92300, "l2_params": 342.29094041564264, "train/loss": 3.461094319820404, "l2_grads": 2.015625, "lr": 9.355130033780596e-05, "uptime": 174287.527495474, "examples_seen": 94515200.0, "progress": 0.8196939690772004, "epoch": 73.77274000969429, "img/sec/core": 539.7606543836409, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 48.39140169199611, "core_hours": 48.39140169199611} {"step": 92350, "l2_params": 342.29094041564264, "train/loss": 3.3446878790855408, "l2_grads": 2.015625, "lr": 9.310596011340265e-05, "uptime": 174381.646433929, "examples_seen": 94566400.0, "progress": 0.8201380069802758, "epoch": 73.81270357416324, "img/sec/core": 543.992535832465, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 48.41754584156695, "core_hours": 48.41754584156695} {"step": 92400, "l2_params": 342.29094041564264, "train/loss": 2.161632716655731, "l2_grads": 2.3125, "lr": 9.266157356505598e-05, "uptime": 174476.260839906, "examples_seen": 94617600.0, "progress": 0.8205820448833513, "epoch": 73.8526671386322, "img/sec/core": 541.1438086125435, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 48.443827621005, "core_hours": 48.443827621005} {"step": 92450, "l2_params": 342.29094041564264, "train/loss": 4.7593584060668945, "l2_grads": 2.21875, "lr": 9.221814173431647e-05, "uptime": 174569.674677698, "examples_seen": 94668800.0, "progress": 0.8210260827864266, "epoch": 73.89263070310116, "img/sec/core": 548.0986672874216, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 48.46977590928056, "core_hours": 48.46977590928056} {"step": 92500, "l2_params": 342.29094041564264, "train/loss": 4.645861268043518, "l2_grads": 2.171875, "lr": 9.177566566049734e-05, "uptime": 174664.358157004, "examples_seen": 94720000.0, "progress": 0.8214701206895021, "epoch": 73.93259426757011, "img/sec/core": 540.7490343118086, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 48.49607687575444, "core_hours": 48.49607687575444, "val/acc@1": 0.6649194834183674, "val/loss": 1.3744782029974216, "z/secs/eval/val": 31.8001477799844} {"step": 92550, "l2_params": 342.29094041564264, "train/loss": 4.728032350540161, "l2_grads": 2.15625, "lr": 9.133414638067184e-05, "uptime": 174789.149358813, "examples_seen": 94771200.0, "progress": 0.8219141585925774, "epoch": 73.97255783203907, "img/sec/core": 410.28533468536403, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 48.53074109847917, "core_hours": 48.53074109847917} {"step": 92600, "l2_params": 342.29094041564264, "train/loss": 2.143768310546875, "l2_grads": 2.328125, "lr": 9.08935849296702e-05, "uptime": 174882.44562278801, "examples_seen": 94822400.0, "progress": 0.8223581964956529, "epoch": 74.01252139650802, "img/sec/core": 548.7893921852815, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 48.556656727361116, "core_hours": 48.556656727361116} {"step": 92650, "l2_params": 342.29094041564264, "train/loss": 2.1759620308876038, "l2_grads": 2.234375, "lr": 9.045398234007823e-05, "uptime": 174977.08817559, "examples_seen": 94873600.0, "progress": 0.8228022343987282, "epoch": 74.05248496097698, "img/sec/core": 540.9828717016968, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 48.58294632536167, "core_hours": 48.58294632536167} {"step": 92700, "l2_params": 342.29094041564264, "train/loss": 2.173651695251465, "l2_grads": 2.21875, "lr": 9.001533964223385e-05, "uptime": 175070.43586760102, "examples_seen": 94924800.0, "progress": 0.8232462723018037, "epoch": 74.09244852544595, "img/sec/core": 548.4870476921949, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 48.60887623980917, "core_hours": 48.60887623980917} {"step": 92750, "l2_params": 342.29094041564264, "train/loss": 2.0409752130508423, "l2_grads": 2.234375, "lr": 8.957765786422552e-05, "uptime": 175165.29238315, "examples_seen": 94976000.0, "progress": 0.823690310204879, "epoch": 74.1324120899149, "img/sec/core": 539.7626056964282, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 48.635225271906116, "core_hours": 48.635225271906116} {"step": 92800, "l2_params": 342.29094041564264, "train/loss": 3.498321771621704, "l2_grads": 1.9375, "lr": 8.91409380318896e-05, "uptime": 175258.653031775, "examples_seen": 95027200.0, "progress": 0.8241343481079545, "epoch": 74.17237565438386, "img/sec/core": 548.4109285235428, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 48.66115878541305, "core_hours": 48.66115878541305} {"step": 92850, "l2_params": 342.29094041564264, "train/loss": 2.30840665102005, "l2_grads": 2.453125, "lr": 8.87051811688075e-05, "uptime": 175353.294083307, "examples_seen": 95078400.0, "progress": 0.82457838601103, "epoch": 74.21233921885282, "img/sec/core": 540.991453192879, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 48.68744796639417, "core_hours": 48.68744796639417} {"step": 92901, "l2_params": 342.29094041564264, "train/loss": 2.4292648434638977, "l2_grads": 2.34375, "lr": 8.827038829630394e-05, "uptime": 175447.83969380602, "examples_seen": 95129600.0, "progress": 0.8250224239141053, "epoch": 74.25230278332177, "img/sec/core": 541.5375682674686, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 48.71371063597723, "core_hours": 48.71371063597723} {"step": 92950, "l2_params": 342.29094041564264, "train/loss": 3.5719576478004456, "l2_grads": 2.015625, "lr": 8.783656043344395e-05, "uptime": 175541.295287359, "examples_seen": 95180800.0, "progress": 0.8254664618171808, "epoch": 74.29226634779073, "img/sec/core": 547.8537779653326, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 48.739670523075276, "core_hours": 48.739670523075276} {"step": 93000, "l2_params": 342.29094041564264, "train/loss": 4.416687488555908, "l2_grads": 2.140625, "lr": 8.740369859703118e-05, "uptime": 175636.095794446, "examples_seen": 95232000.0, "progress": 0.8259104997202561, "epoch": 74.33222991225968, "img/sec/core": 540.081499279468, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 48.76600399726611, "core_hours": 48.76600399726611} {"step": 93050, "l2_params": 342.29094041564264, "train/loss": 4.708588242530823, "l2_grads": 2.109375, "lr": 8.697180380160461e-05, "uptime": 175730.379583297, "examples_seen": 95283200.0, "progress": 0.8263545376233316, "epoch": 74.37219347672864, "img/sec/core": 543.0413926291718, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 48.792193938613615, "core_hours": 48.792193938613615} {"step": 93100, "l2_params": 342.29094041564264, "train/loss": 4.245914101600647, "l2_grads": 2.0625, "lr": 8.654087705943698e-05, "uptime": 175823.923456788, "examples_seen": 95334400.0, "progress": 0.8267985755264069, "epoch": 74.4121570411976, "img/sec/core": 547.3367532180164, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 48.818178347916664, "core_hours": 48.818178347916664} {"step": 93150, "l2_params": 342.29094041564264, "train/loss": 3.494325041770935, "l2_grads": 2.0, "lr": 8.611091938053228e-05, "uptime": 175919.304650553, "examples_seen": 95385600.0, "progress": 0.8272426134294824, "epoch": 74.45212060566655, "img/sec/core": 536.7934493055843, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 48.8446731239625, "core_hours": 48.8446731239625} {"step": 93200, "l2_params": 342.29094041564264, "train/loss": 2.1312942504882812, "l2_grads": 2.359375, "lr": 8.568193177262272e-05, "uptime": 176014.24755755402, "examples_seen": 95436800.0, "progress": 0.8276866513325577, "epoch": 74.49208417013551, "img/sec/core": 539.2714592092304, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 48.87104615368501, "core_hours": 48.87104615368501} {"step": 93250, "l2_params": 342.29094041564264, "train/loss": 2.1607476472854614, "l2_grads": 2.390625, "lr": 8.525391524116735e-05, "uptime": 176108.669935185, "examples_seen": 95488000.0, "progress": 0.8281306892356332, "epoch": 74.53204773460446, "img/sec/core": 542.2443416972459, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 48.89727459191583, "core_hours": 48.89727459191583} {"step": 93300, "l2_params": 342.29094041564264, "train/loss": 2.2084767818450928, "l2_grads": 2.359375, "lr": 8.482687078934878e-05, "uptime": 176202.82333812802, "examples_seen": 95539200.0, "progress": 0.8285747271387086, "epoch": 74.57201129907342, "img/sec/core": 543.7934094743885, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 48.92342831495556, "core_hours": 48.92342831495556} {"step": 93350, "l2_params": 342.29094041564264, "train/loss": 2.3164129853248596, "l2_grads": 2.375, "lr": 8.440079941807163e-05, "uptime": 176297.168405301, "examples_seen": 95590400.0, "progress": 0.829018765041784, "epoch": 74.61197486354239, "img/sec/core": 542.6886803326491, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 48.94963527805917, "core_hours": 48.94963527805917} {"step": 93400, "l2_params": 342.29094041564264, "train/loss": 2.2050397396087646, "l2_grads": 2.328125, "lr": 8.397570212595977e-05, "uptime": 176390.783895769, "examples_seen": 95641600.0, "progress": 0.8294628029448594, "epoch": 74.65193842801133, "img/sec/core": 546.9180340137519, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 48.97563958096694, "core_hours": 48.97563958096694} {"step": 93450, "l2_params": 342.29094041564264, "train/loss": 4.5779770612716675, "l2_grads": 1.9921875, "lr": 8.35515799093538e-05, "uptime": 176485.918488362, "examples_seen": 95692800.0, "progress": 0.8299068408479348, "epoch": 74.6919019924803, "img/sec/core": 538.1848873737549, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 49.00206585668722, "core_hours": 49.00206585668722} {"step": 93500, "l2_params": 342.29094041564264, "train/loss": 3.6423120498657227, "l2_grads": 2.0625, "lr": 8.312843376230925e-05, "uptime": 176580.360575375, "examples_seen": 95744000.0, "progress": 0.8303508787510102, "epoch": 74.73186555694924, "img/sec/core": 542.1311792161637, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 49.02829976974639, "core_hours": 49.02829976974639} {"step": 93550, "l2_params": 342.29094041564264, "train/loss": 2.196761429309845, "l2_grads": 2.21875, "lr": 8.270626467659365e-05, "uptime": 176674.812429102, "examples_seen": 95795200.0, "progress": 0.8307949166540856, "epoch": 74.77182912141821, "img/sec/core": 542.0751206005087, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 49.05453639578166, "core_hours": 49.05453639578166} {"step": 93600, "l2_params": 342.29094041564264, "train/loss": 2.1256775557994843, "l2_grads": 2.359375, "lr": 8.228507364168441e-05, "uptime": 176769.341305341, "examples_seen": 95846400.0, "progress": 0.831238954557161, "epoch": 74.81179268588717, "img/sec/core": 541.6334355922211, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 49.080794416959165, "core_hours": 49.080794416959165} {"step": 93650, "l2_params": 342.29094041564264, "train/loss": 2.1614295542240143, "l2_grads": 2.21875, "lr": 8.186486164476726e-05, "uptime": 176863.853802996, "examples_seen": 95897600.0, "progress": 0.8316829924602364, "epoch": 74.85175625035612, "img/sec/core": 541.7272981917813, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 49.10704788853, "core_hours": 49.10704788853} {"step": 93700, "l2_params": 342.29094041564264, "train/loss": 2.074503540992737, "l2_grads": 2.21875, "lr": 8.144562967073252e-05, "uptime": 176958.108183494, "examples_seen": 95948800.0, "progress": 0.8321270303633118, "epoch": 74.89171981482508, "img/sec/core": 543.210827225943, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 49.133229660890564, "core_hours": 49.133229660890564} {"step": 93750, "l2_params": 342.29094041564264, "train/loss": 2.1174222826957703, "l2_grads": 2.296875, "lr": 8.10273787021741e-05, "uptime": 177051.74188793902, "examples_seen": 96000000.0, "progress": 0.8325710682663873, "epoch": 74.93168337929403, "img/sec/core": 546.8116454804165, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 49.159239023236395, "core_hours": 49.159239023236395} {"step": 93800, "l2_params": 342.29094041564264, "train/loss": 2.1329389810562134, "l2_grads": 2.203125, "lr": 8.061010971938606e-05, "uptime": 177146.681731733, "examples_seen": 96051200.0, "progress": 0.8330151061694626, "epoch": 74.97164694376299, "img/sec/core": 539.2888586493082, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 49.18561120206805, "core_hours": 49.18561120206805} {"step": 93850, "l2_params": 342.29094041564264, "train/loss": 2.665432393550873, "l2_grads": 2.140625, "lr": 8.019382370036102e-05, "uptime": 177241.04763883402, "examples_seen": 96102400.0, "progress": 0.8334591440725381, "epoch": 75.01161050823195, "img/sec/core": 542.5688320379344, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 49.21182395404056, "core_hours": 49.21182395404056} {"step": 93900, "l2_params": 342.29094041564264, "train/loss": 2.388672113418579, "l2_grads": 2.15625, "lr": 7.977852162078848e-05, "uptime": 177334.434033917, "examples_seen": 96153600.0, "progress": 0.8339031819756134, "epoch": 75.0515740727009, "img/sec/core": 548.2597326356093, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 49.23776461934139, "core_hours": 49.23776461934139} {"step": 93951, "l2_params": 342.29094041564264, "train/loss": 3.0852783918380737, "l2_grads": 2.171875, "lr": 7.936420445405077e-05, "uptime": 177428.931710849, "examples_seen": 96204800.0, "progress": 0.8343472198786889, "epoch": 75.09153763716986, "img/sec/core": 541.8122610236028, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 49.264013974044715, "core_hours": 49.264013974044715} {"step": 94000, "l2_params": 342.29094041564264, "train/loss": 2.2769872546195984, "l2_grads": 2.375, "lr": 7.895087317122258e-05, "uptime": 177523.888665059, "examples_seen": 96256000.0, "progress": 0.8347912577817642, "epoch": 75.13150120163881, "img/sec/core": 539.1916834944592, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 49.290390905769726, "core_hours": 49.290390905769726} {"step": 94050, "l2_params": 342.29094041564264, "train/loss": 2.668339431285858, "l2_grads": 2.234375, "lr": 7.85385287410671e-05, "uptime": 177618.7504345, "examples_seen": 96307200.0, "progress": 0.8352352956848397, "epoch": 75.17146476610777, "img/sec/core": 539.7327110986361, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 49.316741397281106, "core_hours": 49.316741397281106} {"step": 94100, "l2_params": 342.29094041564264, "train/loss": 2.311309814453125, "l2_grads": 2.265625, "lr": 7.812717213003548e-05, "uptime": 177713.067045844, "examples_seen": 96358400.0, "progress": 0.835679333587915, "epoch": 75.21142833057674, "img/sec/core": 542.8524124265431, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 49.34294045598778, "core_hours": 49.34294045598778} {"step": 94150, "l2_params": 342.29094041564264, "train/loss": 2.1701409816741943, "l2_grads": 2.34375, "lr": 7.771680430226272e-05, "uptime": 177806.491438417, "examples_seen": 96409600.0, "progress": 0.8361233714909905, "epoch": 75.25139189504569, "img/sec/core": 548.0367449004598, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 49.368891676146944, "core_hours": 49.368891676146944} {"step": 94200, "l2_params": 342.29094041564264, "train/loss": 4.101945877075195, "l2_grads": 2.015625, "lr": 7.73074262195669e-05, "uptime": 177902.189272558, "examples_seen": 96460800.0, "progress": 0.8365674093940659, "epoch": 75.29135545951465, "img/sec/core": 535.0173330418621, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 49.39547440785278, "core_hours": 49.39547440785278} {"step": 94250, "l2_params": 342.29094041564264, "train/loss": 3.116343379020691, "l2_grads": 2.046875, "lr": 7.689903884144618e-05, "uptime": 177997.334811358, "examples_seen": 96512000.0, "progress": 0.8370114472971413, "epoch": 75.3313190239836, "img/sec/core": 538.1229708269883, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 49.421903724186116, "core_hours": 49.421903724186116} {"step": 94300, "l2_params": 342.29094041564264, "train/loss": 2.8528313040733337, "l2_grads": 2.03125, "lr": 7.649164312507661e-05, "uptime": 178092.02155136, "examples_seen": 96563200.0, "progress": 0.8374554852002167, "epoch": 75.37128258845256, "img/sec/core": 540.7304127159447, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 49.44820559640889, "core_hours": 49.44820559640889} {"step": 94350, "l2_params": 342.29094041564264, "train/loss": 4.444255709648132, "l2_grads": 1.90625, "lr": 7.608524002531023e-05, "uptime": 178185.420753344, "examples_seen": 96614400.0, "progress": 0.8378995231032921, "epoch": 75.41124615292152, "img/sec/core": 548.1845552467843, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 49.47414981918222, "core_hours": 49.47414981918222} {"step": 94400, "l2_params": 342.29094041564264, "train/loss": 2.601940631866455, "l2_grads": 2.171875, "lr": 7.56798304946722e-05, "uptime": 178279.362283518, "examples_seen": 96665600.0, "progress": 0.8383435610063675, "epoch": 75.45120971739047, "img/sec/core": 545.0198640064104, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 49.500244688675004, "core_hours": 49.500244688675004} {"step": 94450, "l2_params": 342.29094041564264, "train/loss": 2.2514621019363403, "l2_grads": 2.28125, "lr": 7.527541548335916e-05, "uptime": 178373.29413609402, "examples_seen": 96716800.0, "progress": 0.8387875989094429, "epoch": 75.49117328185943, "img/sec/core": 545.0760162381845, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 49.526336869946114, "core_hours": 49.526336869946114} {"step": 94500, "l2_params": 342.29094041564264, "train/loss": 2.1493051052093506, "l2_grads": 2.28125, "lr": 7.48719959392372e-05, "uptime": 178467.159456024, "examples_seen": 96768000.0, "progress": 0.8392316368125183, "epoch": 75.53113684632838, "img/sec/core": 545.4623713868867, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 49.55241056992667, "core_hours": 49.55241056992667} {"step": 94551, "l2_params": 342.29094041564264, "train/loss": 2.1060990691184998, "l2_grads": 2.5, "lr": 7.446957280783852e-05, "uptime": 178561.159847795, "examples_seen": 96819200.0, "progress": 0.8396756747155937, "epoch": 75.57110041079734, "img/sec/core": 544.678580965198, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 49.57852178986306, "core_hours": 49.57852178986306} {"step": 94600, "l2_params": 342.29094041564264, "train/loss": 2.323840618133545, "l2_grads": 2.140625, "lr": 7.406814703236053e-05, "uptime": 178655.123991933, "examples_seen": 96870400.0, "progress": 0.8401197126186691, "epoch": 75.6110639752663, "img/sec/core": 544.8886963180438, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 49.6046229410125, "core_hours": 49.6046229410125} {"step": 94650, "l2_params": 342.29094041564264, "train/loss": 4.583529949188232, "l2_grads": 2.09375, "lr": 7.366771955366269e-05, "uptime": 178749.763326915, "examples_seen": 96921600.0, "progress": 0.8405637505217446, "epoch": 75.65102753973525, "img/sec/core": 541.0012655915059, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 49.630911645174166, "core_hours": 49.630911645174166} {"step": 94700, "l2_params": 342.29094041564264, "train/loss": 2.094210058450699, "l2_grads": 2.375, "lr": 7.326829131026457e-05, "uptime": 178844.489795106, "examples_seen": 96972800.0, "progress": 0.8410077884248199, "epoch": 75.69099110420422, "img/sec/core": 540.5036309046236, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 49.657224553005, "core_hours": 49.657224553005} {"step": 94750, "l2_params": 342.29094041564264, "train/loss": 2.476179003715515, "l2_grads": 2.21875, "lr": 7.286986323834431e-05, "uptime": 178938.796787239, "examples_seen": 97024000.0, "progress": 0.8414518263278954, "epoch": 75.73095466867316, "img/sec/core": 542.9077827844611, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 49.68342093970861, "core_hours": 49.68342093970861} {"step": 94800, "l2_params": 342.29094041564264, "train/loss": 2.5858357548713684, "l2_grads": 2.140625, "lr": 7.247243627173512e-05, "uptime": 179032.209604543, "examples_seen": 97075200.0, "progress": 0.8418958642309707, "epoch": 75.77091823314213, "img/sec/core": 548.1046549894726, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 49.709368944515276, "core_hours": 49.709368944515276} {"step": 94850, "l2_params": 342.29094041564264, "train/loss": 2.3859930634498596, "l2_grads": 2.25, "lr": 7.207601134192462e-05, "uptime": 179126.937469817, "examples_seen": 97126400.0, "progress": 0.8423399021340462, "epoch": 75.81088179761109, "img/sec/core": 540.4956593490302, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 49.73568224042472, "core_hours": 49.73568224042472} {"step": 94900, "l2_params": 342.29094041564264, "train/loss": 3.0675269961357117, "l2_grads": 2.296875, "lr": 7.168058937805106e-05, "uptime": 179221.433526467, "examples_seen": 97177600.0, "progress": 0.8427839400371215, "epoch": 75.85084536208004, "img/sec/core": 541.8215512381952, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 49.76193114504972, "core_hours": 49.76193114504972} {"step": 94950, "l2_params": 342.29094041564264, "train/loss": 2.280742645263672, "l2_grads": 2.453125, "lr": 7.12861713069022e-05, "uptime": 179314.856392121, "examples_seen": 97228800.0, "progress": 0.843227977940197, "epoch": 75.890808926549, "img/sec/core": 548.0457021049627, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 49.78788194106472, "core_hours": 49.78788194106472} {"step": 95000, "l2_params": 342.29094041564264, "train/loss": 2.890575408935547, "l2_grads": 2.1875, "lr": 7.089275805291342e-05, "uptime": 179410.161550076, "examples_seen": 97280000.0, "progress": 0.8436720158432723, "epoch": 75.93077249101796, "img/sec/core": 537.2217107511694, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 49.81435559605222, "core_hours": 49.81435559605222, "val/acc@1": 0.665397799744898, "val/loss": 1.373689472979429, "z/secs/eval/val": 31.669325399998343} {"step": 95050, "l2_params": 342.29094041564264, "train/loss": 2.0845552682876587, "l2_grads": 2.203125, "lr": 7.050035053816422e-05, "uptime": 179534.952741046, "examples_seen": 97331200.0, "progress": 0.8441160537463478, "epoch": 75.97073605548691, "img/sec/core": 410.2853703216314, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 49.84901981576611, "core_hours": 49.84901981576611} {"step": 95100, "l2_params": 342.29094041564264, "train/loss": 2.3131989240646362, "l2_grads": 2.375, "lr": 7.010894968237751e-05, "uptime": 179628.301071819, "examples_seen": 97382400.0, "progress": 0.8445600916494233, "epoch": 76.01069961995587, "img/sec/core": 548.4832945165625, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 49.874949907647505, "core_hours": 49.874949907647505} {"step": 95150, "l2_params": 342.29094041564264, "train/loss": 2.1622583866119385, "l2_grads": 2.25, "lr": 6.97185564029163e-05, "uptime": 179722.765858123, "examples_seen": 97433600.0, "progress": 0.8450041295524986, "epoch": 76.05066318442482, "img/sec/core": 542.0009085209713, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 49.90119012606528, "core_hours": 49.90119012606528} {"step": 95200, "l2_params": 342.29094041564264, "train/loss": 4.582998275756836, "l2_grads": 2.15625, "lr": 6.932917161478221e-05, "uptime": 179816.029922968, "examples_seen": 97484800.0, "progress": 0.845448167455574, "epoch": 76.09062674889378, "img/sec/core": 548.9788600259052, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 49.92709681074445, "core_hours": 49.92709681074445} {"step": 95250, "l2_params": 342.29094041564264, "train/loss": 2.1357076168060303, "l2_grads": 2.15625, "lr": 6.894079623061334e-05, "uptime": 179910.50451996102, "examples_seen": 97536000.0, "progress": 0.8458922053586494, "epoch": 76.13059031336275, "img/sec/core": 541.9446245829362, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 49.953339754353614, "core_hours": 49.953339754353614} {"step": 95300, "l2_params": 342.29094041564264, "train/loss": 2.1739585995674133, "l2_grads": 2.4375, "lr": 6.855343116068173e-05, "uptime": 180004.24625844, "examples_seen": 97587200.0, "progress": 0.8463362432617249, "epoch": 76.1705538778317, "img/sec/core": 546.1814644229626, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 49.979379126153326, "core_hours": 49.979379126153326} {"step": 95350, "l2_params": 342.29094041564264, "train/loss": 2.7651729583740234, "l2_grads": 2.109375, "lr": 6.816707731289177e-05, "uptime": 180100.163698385, "examples_seen": 97638400.0, "progress": 0.8467802811648002, "epoch": 76.21051744230066, "img/sec/core": 533.7923950988645, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 50.006022859471386, "core_hours": 50.006022859471386} {"step": 95400, "l2_params": 342.29094041564264, "train/loss": 2.241505980491638, "l2_grads": 2.421875, "lr": 6.778173559277724e-05, "uptime": 180193.43681461, "examples_seen": 97689600.0, "progress": 0.8472243190678757, "epoch": 76.2504810067696, "img/sec/core": 548.9255861945541, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 50.031932058422775, "core_hours": 50.031932058422775} {"step": 95450, "l2_params": 342.29094041564264, "train/loss": 2.727667987346649, "l2_grads": 2.125, "lr": 6.739740690350006e-05, "uptime": 180288.940949477, "examples_seen": 97740800.0, "progress": 0.847668356970951, "epoch": 76.29044457123857, "img/sec/core": 536.1024428031981, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 50.05846098477472, "core_hours": 50.05846098477472} {"step": 95500, "l2_params": 342.29094041564264, "train/loss": 3.884447455406189, "l2_grads": 1.984375, "lr": 6.701409214584782e-05, "uptime": 180384.42302387502, "examples_seen": 97792000.0, "progress": 0.8481123948740265, "epoch": 76.33040813570753, "img/sec/core": 536.2263055426436, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 50.08498378321861, "core_hours": 50.08498378321861} {"step": 95550, "l2_params": 342.29094041564264, "train/loss": 3.1738786697387695, "l2_grads": 2.21875, "lr": 6.663179221823136e-05, "uptime": 180477.617082377, "examples_seen": 97843200.0, "progress": 0.8485564327771018, "epoch": 76.37037170017648, "img/sec/core": 549.3912468563016, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 50.11087102169139, "core_hours": 50.11087102169139} {"step": 95600, "l2_params": 342.29094041564264, "train/loss": 2.248219668865204, "l2_grads": 2.234375, "lr": 6.625050801668354e-05, "uptime": 180572.639220048, "examples_seen": 97894400.0, "progress": 0.8490004706801773, "epoch": 76.41033526464544, "img/sec/core": 538.821807790377, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 50.13726605993334, "core_hours": 50.13726605993334} {"step": 95650, "l2_params": 342.29094041564264, "train/loss": 3.2080113291740417, "l2_grads": 1.9921875, "lr": 6.587024043485599e-05, "uptime": 180666.157380313, "examples_seen": 97945600.0, "progress": 0.8494445085832527, "epoch": 76.45029882911439, "img/sec/core": 547.4872458452708, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 50.163243326673616, "core_hours": 50.163243326673616} {"step": 95700, "l2_params": 342.29094041564264, "train/loss": 2.1809738874435425, "l2_grads": 2.34375, "lr": 6.549099036401783e-05, "uptime": 180761.330266738, "examples_seen": 97996800.0, "progress": 0.8498885464863281, "epoch": 76.49026239358335, "img/sec/core": 537.968342909864, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 50.18968023956945, "core_hours": 50.18968023956945} {"step": 95750, "l2_params": 342.29094041564264, "train/loss": 2.2342971563339233, "l2_grads": 2.40625, "lr": 6.511275869305346e-05, "uptime": 180855.976244903, "examples_seen": 98048000.0, "progress": 0.8503325843894035, "epoch": 76.53022595805231, "img/sec/core": 540.963292816717, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 50.21597078905972, "core_hours": 50.21597078905972} {"step": 95800, "l2_params": 342.29094041564264, "train/loss": 2.5066806077957153, "l2_grads": 2.125, "lr": 6.473554630845992e-05, "uptime": 180949.783515712, "examples_seen": 98099200.0, "progress": 0.8507766222924789, "epoch": 76.57018952252126, "img/sec/core": 545.7999103740868, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 50.24202836428445, "core_hours": 50.24202836428445} {"step": 95850, "l2_params": 342.29094041564264, "train/loss": 2.1508325934410095, "l2_grads": 2.328125, "lr": 6.435935409434594e-05, "uptime": 181044.370940436, "examples_seen": 98150400.0, "progress": 0.8512206601955543, "epoch": 76.61015308699022, "img/sec/core": 541.2981709715294, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 50.268302648929996, "core_hours": 50.268302648929996} {"step": 95900, "l2_params": 342.29094041564264, "train/loss": 2.1737610697746277, "l2_grads": 2.21875, "lr": 6.39841829324287e-05, "uptime": 181138.68310754502, "examples_seen": 98201600.0, "progress": 0.8516646980986297, "epoch": 76.65011665145917, "img/sec/core": 542.877993046388, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 50.29450047312695, "core_hours": 50.29450047312695} {"step": 95950, "l2_params": 342.29094041564264, "train/loss": 2.000598222017288, "l2_grads": 2.15625, "lr": 6.36100337020321e-05, "uptime": 181233.077503559, "examples_seen": 98252800.0, "progress": 0.8521087360017051, "epoch": 76.69008021592813, "img/sec/core": 542.4050808314191, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 50.32072113868639, "core_hours": 50.32072113868639} {"step": 96000, "l2_params": 342.29094041564264, "train/loss": 4.4276286363601685, "l2_grads": 1.984375, "lr": 6.323690728008544e-05, "uptime": 181327.387865405, "examples_seen": 98304000.0, "progress": 0.8525527739047805, "epoch": 76.7300437803971, "img/sec/core": 542.8883846676819, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 50.34691846142139, "core_hours": 50.34691846142139} {"step": 96050, "l2_params": 342.29094041564264, "train/loss": 2.142230600118637, "l2_grads": 2.234375, "lr": 6.286480454112006e-05, "uptime": 181421.525980207, "examples_seen": 98355200.0, "progress": 0.8529968118078559, "epoch": 76.77000734486604, "img/sec/core": 543.8817221663721, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 50.37306793775528, "core_hours": 50.37306793775528} {"step": 96100, "l2_params": 342.29094041564264, "train/loss": 4.698774814605713, "l2_grads": 2.109375, "lr": 6.249372635726878e-05, "uptime": 181516.113009293, "examples_seen": 98406400.0, "progress": 0.8534408497109314, "epoch": 76.80997090933501, "img/sec/core": 541.3004351097461, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 50.39934211250139, "core_hours": 50.39934211250139} {"step": 96150, "l2_params": 342.29094041564264, "train/loss": 2.097356766462326, "l2_grads": 2.3125, "lr": 6.21236735982623e-05, "uptime": 181609.722434631, "examples_seen": 98457600.0, "progress": 0.8538848876140067, "epoch": 76.84993447380396, "img/sec/core": 546.9534698577397, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 50.425344730650835, "core_hours": 50.425344730650835} {"step": 96200, "l2_params": 342.29094041564264, "train/loss": 2.133470892906189, "l2_grads": 2.375, "lr": 6.175464713142834e-05, "uptime": 181705.654030179, "examples_seen": 98508800.0, "progress": 0.8543289255170822, "epoch": 76.88989803827292, "img/sec/core": 533.7136290450094, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 50.45199239608083, "core_hours": 50.45199239608083} {"step": 96250, "l2_params": 342.29094041564264, "train/loss": 3.4231003522872925, "l2_grads": 2.09375, "lr": 6.13866478216894e-05, "uptime": 181799.822662198, "examples_seen": 98560000.0, "progress": 0.8547729634201575, "epoch": 76.92986160274188, "img/sec/core": 543.705466483347, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 50.47815034941945, "core_hours": 50.47815034941945} {"step": 96300, "l2_params": 342.29094041564264, "train/loss": 3.5888145565986633, "l2_grads": 2.046875, "lr": 6.101967653155976e-05, "uptime": 181893.872036331, "examples_seen": 98611200.0, "progress": 0.855217001323233, "epoch": 76.96982516721083, "img/sec/core": 544.3949039745432, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 50.5042751755675, "core_hours": 50.5042751755675} {"step": 96350, "l2_params": 342.29094041564264, "train/loss": 3.637322425842285, "l2_grads": 2.109375, "lr": 6.065373412114527e-05, "uptime": 181988.531435471, "examples_seen": 98662400.0, "progress": 0.8556610392263083, "epoch": 77.00978873167979, "img/sec/core": 540.8865940959914, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 50.53056945310639, "core_hours": 50.53056945310639} {"step": 96400, "l2_params": 342.29094041564264, "train/loss": 2.0817391872406006, "l2_grads": 2.3125, "lr": 6.028882144813961e-05, "uptime": 182082.847823683, "examples_seen": 98713600.0, "progress": 0.8561050771293838, "epoch": 77.04975229614874, "img/sec/core": 542.853696697075, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 50.55676844983194, "core_hours": 50.55676844983194} {"step": 96450, "l2_params": 342.29094041564264, "train/loss": 3.998414933681488, "l2_grads": 2.046875, "lr": 5.992493936782296e-05, "uptime": 182177.092723717, "examples_seen": 98764800.0, "progress": 0.8565491150324591, "epoch": 77.0897158606177, "img/sec/core": 543.2654709328773, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 50.58294758873028, "core_hours": 50.58294758873028} {"step": 96500, "l2_params": 342.29094041564264, "train/loss": 2.4341933727264404, "l2_grads": 2.140625, "lr": 5.956208873306049e-05, "uptime": 182271.748431657, "examples_seen": 98816000.0, "progress": 0.8569931529355346, "epoch": 77.12967942508666, "img/sec/core": 540.9076865439317, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 50.60924084093583, "core_hours": 50.60924084093583} {"step": 96550, "l2_params": 342.29094041564264, "train/loss": 2.2328789234161377, "l2_grads": 2.34375, "lr": 5.9200270394299225e-05, "uptime": 182366.200143887, "examples_seen": 98867200.0, "progress": 0.85743719083861, "epoch": 77.16964298955561, "img/sec/core": 542.0759326768926, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 50.63547742766639, "core_hours": 50.63547742766639} {"step": 96600, "l2_params": 342.29094041564264, "train/loss": 4.616406202316284, "l2_grads": 2.234375, "lr": 5.883948519956733e-05, "uptime": 182461.161321496, "examples_seen": 98918400.0, "progress": 0.8578812287416854, "epoch": 77.20960655402457, "img/sec/core": 539.1677029407267, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 50.66185553255778, "core_hours": 50.66185553255778} {"step": 96650, "l2_params": 342.29094041564264, "train/loss": 2.0510159134864807, "l2_grads": 2.171875, "lr": 5.847973399447081e-05, "uptime": 182554.528504773, "examples_seen": 98969600.0, "progress": 0.8583252666447608, "epoch": 77.24957011849352, "img/sec/core": 548.3725459308118, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 50.68779086124584, "core_hours": 50.68779086124584} {"step": 96700, "l2_params": 342.29094041564264, "train/loss": 4.762613296508789, "l2_grads": 2.171875, "lr": 5.8121017622193114e-05, "uptime": 182649.217847301, "examples_seen": 99020800.0, "progress": 0.8587693045478362, "epoch": 77.28953368296249, "img/sec/core": 540.7155508008751, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 50.7140934563925, "core_hours": 50.7140934563925} {"step": 96750, "l2_params": 342.29094041564264, "train/loss": 2.2503654956817627, "l2_grads": 2.421875, "lr": 5.776333692349144e-05, "uptime": 182743.937222545, "examples_seen": 99072000.0, "progress": 0.8592133424509116, "epoch": 77.32949724743145, "img/sec/core": 540.5441058718058, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 50.740404393960276, "core_hours": 50.740404393960276} {"step": 96800, "l2_params": 342.29094041564264, "train/loss": 2.572913110256195, "l2_grads": 2.296875, "lr": 5.7406692736695825e-05, "uptime": 182837.679769103, "examples_seen": 99123200.0, "progress": 0.859657380353987, "epoch": 77.3694608119004, "img/sec/core": 546.1767562322491, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 50.76644399022639, "core_hours": 50.76644399022639} {"step": 96850, "l2_params": 342.29094041564264, "train/loss": 2.1551490426063538, "l2_grads": 2.3125, "lr": 5.705108589770723e-05, "uptime": 182932.542735218, "examples_seen": 99174400.0, "progress": 0.8601014182570624, "epoch": 77.40942437636936, "img/sec/core": 539.7259024973893, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 50.79279481414722, "core_hours": 50.79279481414722} {"step": 96900, "l2_params": 342.29094041564264, "train/loss": 2.1777411699295044, "l2_grads": 2.421875, "lr": 5.6696517239994664e-05, "uptime": 183026.78119106402, "examples_seen": 99225600.0, "progress": 0.8605454561601378, "epoch": 77.44938794083832, "img/sec/core": 543.3026203619752, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 50.81897216299333, "core_hours": 50.81897216299333} {"step": 96950, "l2_params": 342.29094041564264, "train/loss": 2.059470236301422, "l2_grads": 2.375, "lr": 5.634298759459468e-05, "uptime": 183121.277801791, "examples_seen": 99276800.0, "progress": 0.8609894940632132, "epoch": 77.48935150530727, "img/sec/core": 541.8183742898855, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 50.84522122152861, "core_hours": 50.84522122152861} {"step": 97000, "l2_params": 342.29094041564264, "train/loss": 2.0202154517173767, "l2_grads": 2.296875, "lr": 5.5990497790108014e-05, "uptime": 183215.417713284, "examples_seen": 99328000.0, "progress": 0.8614335319662887, "epoch": 77.52931506977623, "img/sec/core": 543.8713420057716, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 50.87137119694333, "core_hours": 50.87137119694333} {"step": 97050, "l2_params": 342.29094041564264, "train/loss": 3.72368985414505, "l2_grads": 2.015625, "lr": 5.563904865269814e-05, "uptime": 183310.028496146, "examples_seen": 99379200.0, "progress": 0.861877569869364, "epoch": 77.56927863424518, "img/sec/core": 541.1645316864185, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 50.89765196996055, "core_hours": 50.89765196996055} {"step": 97100, "l2_params": 342.29094041564264, "train/loss": 4.643423557281494, "l2_grads": 2.109375, "lr": 5.528864100608995e-05, "uptime": 183403.25793537401, "examples_seen": 99430400.0, "progress": 0.8623216077724395, "epoch": 77.60924219871414, "img/sec/core": 549.182751971481, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 50.92354903641278, "core_hours": 50.92354903641278} {"step": 97150, "l2_params": 342.29094041564264, "train/loss": 2.1933164596557617, "l2_grads": 2.296875, "lr": 5.493927567156663e-05, "uptime": 183497.703453894, "examples_seen": 99481600.0, "progress": 0.8627656456755148, "epoch": 77.6492057631831, "img/sec/core": 542.1114818609682, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 50.94978390266833, "core_hours": 50.94978390266833} {"step": 97200, "l2_params": 342.29094041564264, "train/loss": 2.1810632050037384, "l2_grads": 2.265625, "lr": 5.4590953467969194e-05, "uptime": 183592.09252710402, "examples_seen": 99532800.0, "progress": 0.8632096835785903, "epoch": 77.68916932765205, "img/sec/core": 542.4356682270009, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 50.97600308967112, "core_hours": 50.97600308967112} {"step": 97250, "l2_params": 342.29094041564264, "train/loss": 4.691965222358704, "l2_grads": 2.109375, "lr": 5.424367521169318e-05, "uptime": 183686.868749965, "examples_seen": 99584000.0, "progress": 0.8636537214816656, "epoch": 77.72913289212102, "img/sec/core": 540.2198827346605, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 51.002329818243616, "core_hours": 51.002329818243616} {"step": 97300, "l2_params": 342.29094041564264, "train/loss": 2.2245829701423645, "l2_grads": 2.484375, "lr": 5.389744171668734e-05, "uptime": 183780.922325952, "examples_seen": 99635200.0, "progress": 0.8640977593847411, "epoch": 77.76909645658996, "img/sec/core": 544.3705830714914, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 51.02845581157333, "core_hours": 51.02845581157333} {"step": 97350, "l2_params": 342.29094041564264, "train/loss": 3.435669243335724, "l2_grads": 2.046875, "lr": 5.3552253794452134e-05, "uptime": 183875.938009821, "examples_seen": 99686400.0, "progress": 0.8645417972878164, "epoch": 77.80906002105893, "img/sec/core": 538.8584064773697, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 51.0548490570925, "core_hours": 51.0548490570925} {"step": 97400, "l2_params": 342.29094041564264, "train/loss": 4.199220895767212, "l2_grads": 2.03125, "lr": 5.320811225403677e-05, "uptime": 183970.397191133, "examples_seen": 99737600.0, "progress": 0.8649858351908919, "epoch": 77.84902358552789, "img/sec/core": 542.033069616414, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 51.08108771856806, "core_hours": 51.08108771856806} {"step": 97450, "l2_params": 342.29094041564264, "train/loss": 2.8701987266540527, "l2_grads": 2.1875, "lr": 5.2865017902038755e-05, "uptime": 184063.65480558, "examples_seen": 99788800.0, "progress": 0.8654298730939674, "epoch": 77.88898714999684, "img/sec/core": 549.0168315327612, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 51.10699261147, "core_hours": 51.10699261147} {"step": 97500, "l2_params": 342.29094041564264, "train/loss": 2.3611499071121216, "l2_grads": 2.296875, "lr": 5.252297154260067e-05, "uptime": 184157.918408452, "examples_seen": 99840000.0, "progress": 0.8658739109970427, "epoch": 77.9289507144658, "img/sec/core": 543.157681650719, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 51.133176945601114, "core_hours": 51.133176945601114, "val/acc@1": 0.6655173788265306, "val/loss": 1.3751786329916544, "z/secs/eval/val": 31.729153140011476} {"step": 97550, "l2_params": 342.29094041564264, "train/loss": 2.0750066339969635, "l2_grads": 2.265625, "lr": 5.218197397740876e-05, "uptime": 184282.551877775, "examples_seen": 99891200.0, "progress": 0.8663179489001182, "epoch": 77.96891427893475, "img/sec/core": 410.80457984616726, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 51.16779735374639, "core_hours": 51.16779735374639} {"step": 97601, "l2_params": 342.29094041564264, "train/loss": 2.96011745929718, "l2_grads": 2.09375, "lr": 5.1842026005691466e-05, "uptime": 184376.888104305, "examples_seen": 99942400.0, "progress": 0.8667619868031935, "epoch": 78.00887784340371, "img/sec/core": 542.7395379623401, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 51.19400186111583, "core_hours": 51.19400186111583} {"step": 97650, "l2_params": 342.29094041564264, "train/loss": 2.2327755093574524, "l2_grads": 2.296875, "lr": 5.15031284242168e-05, "uptime": 184471.243936306, "examples_seen": 99993600.0, "progress": 0.867206024706269, "epoch": 78.04884140787267, "img/sec/core": 542.6267662972508, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 51.22021181444945, "core_hours": 51.22021181444945} {"step": 97700, "l2_params": 342.29094041564264, "train/loss": 2.4023094177246094, "l2_grads": 2.296875, "lr": 5.116528202729123e-05, "uptime": 184565.595412656, "examples_seen": 100044800.0, "progress": 0.8676500626093443, "epoch": 78.08880497234162, "img/sec/core": 542.6518161738178, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 51.24642055788, "core_hours": 51.24642055788} {"step": 97750, "l2_params": 342.29094041564264, "train/loss": 4.719676852226257, "l2_grads": 2.09375, "lr": 5.0828487606757436e-05, "uptime": 184660.097299594, "examples_seen": 100096000.0, "progress": 0.8680941005124198, "epoch": 78.12876853681058, "img/sec/core": 541.7881235915512, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 51.27267108202944, "core_hours": 51.27267108202944} {"step": 97800, "l2_params": 342.29094041564264, "train/loss": 2.052795559167862, "l2_grads": 2.234375, "lr": 5.049274595199214e-05, "uptime": 184754.786264364, "examples_seen": 100147200.0, "progress": 0.8685381384154951, "epoch": 78.16873210127953, "img/sec/core": 540.7177079648573, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 51.298973572243334, "core_hours": 51.298973572243334} {"step": 97850, "l2_params": 342.29094041564264, "train/loss": 2.168622374534607, "l2_grads": 2.375, "lr": 5.0158057849904917e-05, "uptime": 184848.819048226, "examples_seen": 100198400.0, "progress": 0.8689821763185706, "epoch": 78.2086956657485, "img/sec/core": 544.4909519550113, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 51.32509378998278, "core_hours": 51.32509378998278} {"step": 97900, "l2_params": 342.29094041564264, "train/loss": 4.574453115463257, "l2_grads": 2.21875, "lr": 4.982442408493595e-05, "uptime": 184943.350774009, "examples_seen": 100249600.0, "progress": 0.869426214221646, "epoch": 78.24865923021746, "img/sec/core": 541.6171087103758, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 51.35135260270028, "core_hours": 51.35135260270028} {"step": 97950, "l2_params": 342.29094041564264, "train/loss": 2.3576200008392334, "l2_grads": 2.3125, "lr": 4.949184543905423e-05, "uptime": 185037.609627832, "examples_seen": 100300800.0, "progress": 0.8698702521247214, "epoch": 78.2886227946864, "img/sec/core": 543.1850475941176, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 51.377535617651105, "core_hours": 51.377535617651105} {"step": 98000, "l2_params": 342.29094041564264, "train/loss": 2.0696635842323303, "l2_grads": 2.390625, "lr": 4.916032269175589e-05, "uptime": 185130.778080825, "examples_seen": 100352000.0, "progress": 0.8703142900277968, "epoch": 78.32858635915537, "img/sec/core": 549.5422361885023, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 51.4034157434825, "core_hours": 51.4034157434825} {"step": 98050, "l2_params": 342.29094041564264, "train/loss": 2.2674010396003723, "l2_grads": 2.34375, "lr": 4.882985662006188e-05, "uptime": 185225.442950916, "examples_seen": 100403200.0, "progress": 0.8707583279308722, "epoch": 78.36854992362431, "img/sec/core": 540.8553347273788, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 51.42971154073, "core_hours": 51.42971154073} {"step": 98100, "l2_params": 342.29094041564264, "train/loss": 2.0783353447914124, "l2_grads": 2.28125, "lr": 4.850044799851716e-05, "uptime": 185319.748853425, "examples_seen": 100454400.0, "progress": 0.8712023658339476, "epoch": 78.40851348809328, "img/sec/core": 542.9140556193646, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 51.45590762476027, "core_hours": 51.45590762476027} {"step": 98150, "l2_params": 342.29094041564264, "train/loss": 3.0106412768363953, "l2_grads": 2.109375, "lr": 4.817209759918763e-05, "uptime": 185414.106860837, "examples_seen": 100505600.0, "progress": 0.871646403737023, "epoch": 78.44847705256224, "img/sec/core": 542.6142561112476, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 51.48211818237472, "core_hours": 51.48211818237472} {"step": 98200, "l2_params": 342.29094041564264, "train/loss": 2.3707927465438843, "l2_grads": 2.40625, "lr": 4.7844806191659334e-05, "uptime": 185508.44540772, "examples_seen": 100556800.0, "progress": 0.8720904416400984, "epoch": 78.48844061703119, "img/sec/core": 542.7261887285781, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 51.50832333428666, "core_hours": 51.50832333428666} {"step": 98250, "l2_params": 342.29094041564264, "train/loss": 2.727694034576416, "l2_grads": 2.09375, "lr": 4.751857454303605e-05, "uptime": 185602.041431953, "examples_seen": 100608000.0, "progress": 0.8725344795431738, "epoch": 78.52840418150015, "img/sec/core": 547.0317828088455, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 51.53432222990694, "core_hours": 51.53432222990694} {"step": 98300, "l2_params": 342.29094041564264, "train/loss": 2.578981041908264, "l2_grads": 2.140625, "lr": 4.719340341793751e-05, "uptime": 185696.836231347, "examples_seen": 100659200.0, "progress": 0.8729785174462492, "epoch": 78.5683677459691, "img/sec/core": 540.114018145587, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 51.560654118627504, "core_hours": 51.560654118627504} {"step": 98350, "l2_params": 342.29094041564264, "train/loss": 2.2078518867492676, "l2_grads": 2.296875, "lr": 4.6869293578498535e-05, "uptime": 185791.356099924, "examples_seen": 100710400.0, "progress": 0.8734225553493247, "epoch": 78.60833131043806, "img/sec/core": 541.6850527916446, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 51.58690963767667, "core_hours": 51.58690963767667} {"step": 98400, "l2_params": 342.29094041564264, "train/loss": 2.2256767749786377, "l2_grads": 2.375, "lr": 4.654624578436562e-05, "uptime": 185886.230082245, "examples_seen": 100761600.0, "progress": 0.8738665932524, "epoch": 78.64829487490702, "img/sec/core": 539.663232716225, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 51.61326352165472, "core_hours": 51.61326352165472} {"step": 98450, "l2_params": 342.29094041564264, "train/loss": 3.9040966033935547, "l2_grads": 2.03125, "lr": 4.6224260792696706e-05, "uptime": 185980.77218933, "examples_seen": 100812800.0, "progress": 0.8743106311554755, "epoch": 78.68825843937597, "img/sec/core": 541.557635836995, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 51.63952521806722, "core_hours": 51.63952521806722} {"step": 98500, "l2_params": 342.29094041564264, "train/loss": 3.3332828283309937, "l2_grads": 2.078125, "lr": 4.590333935815835e-05, "uptime": 186075.470538, "examples_seen": 100864000.0, "progress": 0.8747546690585508, "epoch": 78.72822200384493, "img/sec/core": 540.6641268731797, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 51.665830314919994, "core_hours": 51.665830314919994} {"step": 98550, "l2_params": 342.29094041564264, "train/loss": 3.8432633876800537, "l2_grads": 2.078125, "lr": 4.5583482232924336e-05, "uptime": 186170.02105674602, "examples_seen": 100915200.0, "progress": 0.8751987069616263, "epoch": 78.76818556831388, "img/sec/core": 541.5094563101385, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 51.692094347905005, "core_hours": 51.692094347905005} {"step": 98600, "l2_params": 342.29094041564264, "train/loss": 2.574362337589264, "l2_grads": 2.25, "lr": 4.526469016667435e-05, "uptime": 186264.283025477, "examples_seen": 100966400.0, "progress": 0.8756427448647016, "epoch": 78.80814913278284, "img/sec/core": 543.1670979217919, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 51.718278228108055, "core_hours": 51.718278228108055} {"step": 98650, "l2_params": 342.29094041564264, "train/loss": 2.133487105369568, "l2_grads": 2.296875, "lr": 4.494696390659133e-05, "uptime": 186357.79308048, "examples_seen": 101017600.0, "progress": 0.8760867827677771, "epoch": 78.8481126972518, "img/sec/core": 547.5347009297273, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 51.744253243386666, "core_hours": 51.744253243386666} {"step": 98701, "l2_params": 342.29094041564264, "train/loss": 2.048056125640869, "l2_grads": 2.40625, "lr": 4.463030419736049e-05, "uptime": 186452.166316087, "examples_seen": 101068800.0, "progress": 0.8765308206708524, "epoch": 78.88807626172076, "img/sec/core": 542.526699129139, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 51.77046803105528, "core_hours": 51.77046803105528} {"step": 98750, "l2_params": 342.29094041564264, "train/loss": 2.1477587819099426, "l2_grads": 2.296875, "lr": 4.4314711781167084e-05, "uptime": 186546.874659612, "examples_seen": 101120000.0, "progress": 0.8769748585739279, "epoch": 78.92803982618972, "img/sec/core": 540.6070689695392, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 51.79677590425667, "core_hours": 51.79677590425667} {"step": 98800, "l2_params": 342.29094041564264, "train/loss": 2.247831642627716, "l2_grads": 2.34375, "lr": 4.4000187397694786e-05, "uptime": 186640.176536043, "examples_seen": 101171200.0, "progress": 0.8774188964770033, "epoch": 78.96800339065867, "img/sec/core": 548.75638045563, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 51.82269309215417, "core_hours": 51.82269309215417} {"step": 98850, "l2_params": 342.29094041564264, "train/loss": 2.198529899120331, "l2_grads": 2.40625, "lr": 4.368673178412445e-05, "uptime": 186735.171924614, "examples_seen": 101222400.0, "progress": 0.8778629343800787, "epoch": 79.00796695512763, "img/sec/core": 538.9735309281227, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 51.84908070009055, "core_hours": 51.84908070009055} {"step": 98900, "l2_params": 342.29094041564264, "train/loss": 3.6656681299209595, "l2_grads": 2.0625, "lr": 4.3374345675131424e-05, "uptime": 186830.055972434, "examples_seen": 101273600.0, "progress": 0.8783069722831541, "epoch": 79.04793051959659, "img/sec/core": 539.6059841073505, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 51.87543738004056, "core_hours": 51.87543738004056} {"step": 98950, "l2_params": 342.29094041564264, "train/loss": 3.1943888068199158, "l2_grads": 2.09375, "lr": 4.306302980288472e-05, "uptime": 186923.293827991, "examples_seen": 101324800.0, "progress": 0.8787510101862295, "epoch": 79.08789408406554, "img/sec/core": 549.1331787301535, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 51.90133678436194, "core_hours": 51.90133678436194} {"step": 99000, "l2_params": 342.29094041564264, "train/loss": 3.018212080001831, "l2_grads": 2.0625, "lr": 4.2752784897044704e-05, "uptime": 187017.571258164, "examples_seen": 101376000.0, "progress": 0.8791950480893049, "epoch": 79.1278576485345, "img/sec/core": 543.0780188433464, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 51.92752495941, "core_hours": 51.92752495941} {"step": 99050, "l2_params": 342.29094041564264, "train/loss": 2.233436644077301, "l2_grads": 2.421875, "lr": 4.244361168476169e-05, "uptime": 187111.664784735, "examples_seen": 101427200.0, "progress": 0.8796390859923803, "epoch": 79.16782121300346, "img/sec/core": 544.1394521584474, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 51.95366205012417, "core_hours": 51.95366205012417} {"step": 99100, "l2_params": 342.29094041564264, "train/loss": 2.4008631706237793, "l2_grads": 2.453125, "lr": 4.213551089067431e-05, "uptime": 187205.846856665, "examples_seen": 101478400.0, "progress": 0.8800831238954557, "epoch": 79.20778477747241, "img/sec/core": 543.627878966745, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 51.979823736771394, "core_hours": 51.979823736771394} {"step": 99150, "l2_params": 342.29094041564264, "train/loss": 4.194733262062073, "l2_grads": 1.9453125, "lr": 4.1828483236907324e-05, "uptime": 187300.410776314, "examples_seen": 101529600.0, "progress": 0.8805271617985311, "epoch": 79.24774834194137, "img/sec/core": 541.432717573957, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 52.006091492229444, "core_hours": 52.006091492229444} {"step": 99200, "l2_params": 342.29094041564264, "train/loss": 3.8354318141937256, "l2_grads": 1.953125, "lr": 4.1522529443070805e-05, "uptime": 187395.202161752, "examples_seen": 101580800.0, "progress": 0.8809711997016065, "epoch": 79.28771190641032, "img/sec/core": 540.1334706041099, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 52.03242243262889, "core_hours": 52.03242243262889} {"step": 99250, "l2_params": 342.29094041564264, "train/loss": 4.032051622867584, "l2_grads": 2.015625, "lr": 4.121765022625736e-05, "uptime": 187489.417235291, "examples_seen": 101632000.0, "progress": 0.881415237604682, "epoch": 79.32767547087929, "img/sec/core": 543.4374572642527, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 52.05859328638972, "core_hours": 52.05859328638972} {"step": 99300, "l2_params": 342.29094041564264, "train/loss": 4.367904305458069, "l2_grads": 2.0625, "lr": 4.0913846301041304e-05, "uptime": 187583.480224488, "examples_seen": 101683200.0, "progress": 0.8818592755077573, "epoch": 79.36763903534825, "img/sec/core": 544.3161060166675, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 52.08472189450001, "core_hours": 52.08472189450001} {"step": 99350, "l2_params": 342.29094041564264, "train/loss": 2.3746777176856995, "l2_grads": 2.40625, "lr": 4.0611118379476755e-05, "uptime": 187677.99535836, "examples_seen": 101734400.0, "progress": 0.8823033134108328, "epoch": 79.4076025998172, "img/sec/core": 541.7121883289685, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 52.11097609835333, "core_hours": 52.11097609835333} {"step": 99400, "l2_params": 342.29094041564264, "train/loss": 2.1774969696998596, "l2_grads": 2.1875, "lr": 4.030946717109555e-05, "uptime": 187773.010713809, "examples_seen": 101785600.0, "progress": 0.8827473513139081, "epoch": 79.44756616428616, "img/sec/core": 538.8602690381391, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 52.13736925264472, "core_hours": 52.13736925264472} {"step": 99450, "l2_params": 342.29094041564264, "train/loss": 1.9682146906852722, "l2_grads": 2.203125, "lr": 4.000889338290647e-05, "uptime": 187866.81652244402, "examples_seen": 101836800.0, "progress": 0.8831913892169836, "epoch": 79.4875297287551, "img/sec/core": 545.8084178902882, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 52.16342642171001, "core_hours": 52.16342642171001} {"step": 99500, "l2_params": 342.29094041564264, "train/loss": 3.0978786945343018, "l2_grads": 2.03125, "lr": 3.970939771939241e-05, "uptime": 187961.67788371802, "examples_seen": 101888000.0, "progress": 0.8836354271200589, "epoch": 79.52749329322407, "img/sec/core": 539.7350334464638, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 52.18977679984167, "core_hours": 52.18977679984167} {"step": 99550, "l2_params": 342.29094041564264, "train/loss": 2.7218146324157715, "l2_grads": 2.1875, "lr": 3.941098088251004e-05, "uptime": 188055.175830131, "examples_seen": 101939200.0, "progress": 0.8840794650231344, "epoch": 79.56745685769303, "img/sec/core": 547.6056102222208, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 52.21574845162306, "core_hours": 52.21574845162306} {"step": 99600, "l2_params": 342.29094041564264, "train/loss": 4.561155080795288, "l2_grads": 2.1875, "lr": 3.911364357168688e-05, "uptime": 188150.34093165302, "examples_seen": 101990400.0, "progress": 0.8845235029262097, "epoch": 79.60742042216198, "img/sec/core": 538.0123509682728, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 52.24218320204584, "core_hours": 52.24218320204584} {"step": 99650, "l2_params": 342.29094041564264, "train/loss": 2.455418109893799, "l2_grads": 2.328125, "lr": 3.8817386483820416e-05, "uptime": 188244.62680369001, "examples_seen": 102041600.0, "progress": 0.8849675408292852, "epoch": 79.64738398663094, "img/sec/core": 543.029394477135, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 52.26837372205612, "core_hours": 52.26837372205612} {"step": 99700, "l2_params": 342.29094041564264, "train/loss": 2.2310438752174377, "l2_grads": 2.296875, "lr": 3.8522210313276785e-05, "uptime": 188339.173338324, "examples_seen": 102092800.0, "progress": 0.8854115787323606, "epoch": 79.68734755109989, "img/sec/core": 541.5322750665098, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 52.294636648343335, "core_hours": 52.294636648343335} {"step": 99750, "l2_params": 342.29094041564264, "train/loss": 2.161039352416992, "l2_grads": 2.234375, "lr": 3.822811575188805e-05, "uptime": 188434.163011973, "examples_seen": 102144000.0, "progress": 0.885855616635436, "epoch": 79.72731111556885, "img/sec/core": 539.0059575233039, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 52.32102266880138, "core_hours": 52.32102266880138} {"step": 99800, "l2_params": 342.29094041564264, "train/loss": 2.4898016452789307, "l2_grads": 2.21875, "lr": 3.7935103488951534e-05, "uptime": 188527.841457611, "examples_seen": 102195200.0, "progress": 0.8862996545385114, "epoch": 79.76727468003781, "img/sec/core": 546.550486094152, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 52.34704445925639, "core_hours": 52.34704445925639} {"step": 99850, "l2_params": 342.29094041564264, "train/loss": 2.103590488433838, "l2_grads": 2.34375, "lr": 3.764317421122778e-05, "uptime": 188621.818393983, "examples_seen": 102246400.0, "progress": 0.8867436924415868, "epoch": 79.80723824450676, "img/sec/core": 544.8145255270999, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 52.37314916380417, "core_hours": 52.37314916380417} {"step": 99900, "l2_params": 342.29094041564264, "train/loss": 2.8039937019348145, "l2_grads": 2.09375, "lr": 3.7352328602938904e-05, "uptime": 188717.054665615, "examples_seen": 102297600.0, "progress": 0.8871877303446623, "epoch": 79.84720180897573, "img/sec/core": 537.6102940888455, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 52.39960368370194, "core_hours": 52.39960368370194} {"step": 99950, "l2_params": 342.29094041564264, "train/loss": 2.117263972759247, "l2_grads": 2.375, "lr": 3.706256734576766e-05, "uptime": 188811.042688309, "examples_seen": 102348800.0, "progress": 0.8876317682477376, "epoch": 79.88716537344467, "img/sec/core": 544.7502621337768, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 52.425711467783614, "core_hours": 52.425711467783614} {"step": 100000, "l2_params": 342.29094041564264, "train/loss": 2.764780282974243, "l2_grads": 2.203125, "lr": 3.67738911188545e-05, "uptime": 188905.800632261, "examples_seen": 102400000.0, "progress": 0.888075806150813, "epoch": 79.92712893791364, "img/sec/core": 540.324091729351, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 52.452033118881396, "core_hours": 52.452033118881396, "val/acc@1": 0.6655970982142857, "val/loss": 1.3752036283210831, "z/secs/eval/val": 31.67971892800415} {"step": 100050, "l2_params": 342.29094041564264, "train/loss": 2.2377781867980957, "l2_grads": 2.28125, "lr": 3.648630059879748e-05, "uptime": 189030.55301922, "examples_seen": 102451200.0, "progress": 0.8885198440538884, "epoch": 79.9670925023826, "img/sec/core": 410.4129888658865, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 52.48668655970334, "core_hours": 52.48668655970334} {"step": 100100, "l2_params": 342.29094041564264, "train/loss": 2.737166106700897, "l2_grads": 2.234375, "lr": 3.619979645964959e-05, "uptime": 189123.689337782, "examples_seen": 102502400.0, "progress": 0.8889638819569639, "epoch": 80.00705606685155, "img/sec/core": 549.7318424274735, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 52.512557759303895, "core_hours": 52.512557759303895} {"step": 100150, "l2_params": 342.29094041564264, "train/loss": 4.219680070877075, "l2_grads": 2.09375, "lr": 3.591437937291769e-05, "uptime": 189218.253945731, "examples_seen": 102553600.0, "progress": 0.8894079198600392, "epoch": 80.04701963132051, "img/sec/core": 541.428776690059, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 52.538825705956384, "core_hours": 52.538825705956384} {"step": 100200, "l2_params": 342.29094041564264, "train/loss": 3.895188808441162, "l2_grads": 2.046875, "lr": 3.56300500075608e-05, "uptime": 189312.392692655, "examples_seen": 102604800.0, "progress": 0.8898519577631147, "epoch": 80.08698319578946, "img/sec/core": 543.8780701142624, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 52.56497535787972, "core_hours": 52.56497535787972} {"step": 100250, "l2_params": 342.29094041564264, "train/loss": 2.251760959625244, "l2_grads": 2.421875, "lr": 3.53468090299886e-05, "uptime": 189406.897424902, "examples_seen": 102656000.0, "progress": 0.8902959956661901, "epoch": 80.12694676025842, "img/sec/core": 541.7718116610225, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 52.59122667239278, "core_hours": 52.59122667239278} {"step": 100300, "l2_params": 342.29094041564264, "train/loss": 2.153879940509796, "l2_grads": 2.28125, "lr": 3.506465710405989e-05, "uptime": 189500.134061562, "examples_seen": 102707200.0, "progress": 0.8907400335692655, "epoch": 80.16691032472738, "img/sec/core": 549.1403576332956, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 52.61712573813167, "core_hours": 52.61712573813167} {"step": 100350, "l2_params": 342.29094041564264, "train/loss": 2.1685265600681305, "l2_grads": 2.328125, "lr": 3.478359489108062e-05, "uptime": 189594.997406614, "examples_seen": 102758400.0, "progress": 0.8911840714723409, "epoch": 80.20687388919633, "img/sec/core": 539.7237465317588, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 52.64347666731278, "core_hours": 52.64347666731278} {"step": 100400, "l2_params": 342.29094041564264, "train/loss": 2.3020854592323303, "l2_grads": 2.28125, "lr": 3.450362304980286e-05, "uptime": 189688.25686431202, "examples_seen": 102809600.0, "progress": 0.8916281093754163, "epoch": 80.2468374536653, "img/sec/core": 549.0059803456858, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 52.66938207222889, "core_hours": 52.66938207222889} {"step": 100450, "l2_params": 342.29094041564264, "train/loss": 2.2182650566101074, "l2_grads": 2.296875, "lr": 3.4224742236423354e-05, "uptime": 189783.663668972, "examples_seen": 102860800.0, "progress": 0.8920721472784917, "epoch": 80.28680101813424, "img/sec/core": 536.6493530777844, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 52.695883962412225, "core_hours": 52.695883962412225} {"step": 100500, "l2_params": 342.29094041564264, "train/loss": 4.580095410346985, "l2_grads": 2.21875, "lr": 3.394695310458112e-05, "uptime": 189876.87579492, "examples_seen": 102912000.0, "progress": 0.8925161851815671, "epoch": 80.3267645826032, "img/sec/core": 549.2847575278812, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 52.72177621962, "core_hours": 52.72177621962} {"step": 100550, "l2_params": 342.29094041564264, "train/loss": 2.0240637063980103, "l2_grads": 2.3125, "lr": 3.367025630535719e-05, "uptime": 189972.202550356, "examples_seen": 102963200.0, "progress": 0.8929602230846425, "epoch": 80.36672814707217, "img/sec/core": 537.0999963841545, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 52.74825587390778, "core_hours": 52.74825587390778} {"step": 100600, "l2_params": 342.29094041564264, "train/loss": 2.171779155731201, "l2_grads": 2.25, "lr": 3.3394652487271765e-05, "uptime": 190066.43495295302, "examples_seen": 103014400.0, "progress": 0.8934042609877179, "epoch": 80.40669171154111, "img/sec/core": 543.337520735457, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 52.77443154129583, "core_hours": 52.77443154129583} {"step": 100650, "l2_params": 342.29094041564264, "train/loss": 2.1588340997695923, "l2_grads": 2.296875, "lr": 3.3120142296283624e-05, "uptime": 190159.695198673, "examples_seen": 103065600.0, "progress": 0.8938482988907933, "epoch": 80.44665527601008, "img/sec/core": 549.0013414046734, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 52.800337165106946, "core_hours": 52.800337165106946} {"step": 100700, "l2_params": 342.29094041564264, "train/loss": 3.4574629068374634, "l2_grads": 1.96875, "lr": 3.284672637578841e-05, "uptime": 190254.372916062, "examples_seen": 103116800.0, "progress": 0.8942923367938688, "epoch": 80.48661884047903, "img/sec/core": 540.7819433333791, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 52.82663653104833, "core_hours": 52.82663653104833} {"step": 100750, "l2_params": 342.29094041564264, "train/loss": 4.521859884262085, "l2_grads": 2.140625, "lr": 3.257440536661664e-05, "uptime": 190347.600720421, "examples_seen": 103168000.0, "progress": 0.8947363746969441, "epoch": 80.52658240494799, "img/sec/core": 549.1923825948448, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 52.85253314337027, "core_hours": 52.85253314337027} {"step": 100800, "l2_params": 342.29094041564264, "train/loss": 2.3193970322608948, "l2_grads": 2.328125, "lr": 3.2303179907033165e-05, "uptime": 190441.989202615, "examples_seen": 103219200.0, "progress": 0.8951804126000196, "epoch": 80.56654596941695, "img/sec/core": 542.4390647025575, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 52.87875216620194, "core_hours": 52.87875216620194} {"step": 100850, "l2_params": 342.29094041564264, "train/loss": 2.139205276966095, "l2_grads": 2.25, "lr": 3.203305063273452e-05, "uptime": 190535.242564506, "examples_seen": 103270400.0, "progress": 0.8956244505030949, "epoch": 80.6065095338859, "img/sec/core": 549.0418678935403, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 52.90465587783834, "core_hours": 52.90465587783834} {"step": 100900, "l2_params": 342.29094041564264, "train/loss": 2.2140763998031616, "l2_grads": 2.25, "lr": 3.176401817684824e-05, "uptime": 190630.703810144, "examples_seen": 103321600.0, "progress": 0.8960684884061704, "epoch": 80.64647309835486, "img/sec/core": 536.343305158171, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 52.931172890515555, "core_hours": 52.931172890515555} {"step": 100950, "l2_params": 342.29094041564264, "train/loss": 2.180727928876877, "l2_grads": 2.359375, "lr": 3.149608316993129e-05, "uptime": 190723.795046587, "examples_seen": 103372800.0, "progress": 0.8965125263092457, "epoch": 80.68643666282382, "img/sec/core": 549.9980659441729, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 52.95703156730528, "core_hours": 52.95703156730528} {"step": 101000, "l2_params": 342.29094041564264, "train/loss": 3.5622392892837524, "l2_grads": 1.984375, "lr": 3.122924623996804e-05, "uptime": 190818.158584105, "examples_seen": 103424000.0, "progress": 0.8969565642123212, "epoch": 80.72640022729277, "img/sec/core": 542.5824566002556, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 52.98324366106028, "core_hours": 52.98324366106028} {"step": 101050, "l2_params": 342.29094041564264, "train/loss": 3.8342286944389343, "l2_grads": 1.9140625, "lr": 3.096350801236979e-05, "uptime": 190911.659676139, "examples_seen": 103475200.0, "progress": 0.8974006021153965, "epoch": 80.76636379176173, "img/sec/core": 547.5871873386733, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 53.00921618662528, "core_hours": 53.00921618662528} {"step": 101101, "l2_params": 342.29094041564264, "train/loss": 2.169910192489624, "l2_grads": 2.484375, "lr": 3.0698869109972145e-05, "uptime": 191005.227073181, "examples_seen": 103526400.0, "progress": 0.897844640018472, "epoch": 80.80632735623068, "img/sec/core": 547.1991486202827, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 53.03520713024806, "core_hours": 53.03520713024806} {"step": 101150, "l2_params": 342.29094041564264, "train/loss": 3.6074753999710083, "l2_grads": 2.09375, "lr": 3.043533015303427e-05, "uptime": 191099.832232595, "examples_seen": 103577600.0, "progress": 0.8982886779215474, "epoch": 80.84629092069964, "img/sec/core": 541.1966991773052, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 53.06148634119639, "core_hours": 53.06148634119639} {"step": 101200, "l2_params": 342.29094041564264, "train/loss": 2.7356841564178467, "l2_grads": 2.109375, "lr": 3.0172891759237524e-05, "uptime": 191193.805679323, "examples_seen": 103628800.0, "progress": 0.8987327158246228, "epoch": 80.8862544851686, "img/sec/core": 544.8347568670038, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 53.087590076398605, "core_hours": 53.087590076398605} {"step": 101250, "l2_params": 342.29094041564264, "train/loss": 2.1559940576553345, "l2_grads": 2.328125, "lr": 2.9911554543683467e-05, "uptime": 191287.00967534, "examples_seen": 103680000.0, "progress": 0.8991767537276982, "epoch": 80.92621804963755, "img/sec/core": 549.332670142867, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 53.11348007529222, "core_hours": 53.11348007529222} {"step": 101300, "l2_params": 342.29094041564264, "train/loss": 4.742226839065552, "l2_grads": 2.171875, "lr": 2.9651319118892933e-05, "uptime": 191380.941094513, "examples_seen": 103731200.0, "progress": 0.8996207916307736, "epoch": 80.96618161410652, "img/sec/core": 545.0785312388913, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 53.139572136173605, "core_hours": 53.139572136173605} {"step": 101350, "l2_params": 342.29094041564264, "train/loss": 1.9690950214862823, "l2_grads": 2.1875, "lr": 2.9392186094804333e-05, "uptime": 191474.794267979, "examples_seen": 103782400.0, "progress": 0.900064829533849, "epoch": 81.00614517857547, "img/sec/core": 545.5329650471189, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 53.16564246213639, "core_hours": 53.16564246213639} {"step": 101400, "l2_params": 342.29094041564264, "train/loss": 2.014261156320572, "l2_grads": 2.3125, "lr": 2.9134156078772193e-05, "uptime": 191569.267859187, "examples_seen": 103833600.0, "progress": 0.9005088674369244, "epoch": 81.04610874304443, "img/sec/core": 541.9503942353424, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 53.19188512636084, "core_hours": 53.19188512636084} {"step": 101450, "l2_params": 342.29094041564264, "train/loss": 2.2271395921707153, "l2_grads": 2.203125, "lr": 2.887722967556594e-05, "uptime": 191662.420462326, "examples_seen": 103884800.0, "progress": 0.9009529053399998, "epoch": 81.08607230751339, "img/sec/core": 549.6357404376928, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 53.217760849455, "core_hours": 53.217760849455} {"step": 101500, "l2_params": 342.29094041564264, "train/loss": 2.1036284267902374, "l2_grads": 2.3125, "lr": 2.862140748736813e-05, "uptime": 191756.371190092, "examples_seen": 103936000.0, "progress": 0.9013969432430752, "epoch": 81.12603587198234, "img/sec/core": 544.9665076306958, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 53.24385827383445, "core_hours": 53.24385827383445} {"step": 101550, "l2_params": 342.29094041564264, "train/loss": 2.321183443069458, "l2_grads": 2.234375, "lr": 2.8366690113773692e-05, "uptime": 191851.045263222, "examples_seen": 103987200.0, "progress": 0.9018409811461506, "epoch": 81.1659994364513, "img/sec/core": 540.8027594808443, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 53.27015662748167, "core_hours": 53.27015662748167} {"step": 101600, "l2_params": 342.29094041564264, "train/loss": 2.1532645225524902, "l2_grads": 2.34375, "lr": 2.8113078151787532e-05, "uptime": 191944.364417408, "examples_seen": 104038400.0, "progress": 0.9022850190492261, "epoch": 81.20596300092025, "img/sec/core": 548.6547798959944, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 53.29607861475556, "core_hours": 53.29607861475556} {"step": 101650, "l2_params": 342.29094041564264, "train/loss": 2.896084427833557, "l2_grads": 2.171875, "lr": 2.7860572195824153e-05, "uptime": 192038.741412831, "examples_seen": 104089600.0, "progress": 0.9027290569523014, "epoch": 81.24592656538921, "img/sec/core": 542.5050858053249, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 53.3222944468175, "core_hours": 53.3222944468175} {"step": 101700, "l2_params": 342.29094041564264, "train/loss": 4.24149751663208, "l2_grads": 2.0, "lr": 2.7609172837705807e-05, "uptime": 192131.97329672, "examples_seen": 104140800.0, "progress": 0.9031730948553769, "epoch": 81.28589012985817, "img/sec/core": 549.1683516870087, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 53.348192192342225, "core_hours": 53.348192192342225} {"step": 101750, "l2_params": 342.29094041564264, "train/loss": 2.138271987438202, "l2_grads": 2.34375, "lr": 2.735888066666064e-05, "uptime": 192225.224815255, "examples_seen": 104192000.0, "progress": 0.9036171327584522, "epoch": 81.32585369432712, "img/sec/core": 549.0527211177584, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 53.37409539193528, "core_hours": 53.37409539193528} {"step": 101800, "l2_params": 342.29094041564264, "train/loss": 4.604807734489441, "l2_grads": 2.0, "lr": 2.7109696269322343e-05, "uptime": 192320.56534183602, "examples_seen": 104243200.0, "progress": 0.9040611706615277, "epoch": 81.36581725879608, "img/sec/core": 537.0224167630699, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 53.400578871541114, "core_hours": 53.400578871541114} {"step": 101850, "l2_params": 342.29094041564264, "train/loss": 4.700582146644592, "l2_grads": 2.140625, "lr": 2.6861620229727856e-05, "uptime": 192413.74485830602, "examples_seen": 104294400.0, "progress": 0.904505208564603, "epoch": 81.40578082326503, "img/sec/core": 549.4769874287066, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 53.42646207056056, "core_hours": 53.42646207056056} {"step": 101900, "l2_params": 342.29094041564264, "train/loss": 2.138647735118866, "l2_grads": 2.296875, "lr": 2.661465312931634e-05, "uptime": 192508.109944926, "examples_seen": 104345600.0, "progress": 0.9049492464676785, "epoch": 81.445744387734, "img/sec/core": 542.5735495394763, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 53.45267459462166, "core_hours": 53.45267459462166} {"step": 101950, "l2_params": 342.29094041564264, "train/loss": 2.1377804279327393, "l2_grads": 2.40625, "lr": 2.636879554692824e-05, "uptime": 192601.367688668, "examples_seen": 104396800.0, "progress": 0.9053932843707538, "epoch": 81.48570795220296, "img/sec/core": 549.0160703613835, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 53.47857952343888, "core_hours": 53.47857952343888} {"step": 102000, "l2_params": 342.29094041564264, "train/loss": 4.7841304540634155, "l2_grads": 2.125, "lr": 2.6124048058803047e-05, "uptime": 192694.782100175, "examples_seen": 104448000.0, "progress": 0.9058373222738293, "epoch": 81.5256715166719, "img/sec/core": 548.0953010783642, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 53.504527971079725, "core_hours": 53.504527971079725} {"step": 102050, "l2_params": 342.29094041564264, "train/loss": 2.0541513562202454, "l2_grads": 2.359375, "lr": 2.5880411238578685e-05, "uptime": 192788.431426881, "examples_seen": 104499200.0, "progress": 0.9062813601769047, "epoch": 81.56563508114087, "img/sec/core": 546.7204282284272, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 53.5305416729425, "core_hours": 53.5305416729425} {"step": 102100, "l2_params": 342.29094041564264, "train/loss": 4.209516525268555, "l2_grads": 1.96875, "lr": 2.5637885657289618e-05, "uptime": 192882.770410146, "examples_seen": 104550400.0, "progress": 0.9067253980799801, "epoch": 81.60559864560982, "img/sec/core": 542.7236782504939, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 53.55674694607167, "core_hours": 53.55674694607167} {"step": 102150, "l2_params": 342.29094041564264, "train/loss": 2.3729456067085266, "l2_grads": 2.296875, "lr": 2.5396471883366287e-05, "uptime": 192977.511123482, "examples_seen": 104601600.0, "progress": 0.9071694359830555, "epoch": 81.64556221007878, "img/sec/core": 540.4223611704114, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 53.58306381088722, "core_hours": 53.58306381088722} {"step": 102200, "l2_params": 342.29094041564264, "train/loss": 2.228968560695648, "l2_grads": 2.296875, "lr": 2.5156170482632834e-05, "uptime": 193071.095501986, "examples_seen": 104652800.0, "progress": 0.9076134738861309, "epoch": 81.68552577454774, "img/sec/core": 547.0998559636834, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 53.60905947158278, "core_hours": 53.60905947158278} {"step": 102250, "l2_params": 342.29094041564264, "train/loss": 2.12504643201828, "l2_grads": 2.40625, "lr": 2.491698201830637e-05, "uptime": 193164.846946235, "examples_seen": 104704000.0, "progress": 0.9080575117892064, "epoch": 81.72548933901669, "img/sec/core": 546.1249201028547, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 53.63510153942972, "core_hours": 53.63510153942972} {"step": 102300, "l2_params": 342.29094041564264, "train/loss": 2.1827574372291565, "l2_grads": 2.375, "lr": 2.4678907050995664e-05, "uptime": 193259.020684864, "examples_seen": 104755200.0, "progress": 0.9085015496922817, "epoch": 81.76545290348565, "img/sec/core": 543.6759838292234, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 53.661260911271114, "core_hours": 53.661260911271114} {"step": 102350, "l2_params": 342.29094041564264, "train/loss": 2.7182796001434326, "l2_grads": 2.34375, "lr": 2.4441946138699314e-05, "uptime": 193353.472821762, "examples_seen": 104806400.0, "progress": 0.9089455875953572, "epoch": 81.8054164679546, "img/sec/core": 542.073495439159, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 53.68749761596499, "core_hours": 53.68749761596499} {"step": 102400, "l2_params": 342.29094041564264, "train/loss": 2.06887549161911, "l2_grads": 2.234375, "lr": 2.4206099836805217e-05, "uptime": 193447.910736447, "examples_seen": 104857600.0, "progress": 0.9093896254984325, "epoch": 81.84538003242356, "img/sec/core": 542.1551309215216, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 53.71373037004416, "core_hours": 53.71373037004416} {"step": 102450, "l2_params": 342.29094041564264, "train/loss": 3.8250216245651245, "l2_grads": 2.046875, "lr": 2.3971368698088642e-05, "uptime": 193542.491710807, "examples_seen": 104908800.0, "progress": 0.909833663401508, "epoch": 81.88534359689253, "img/sec/core": 541.3350871721959, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 53.74000286292195, "core_hours": 53.74000286292195} {"step": 102500, "l2_params": 342.29094041564264, "train/loss": 2.0385018587112427, "l2_grads": 2.171875, "lr": 2.3737753272711056e-05, "uptime": 193635.738959576, "examples_seen": 104960000.0, "progress": 0.9102777013045834, "epoch": 81.92530716136147, "img/sec/core": 549.0778620914746, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 53.76590487646889, "core_hours": 53.76590487646889, "val/acc@1": 0.6653380102040817, "val/loss": 1.3750918677874975, "z/secs/eval/val": 31.77661646998604} {"step": 102550, "l2_params": 342.29094041564264, "train/loss": 2.8881337642669678, "l2_grads": 2.125, "lr": 2.3505254108219143e-05, "uptime": 193760.491953043, "examples_seen": 105011200.0, "progress": 0.9107217392076588, "epoch": 81.96527072583044, "img/sec/core": 410.4109935730141, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 53.80055848576528, "core_hours": 53.80055848576528} {"step": 102600, "l2_params": 342.29094041564264, "train/loss": 4.4630889892578125, "l2_grads": 2.046875, "lr": 2.3273871749543106e-05, "uptime": 193853.899131516, "examples_seen": 105062400.0, "progress": 0.9111657771107342, "epoch": 82.00523429029938, "img/sec/core": 548.1377431265146, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 53.82650492423, "core_hours": 53.82650492423} {"step": 102650, "l2_params": 342.29094041564264, "train/loss": 2.1395143568515778, "l2_grads": 2.4375, "lr": 2.304360673899582e-05, "uptime": 193948.314047472, "examples_seen": 105113600.0, "progress": 0.9116098150138096, "epoch": 82.04519785476835, "img/sec/core": 542.2871956361065, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 53.85273128977334, "core_hours": 53.85273128977334} {"step": 102700, "l2_params": 342.29094041564264, "train/loss": 2.039723813533783, "l2_grads": 2.171875, "lr": 2.281445961627094e-05, "uptime": 194042.11479870402, "examples_seen": 105164800.0, "progress": 0.912053852916885, "epoch": 82.08516141923731, "img/sec/core": 545.8378459395882, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 53.87878705400445, "core_hours": 53.87878705400445} {"step": 102750, "l2_params": 342.29094041564264, "train/loss": 2.2452170848846436, "l2_grads": 2.296875, "lr": 2.2586430918442426e-05, "uptime": 194135.838120734, "examples_seen": 105216000.0, "progress": 0.9124978908199604, "epoch": 82.12512498370626, "img/sec/core": 546.2887880096807, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 53.904821310123886, "core_hours": 53.904821310123886} {"step": 102800, "l2_params": 342.29094041564264, "train/loss": 4.068678557872772, "l2_grads": 2.046875, "lr": 2.2359521179962716e-05, "uptime": 194230.31769440701, "examples_seen": 105267200.0, "progress": 0.9129419287230358, "epoch": 82.16508854817522, "img/sec/core": 541.9160778307283, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 53.93106563614417, "core_hours": 53.93106563614417} {"step": 102850, "l2_params": 342.29094041564264, "train/loss": 3.556091785430908, "l2_grads": 2.0, "lr": 2.213373093266157e-05, "uptime": 194323.788068303, "examples_seen": 105318400.0, "progress": 0.9133859666261112, "epoch": 82.20505211264418, "img/sec/core": 547.7671465931963, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 53.957029628893046, "core_hours": 53.957029628893046} {"step": 102900, "l2_params": 342.29094041564264, "train/loss": 2.1223293244838715, "l2_grads": 2.34375, "lr": 2.1909060705744993e-05, "uptime": 194419.13852780202, "examples_seen": 105369600.0, "progress": 0.9138300045291866, "epoch": 82.24501567711313, "img/sec/core": 536.9664736699542, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 53.98351586764279, "core_hours": 53.98351586764279} {"step": 102950, "l2_params": 342.29094041564264, "train/loss": 2.7806422114372253, "l2_grads": 2.046875, "lr": 2.168551102579386e-05, "uptime": 194512.25435325102, "examples_seen": 105420800.0, "progress": 0.9142740424322621, "epoch": 82.28497924158209, "img/sec/core": 549.8528284866296, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 54.00938137471194, "core_hours": 54.00938137471194} {"step": 103000, "l2_params": 342.29094041564264, "train/loss": 3.81102591753006, "l2_grads": 2.015625, "lr": 2.146308241676249e-05, "uptime": 194605.567076287, "examples_seen": 105472000.0, "progress": 0.9147180803353374, "epoch": 82.32494280605104, "img/sec/core": 548.6925934018318, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 54.03530157555528, "core_hours": 54.03530157555528} {"step": 103050, "l2_params": 342.29094041564264, "train/loss": 2.097638338804245, "l2_grads": 2.46875, "lr": 2.124177539997818e-05, "uptime": 194700.12858481, "examples_seen": 105523200.0, "progress": 0.9151621182384129, "epoch": 82.36490637052, "img/sec/core": 541.4465230061523, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 54.06156866125612, "core_hours": 54.06156866125612} {"step": 103100, "l2_params": 342.29094041564264, "train/loss": 3.1782066822052, "l2_grads": 2.0625, "lr": 2.102159049413899e-05, "uptime": 194793.659378815, "examples_seen": 105574400.0, "progress": 0.9156061561414882, "epoch": 82.40486993498897, "img/sec/core": 547.4132936074997, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 54.08754943736861, "core_hours": 54.08754943736861} {"step": 103150, "l2_params": 342.29094041564264, "train/loss": 2.107936680316925, "l2_grads": 2.3125, "lr": 2.080252821531308e-05, "uptime": 194886.857274371, "examples_seen": 105625600.0, "progress": 0.9160501940445637, "epoch": 82.44483349945791, "img/sec/core": 549.3686278489083, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 54.11343774168972, "core_hours": 54.11343774168972} {"step": 103200, "l2_params": 342.29094041564264, "train/loss": 2.16661137342453, "l2_grads": 2.21875, "lr": 2.0584589076937544e-05, "uptime": 194980.05737660002, "examples_seen": 105676800.0, "progress": 0.916494231947639, "epoch": 82.48479706392688, "img/sec/core": 549.3556205999246, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 54.139326658975556, "core_hours": 54.139326658975556} {"step": 103250, "l2_params": 342.29094041564264, "train/loss": 3.0949278473854065, "l2_grads": 2.09375, "lr": 2.036777358981672e-05, "uptime": 195074.437312285, "examples_seen": 105728000.0, "progress": 0.9169382698507145, "epoch": 82.52476062839582, "img/sec/core": 542.4881848922635, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 54.16554330777694, "core_hours": 54.16554330777694} {"step": 103300, "l2_params": 342.29094041564264, "train/loss": 2.3731093406677246, "l2_grads": 2.265625, "lr": 2.0152082262121817e-05, "uptime": 195168.87386775602, "examples_seen": 105779200.0, "progress": 0.9173823077537898, "epoch": 82.56472419286479, "img/sec/core": 542.1629340951308, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 54.19177568429667, "core_hours": 54.19177568429667} {"step": 103350, "l2_params": 342.29094041564264, "train/loss": 2.8072601556777954, "l2_grads": 2.09375, "lr": 1.9937515599388914e-05, "uptime": 195262.383209336, "examples_seen": 105830400.0, "progress": 0.9178263456568653, "epoch": 82.60468775733375, "img/sec/core": 547.5388783077757, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 54.217750501402215, "core_hours": 54.217750501402215} {"step": 103400, "l2_params": 342.29094041564264, "train/loss": 2.0949350595474243, "l2_grads": 2.25, "lr": 1.9724074104518298e-05, "uptime": 195355.499333722, "examples_seen": 105881600.0, "progress": 0.9182703835599407, "epoch": 82.6446513218027, "img/sec/core": 549.8510632568766, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 54.243616091509445, "core_hours": 54.243616091509445} {"step": 103450, "l2_params": 342.29094041564264, "train/loss": 2.339078366756439, "l2_grads": 2.3125, "lr": 1.9511758277772885e-05, "uptime": 195450.063785877, "examples_seen": 105932800.0, "progress": 0.9187144214630161, "epoch": 82.68461488627166, "img/sec/core": 541.4296686886024, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 54.26988399488583, "core_hours": 54.26988399488583} {"step": 103500, "l2_params": 342.29094041564264, "train/loss": 2.2241620123386383, "l2_grads": 2.265625, "lr": 1.930056861677724e-05, "uptime": 195543.18964171, "examples_seen": 105984000.0, "progress": 0.9191584593660915, "epoch": 82.72457845074061, "img/sec/core": 549.7936050307553, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 54.29575228817278, "core_hours": 54.29575228817278} {"step": 103550, "l2_params": 342.29094041564264, "train/loss": 2.0401129722595215, "l2_grads": 2.1875, "lr": 1.9090505616516854e-05, "uptime": 195636.921319117, "examples_seen": 106035200.0, "progress": 0.9196024972691669, "epoch": 82.76454201520957, "img/sec/core": 546.2400910384767, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 54.32178886523028, "core_hours": 54.32178886523028} {"step": 103600, "l2_params": 342.29094041564264, "train/loss": 2.9488248229026794, "l2_grads": 2.09375, "lr": 1.8881569769336015e-05, "uptime": 195732.27593812, "examples_seen": 106086400.0, "progress": 0.9200465351722423, "epoch": 82.80450557967853, "img/sec/core": 536.9430504294232, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 54.34827625939777, "core_hours": 54.34827625939777} {"step": 103650, "l2_params": 342.29094041564264, "train/loss": 2.542407751083374, "l2_grads": 2.234375, "lr": 1.867376156493759e-05, "uptime": 195825.319157293, "examples_seen": 106137600.0, "progress": 0.9204905730753177, "epoch": 82.84446914414748, "img/sec/core": 550.2819061408162, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 54.374121598056945, "core_hours": 54.374121598056945} {"step": 103700, "l2_params": 342.29094041564264, "train/loss": 3.3163915872573853, "l2_grads": 2.125, "lr": 1.8467081490381257e-05, "uptime": 195918.791840486, "examples_seen": 106188800.0, "progress": 0.9209346109783931, "epoch": 82.88443270861644, "img/sec/core": 547.7536136872247, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 54.40008623227722, "core_hours": 54.40008623227722} {"step": 103750, "l2_params": 342.29094041564264, "train/loss": 3.070133328437805, "l2_grads": 2.140625, "lr": 1.8261530030082602e-05, "uptime": 196012.015207674, "examples_seen": 106240000.0, "progress": 0.9213786488814685, "epoch": 82.92439627308539, "img/sec/core": 549.2185226129168, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 54.42598161205167, "core_hours": 54.42598161205167} {"step": 103800, "l2_params": 342.29094041564264, "train/loss": 3.1210617423057556, "l2_grads": 2.109375, "lr": 1.8057107665812057e-05, "uptime": 196105.267344125, "examples_seen": 106291200.0, "progress": 0.9218226867845439, "epoch": 82.96435983755435, "img/sec/core": 549.0490829334482, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 54.45188498328805, "core_hours": 54.45188498328805} {"step": 103850, "l2_params": 342.29094041564264, "train/loss": 4.5418360233306885, "l2_grads": 2.0625, "lr": 1.7853814876693707e-05, "uptime": 196199.402280476, "examples_seen": 106342400.0, "progress": 0.9222667246876194, "epoch": 83.00432340202332, "img/sec/core": 543.900086245198, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 54.478033576718886, "core_hours": 54.478033576718886} {"step": 103900, "l2_params": 342.29094041564264, "train/loss": 4.825581312179565, "l2_grads": 2.203125, "lr": 1.765165213920418e-05, "uptime": 196293.619628299, "examples_seen": 106393600.0, "progress": 0.9227107625906947, "epoch": 83.04428696649227, "img/sec/core": 543.4243393922342, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 54.50420506222528, "core_hours": 54.50420506222528} {"step": 103950, "l2_params": 342.29094041564264, "train/loss": 2.0835056602954865, "l2_grads": 2.453125, "lr": 1.7450619927171243e-05, "uptime": 196386.771987638, "examples_seen": 106444800.0, "progress": 0.9231548004937702, "epoch": 83.08425053096123, "img/sec/core": 549.6371789540228, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 54.53008071759722, "core_hours": 54.53008071759722} {"step": 104000, "l2_params": 342.29094041564264, "train/loss": 4.247912406921387, "l2_grads": 2.0, "lr": 1.725071871177315e-05, "uptime": 196481.085587528, "examples_seen": 106496000.0, "progress": 0.9235988383968455, "epoch": 83.12421409543018, "img/sec/core": 542.8697458236128, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 54.55627893978889, "core_hours": 54.55627893978889} {"step": 104050, "l2_params": 342.29094041564264, "train/loss": 2.341948986053467, "l2_grads": 2.25, "lr": 1.705194896153734e-05, "uptime": 196574.42911343402, "examples_seen": 106547200.0, "progress": 0.924042876299921, "epoch": 83.16417765989914, "img/sec/core": 548.5115277470527, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 54.58220769698501, "core_hours": 54.58220769698501} {"step": 104100, "l2_params": 342.29094041564264, "train/loss": 2.1659910678863525, "l2_grads": 2.296875, "lr": 1.6854311142339163e-05, "uptime": 196668.736970274, "examples_seen": 106598400.0, "progress": 0.9244869142029963, "epoch": 83.2041412243681, "img/sec/core": 542.9028048730617, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 54.608404323885004, "core_hours": 54.608404323885004} {"step": 104150, "l2_params": 342.29094041564264, "train/loss": 3.4851366877555847, "l2_grads": 2.09375, "lr": 1.6657805717401272e-05, "uptime": 196761.995552945, "examples_seen": 106649600.0, "progress": 0.9249309521060718, "epoch": 83.24410478883705, "img/sec/core": 549.0111315612162, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 54.63430948573806, "core_hours": 54.63430948573806} {"step": 104200, "l2_params": 342.29094041564264, "train/loss": 2.7352019548416138, "l2_grads": 2.1875, "lr": 1.646243314729195e-05, "uptime": 196856.377251864, "examples_seen": 106700800.0, "progress": 0.9253749900091471, "epoch": 83.28406835330601, "img/sec/core": 542.4780501561398, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 54.660526624326664, "core_hours": 54.660526624326664} {"step": 104250, "l2_params": 342.29094041564264, "train/loss": 4.657914638519287, "l2_grads": 2.078125, "lr": 1.6268193889924224e-05, "uptime": 196949.525719074, "examples_seen": 106752000.0, "progress": 0.9258190279122226, "epoch": 83.32403191777496, "img/sec/core": 549.660145073226, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 54.68640119855167, "core_hours": 54.68640119855167} {"step": 104300, "l2_params": 342.29094041564264, "train/loss": 2.609122097492218, "l2_grads": 2.125, "lr": 1.6075088400555205e-05, "uptime": 197043.814273025, "examples_seen": 106803200.0, "progress": 0.926263065815298, "epoch": 83.36399548224392, "img/sec/core": 543.0139487197375, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 54.71259246353805, "core_hours": 54.71259246353805} {"step": 104350, "l2_params": 342.29094041564264, "train/loss": 4.7074480056762695, "l2_grads": 2.125, "lr": 1.5883117131784358e-05, "uptime": 197136.975703222, "examples_seen": 106854400.0, "progress": 0.9267071037183734, "epoch": 83.40395904671288, "img/sec/core": 549.5836623775081, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 54.73847063859277, "core_hours": 54.73847063859277} {"step": 104400, "l2_params": 342.29094041564264, "train/loss": 2.454248011112213, "l2_grads": 2.125, "lr": 1.5692280533553088e-05, "uptime": 197230.91908722802, "examples_seen": 106905600.0, "progress": 0.9271511416214488, "epoch": 83.44392261118183, "img/sec/core": 545.009108855664, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 54.764566023038896, "core_hours": 54.764566023038896} {"step": 104450, "l2_params": 342.29094041564264, "train/loss": 4.764366149902344, "l2_grads": 2.140625, "lr": 1.550257905314306e-05, "uptime": 197324.104227706, "examples_seen": 106956800.0, "progress": 0.9275951795245242, "epoch": 83.4838861756508, "img/sec/core": 549.4438248134021, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 54.79045078428278, "core_hours": 54.79045078428278} {"step": 104500, "l2_params": 342.29094041564264, "train/loss": 4.738344192504883, "l2_grads": 2.1875, "lr": 1.5314013135175506e-05, "uptime": 197418.422103392, "examples_seen": 107008000.0, "progress": 0.9280392174275996, "epoch": 83.52384974011974, "img/sec/core": 542.8451354275769, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 54.81665019419555, "core_hours": 54.81665019419555} {"step": 104550, "l2_params": 342.29094041564264, "train/loss": 4.3959349393844604, "l2_grads": 2.03125, "lr": 1.5126583221610374e-05, "uptime": 197511.934593167, "examples_seen": 107059200.0, "progress": 0.928483255330675, "epoch": 83.5638133045887, "img/sec/core": 547.5204448430424, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 54.84262588579973, "core_hours": 54.84262588579973} {"step": 104600, "l2_params": 342.29094041564264, "train/loss": 2.1741872429847717, "l2_grads": 2.25, "lr": 1.4940289751744715e-05, "uptime": 197606.993617995, "examples_seen": 107110400.0, "progress": 0.9289272932337505, "epoch": 83.60377686905767, "img/sec/core": 538.6127208084243, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 54.869031170474166, "core_hours": 54.869031170474166} {"step": 104650, "l2_params": 342.29094041564264, "train/loss": 4.278063654899597, "l2_grads": 2.078125, "lr": 1.4755133162212328e-05, "uptime": 197700.106902256, "examples_seen": 107161600.0, "progress": 0.9293713311368258, "epoch": 83.64374043352662, "img/sec/core": 549.8678347171951, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 54.894895971657775, "core_hours": 54.894895971657775} {"step": 104700, "l2_params": 342.29094041564264, "train/loss": 3.366665005683899, "l2_grads": 1.984375, "lr": 1.4571113886982173e-05, "uptime": 197794.441277902, "examples_seen": 107212800.0, "progress": 0.9298153690399013, "epoch": 83.68370399799558, "img/sec/core": 542.7501867626345, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 54.921099964892775, "core_hours": 54.921099964892775} {"step": 104750, "l2_params": 342.29094041564264, "train/loss": 2.6407180428504944, "l2_grads": 2.0625, "lr": 1.438823235735753e-05, "uptime": 197887.975222566, "examples_seen": 107264000.0, "progress": 0.9302594069429767, "epoch": 83.72366756246453, "img/sec/core": 547.394854177541, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 54.947081616188335, "core_hours": 54.947081616188335} {"step": 104800, "l2_params": 342.29094041564264, "train/loss": 2.219188690185547, "l2_grads": 2.4375, "lr": 1.4206489001975344e-05, "uptime": 197981.598256576, "examples_seen": 107315200.0, "progress": 0.930703444846052, "epoch": 83.76363112693349, "img/sec/core": 546.8739668758301, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 54.97308801452444, "core_hours": 54.97308801452444} {"step": 104850, "l2_params": 342.29094041564264, "train/loss": 2.5907830595970154, "l2_grads": 2.25, "lr": 1.4025884246804445e-05, "uptime": 198075.170561125, "examples_seen": 107366400.0, "progress": 0.9311474827491275, "epoch": 83.80359469140245, "img/sec/core": 547.1704501322823, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 54.99908032134361, "core_hours": 54.99908032134361} {"step": 104900, "l2_params": 342.29094041564264, "train/loss": 3.753122627735138, "l2_grads": 2.109375, "lr": 1.3846418515145505e-05, "uptime": 198168.765202555, "examples_seen": 107417600.0, "progress": 0.9315915206522029, "epoch": 83.8435582558714, "img/sec/core": 547.0398648655748, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 55.02507883285194, "core_hours": 55.02507883285194} {"step": 104950, "l2_params": 342.29094041564264, "train/loss": 2.2061696648597717, "l2_grads": 2.375, "lr": 1.3668092227629273e-05, "uptime": 198263.240474091, "examples_seen": 107468800.0, "progress": 0.9320355585552783, "epoch": 83.88352182034036, "img/sec/core": 541.9407551581969, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 55.05132196383417, "core_hours": 55.05132196383417} {"step": 105000, "l2_params": 342.29094041564264, "train/loss": 3.3069936633110046, "l2_grads": 2.1875, "lr": 1.3490905802215968e-05, "uptime": 198356.402692192, "examples_seen": 107520000.0, "progress": 0.9324795964583537, "epoch": 83.92348538480933, "img/sec/core": 549.5790143649343, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 55.07720035775112, "core_hours": 55.07720035775112, "val/acc@1": 0.6656967474489796, "val/loss": 1.3745831263308623, "z/secs/eval/val": 31.741081576998113} {"step": 105050, "l2_params": 342.29094041564264, "train/loss": 4.751234531402588, "l2_grads": 2.078125, "lr": 1.3314859654194123e-05, "uptime": 198481.296980145, "examples_seen": 107571200.0, "progress": 0.9329236343614291, "epoch": 83.96344894927827, "img/sec/core": 409.94669043042484, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 55.111893215515835, "core_hours": 55.111893215515835} {"step": 105100, "l2_params": 342.29094041564264, "train/loss": 3.9145914912223816, "l2_grads": 2.078125, "lr": 1.3139954196179763e-05, "uptime": 198574.497052438, "examples_seen": 107622400.0, "progress": 0.9333676722645045, "epoch": 84.00341251374724, "img/sec/core": 549.3557970539057, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 55.13778212448611, "core_hours": 55.13778212448611} {"step": 105150, "l2_params": 342.29094041564264, "train/loss": 2.8799842596054077, "l2_grads": 2.15625, "lr": 1.2966189838115386e-05, "uptime": 198668.488730574, "examples_seen": 107673600.0, "progress": 0.9338117101675799, "epoch": 84.04337607821618, "img/sec/core": 544.729076183962, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 55.16389092396833, "core_hours": 55.16389092396833} {"step": 105200, "l2_params": 342.29094041564264, "train/loss": 2.142612010240555, "l2_grads": 2.265625, "lr": 1.2793566987268807e-05, "uptime": 198761.614513856, "examples_seen": 107724800.0, "progress": 0.9342557480706553, "epoch": 84.08333964268515, "img/sec/core": 549.7940333554188, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 55.18975919710223, "core_hours": 55.18975919710223} {"step": 105250, "l2_params": 342.29094041564264, "train/loss": 3.149441182613373, "l2_grads": 2.0, "lr": 1.2622086048232793e-05, "uptime": 198854.871644102, "examples_seen": 107776000.0, "progress": 0.9346997859737307, "epoch": 84.12330320715411, "img/sec/core": 549.0196820869579, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 55.21566395550389, "core_hours": 55.21566395550389} {"step": 105300, "l2_params": 342.29094041564264, "train/loss": 2.029370039701462, "l2_grads": 2.3125, "lr": 1.2451747422923274e-05, "uptime": 198949.375887275, "examples_seen": 107827200.0, "progress": 0.9351438238768062, "epoch": 84.16326677162306, "img/sec/core": 541.7746154135644, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 55.24191513416306, "core_hours": 55.24191513416306} {"step": 105350, "l2_params": 342.29094041564264, "train/loss": 4.642120957374573, "l2_grads": 2.078125, "lr": 1.2282551510579047e-05, "uptime": 199042.983076412, "examples_seen": 107878400.0, "progress": 0.9355878617798815, "epoch": 84.20323033609202, "img/sec/core": 546.9665361393231, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 55.26791713114555, "core_hours": 55.26791713114555} {"step": 105400, "l2_params": 342.29094041564264, "train/loss": 2.1525180339813232, "l2_grads": 2.359375, "lr": 1.21144987077606e-05, "uptime": 199137.01638438102, "examples_seen": 107929600.0, "progress": 0.936031899682957, "epoch": 84.24319390056097, "img/sec/core": 544.4879171630308, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 55.29403749447028, "core_hours": 55.29403749447028} {"step": 105450, "l2_params": 342.29094041564264, "train/loss": 4.763368487358093, "l2_grads": 2.25, "lr": 1.1947589408349055e-05, "uptime": 199230.117185902, "examples_seen": 107980800.0, "progress": 0.9364759375860323, "epoch": 84.28315746502993, "img/sec/core": 549.94155972397, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 55.31989882822611, "core_hours": 55.31989882822611} {"step": 105500, "l2_params": 342.29094041564264, "train/loss": 3.5319822430610657, "l2_grads": 2.0625, "lr": 1.1781824003545706e-05, "uptime": 199323.387086297, "examples_seen": 108032000.0, "progress": 0.9369199754891078, "epoch": 84.32312102949889, "img/sec/core": 548.9445124650165, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 55.34580713389139, "core_hours": 55.34580713389139} {"step": 105550, "l2_params": 342.29094041564264, "train/loss": 2.1413195729255676, "l2_grads": 2.390625, "lr": 1.1617202881870553e-05, "uptime": 199416.709246841, "examples_seen": 108083200.0, "progress": 0.9373640133921831, "epoch": 84.36308459396784, "img/sec/core": 548.6371050728651, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 55.37172995626472, "core_hours": 55.37172995626472} {"step": 105600, "l2_params": 342.29094041564264, "train/loss": 2.3139713406562805, "l2_grads": 2.3125, "lr": 1.1453726429161687e-05, "uptime": 199511.2577776, "examples_seen": 108134400.0, "progress": 0.9378080512952586, "epoch": 84.4030481584368, "img/sec/core": 541.5208421430383, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 55.39799343703111, "core_hours": 55.39799343703111} {"step": 105650, "l2_params": 342.29094041564264, "train/loss": 2.152215301990509, "l2_grads": 2.21875, "lr": 1.129139502857432e-05, "uptime": 199605.034887457, "examples_seen": 108185600.0, "progress": 0.9382520891983339, "epoch": 84.44301172290575, "img/sec/core": 545.9754526245258, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 55.42404263421361, "core_hours": 55.42404263421361} {"step": 105700, "l2_params": 342.29094041564264, "train/loss": 4.718995690345764, "l2_grads": 2.21875, "lr": 1.1130209060579847e-05, "uptime": 199698.24054879101, "examples_seen": 108236800.0, "progress": 0.9386961271014094, "epoch": 84.48297528737471, "img/sec/core": 549.3228551484725, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 55.449933095695286, "core_hours": 55.449933095695286} {"step": 105750, "l2_params": 342.29094041564264, "train/loss": 3.244956314563751, "l2_grads": 2.109375, "lr": 1.0970168902965231e-05, "uptime": 199792.30824621802, "examples_seen": 108288000.0, "progress": 0.9391401650044848, "epoch": 84.52293885184368, "img/sec/core": 544.288862175367, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 55.47606301164722, "core_hours": 55.47606301164722} {"step": 105800, "l2_params": 342.29094041564264, "train/loss": 2.368381142616272, "l2_grads": 2.265625, "lr": 1.0811274930831645e-05, "uptime": 199885.53203486, "examples_seen": 108339200.0, "progress": 0.9395842029075602, "epoch": 84.56290241631262, "img/sec/core": 549.2160396595008, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 55.501958508492216, "core_hours": 55.501958508492216} {"step": 105850, "l2_params": 342.29094041564264, "train/loss": 2.3074421882629395, "l2_grads": 2.296875, "lr": 1.0653527516593905e-05, "uptime": 199978.74497589, "examples_seen": 108390400.0, "progress": 0.9400282408106356, "epoch": 84.60286598078159, "img/sec/core": 549.2799544165805, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 55.52785099211167, "core_hours": 55.52785099211167} {"step": 105900, "l2_params": 342.29094041564264, "train/loss": 2.4978872537612915, "l2_grads": 2.203125, "lr": 1.049692702997959e-05, "uptime": 200071.952526749, "examples_seen": 108441600.0, "progress": 0.940472278713711, "epoch": 84.64282954525054, "img/sec/core": 549.3117191487806, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 55.55374197846139, "core_hours": 55.55374197846139} {"step": 105950, "l2_params": 342.29094041564264, "train/loss": 4.120395660400391, "l2_grads": 1.9921875, "lr": 1.0341473838027993e-05, "uptime": 200165.145988712, "examples_seen": 108492800.0, "progress": 0.9409163166167864, "epoch": 84.6827931097195, "img/sec/core": 549.3947635546048, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 55.579629051228885, "core_hours": 55.579629051228885} {"step": 106000, "l2_params": 342.29094041564264, "train/loss": 2.606952488422394, "l2_grads": 2.203125, "lr": 1.0187168305089621e-05, "uptime": 200259.91709119402, "examples_seen": 108544000.0, "progress": 0.9413603545198618, "epoch": 84.72275667418846, "img/sec/core": 540.249070223865, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 55.6059543574739, "core_hours": 55.6059543574739} {"step": 106050, "l2_params": 342.29094041564264, "train/loss": 2.154721438884735, "l2_grads": 2.265625, "lr": 1.0034010792824815e-05, "uptime": 200353.214130695, "examples_seen": 108595200.0, "progress": 0.9418043924229372, "epoch": 84.76272023865741, "img/sec/core": 548.7848304067178, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 55.631870201779726, "core_hours": 55.631870201779726} {"step": 106100, "l2_params": 342.29094041564264, "train/loss": 2.265348494052887, "l2_grads": 2.390625, "lr": 9.882001660203335e-06, "uptime": 200447.252408864, "examples_seen": 108646400.0, "progress": 0.9422484303260126, "epoch": 84.80268380312637, "img/sec/core": 544.4591393728747, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 55.65799194571556, "core_hours": 55.65799194571556} {"step": 106150, "l2_params": 342.29094041564264, "train/loss": 2.083209276199341, "l2_grads": 2.390625, "lr": 9.731141263503459e-06, "uptime": 200540.511776277, "examples_seen": 108697600.0, "progress": 0.942692468229088, "epoch": 84.84264736759532, "img/sec/core": 549.0065118419488, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 55.6838973255525, "core_hours": 55.6838973255525} {"step": 106200, "l2_params": 342.29094041564264, "train/loss": 3.4558371901512146, "l2_grads": 2.15625, "lr": 9.581429956310915e-06, "uptime": 200635.527247772, "examples_seen": 108748800.0, "progress": 0.9431365061321635, "epoch": 84.88261093206428, "img/sec/core": 538.8596109076823, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 55.71029051207889, "core_hours": 55.71029051207889} {"step": 106250, "l2_params": 342.29094041564264, "train/loss": 3.113368034362793, "l2_grads": 2.03125, "lr": 9.432868089518233e-06, "uptime": 200728.719957145, "examples_seen": 108800000.0, "progress": 0.9435805440352388, "epoch": 84.92257449653324, "img/sec/core": 549.3992002644709, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 55.73617737579361, "core_hours": 55.73617737579361} {"step": 106300, "l2_params": 342.29094041564264, "train/loss": 2.8169572353363037, "l2_grads": 2.03125, "lr": 9.285456011323937e-06, "uptime": 200823.172548604, "examples_seen": 108851200.0, "progress": 0.9440245819383143, "epoch": 84.96253806100219, "img/sec/core": 542.070886665108, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 55.76241420675444, "core_hours": 55.76241420675444} {"step": 106350, "l2_params": 342.29094041564264, "train/loss": 2.347804605960846, "l2_grads": 2.21875, "lr": 9.139194067231649e-06, "uptime": 200916.897094635, "examples_seen": 108902400.0, "progress": 0.9444686198413896, "epoch": 85.00250162547115, "img/sec/core": 546.2816537202647, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 55.78844880287417, "core_hours": 55.78844880287417} {"step": 106400, "l2_params": 342.29094041564264, "train/loss": 2.220972180366516, "l2_grads": 2.34375, "lr": 8.994082600049378e-06, "uptime": 201010.099365131, "examples_seen": 108953600.0, "progress": 0.9449126577444651, "epoch": 85.0424651899401, "img/sec/core": 549.3428403356265, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 55.814338322456386, "core_hours": 55.814338322456386} {"step": 106450, "l2_params": 342.29094041564264, "train/loss": 4.244796872138977, "l2_grads": 2.109375, "lr": 8.850121949888508e-06, "uptime": 201103.913870577, "examples_seen": 109004800.0, "progress": 0.9453566956475404, "epoch": 85.08242875440907, "img/sec/core": 545.7578202495442, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 55.8403979073025, "core_hours": 55.8403979073025} {"step": 106500, "l2_params": 342.29094041564264, "train/loss": 4.729810476303101, "l2_grads": 2.1875, "lr": 8.707312454163345e-06, "uptime": 201198.402485315, "examples_seen": 109056000.0, "progress": 0.9458007335506159, "epoch": 85.12239231887803, "img/sec/core": 541.8642250389128, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 55.86664474472972, "core_hours": 55.86664474472972} {"step": 106550, "l2_params": 342.29094041564264, "train/loss": 2.2860307097434998, "l2_grads": 2.484375, "lr": 8.565654447589945e-06, "uptime": 201291.606088156, "examples_seen": 109107200.0, "progress": 0.9462447714536912, "epoch": 85.16235588334698, "img/sec/core": 549.3349874826205, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 55.892534634407774, "core_hours": 55.892534634407774} {"step": 106600, "l2_params": 342.29094041564264, "train/loss": 3.6883097290992737, "l2_grads": 2.03125, "lr": 8.425148262185491e-06, "uptime": 201386.891103542, "examples_seen": 109158400.0, "progress": 0.9466888093567667, "epoch": 85.20231944781594, "img/sec/core": 537.3352755686262, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 55.91900269423722, "core_hours": 55.91900269423722} {"step": 106650, "l2_params": 342.29094041564264, "train/loss": 4.1595354080200195, "l2_grads": 2.140625, "lr": 8.285794227267833e-06, "uptime": 201479.981534996, "examples_seen": 109209600.0, "progress": 0.9471328472598421, "epoch": 85.24228301228489, "img/sec/core": 550.0028219903028, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 55.94486114741889, "core_hours": 55.94486114741889} {"step": 106700, "l2_params": 342.29094041564264, "train/loss": 2.2040569186210632, "l2_grads": 2.3125, "lr": 8.147592669454026e-06, "uptime": 201574.296824365, "examples_seen": 109260800.0, "progress": 0.9475768851629175, "epoch": 85.28224657675385, "img/sec/core": 542.8600213448476, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 55.97105983891028, "core_hours": 55.97105983891028} {"step": 106750, "l2_params": 342.29094041564264, "train/loss": 1.9940473139286041, "l2_grads": 2.34375, "lr": 8.010543912660262e-06, "uptime": 201668.456633146, "examples_seen": 109312000.0, "progress": 0.948020923065993, "epoch": 85.32221014122281, "img/sec/core": 543.7564143644742, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 55.997215341349445, "core_hours": 55.997215341349445} {"step": 106800, "l2_params": 342.29094041564264, "train/loss": 2.7254653573036194, "l2_grads": 2.078125, "lr": 7.874648278100641e-06, "uptime": 201762.709260934, "examples_seen": 109363200.0, "progress": 0.9484649609690683, "epoch": 85.36217370569176, "img/sec/core": 543.2209287062582, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 56.02339662684611, "core_hours": 56.02339662684611} {"step": 106850, "l2_params": 342.29094041564264, "train/loss": 2.189050793647766, "l2_grads": 2.296875, "lr": 7.739906084286541e-06, "uptime": 201857.025368173, "examples_seen": 109414400.0, "progress": 0.9489089988721437, "epoch": 85.40213727016072, "img/sec/core": 542.8553138888765, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 56.04959554552361, "core_hours": 56.04959554552361} {"step": 106900, "l2_params": 342.29094041564264, "train/loss": 2.0836799442768097, "l2_grads": 2.25, "lr": 7.606317647026073e-06, "uptime": 201950.249555032, "examples_seen": 109465600.0, "progress": 0.9493530367752191, "epoch": 85.44210083462968, "img/sec/core": 549.2136936247637, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 56.07549115298445, "core_hours": 56.07549115298445} {"step": 106950, "l2_params": 342.29094041564264, "train/loss": 2.0234069526195526, "l2_grads": 2.21875, "lr": 7.473883279423053e-06, "uptime": 202044.536968224, "examples_seen": 109516800.0, "progress": 0.9497970746782946, "epoch": 85.48206439909863, "img/sec/core": 543.020518504779, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 56.10168210109334, "core_hours": 56.10168210109334} {"step": 107000, "l2_params": 342.29094041564264, "train/loss": 2.2708595395088196, "l2_grads": 2.328125, "lr": 7.342603291876466e-06, "uptime": 202138.520601594, "examples_seen": 109568000.0, "progress": 0.9502411125813699, "epoch": 85.5220279635676, "img/sec/core": 544.7757036423214, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 56.12778866591834, "core_hours": 56.12778866591834} {"step": 107050, "l2_params": 342.29094041564264, "train/loss": 4.626183986663818, "l2_grads": 2.0625, "lr": 7.212477992079683e-06, "uptime": 202232.777409412, "examples_seen": 109619200.0, "progress": 0.9506851504844454, "epoch": 85.56199152803654, "img/sec/core": 543.196838353227, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 56.15397111253444, "core_hours": 56.15397111253444} {"step": 107100, "l2_params": 342.29094041564264, "train/loss": 3.027275562286377, "l2_grads": 2.140625, "lr": 7.083507685019521e-06, "uptime": 202326.765836085, "examples_seen": 109670400.0, "progress": 0.9511291883875208, "epoch": 85.6019550925055, "img/sec/core": 544.7479207002397, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 56.1800790088325, "core_hours": 56.1800790088325} {"step": 107150, "l2_params": 342.29094041564264, "train/loss": 2.125804126262665, "l2_grads": 2.21875, "lr": 6.9556926729760105e-06, "uptime": 202419.829629555, "examples_seen": 109721600.0, "progress": 0.9515732262905962, "epoch": 85.64191865697447, "img/sec/core": 550.1602512743196, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 56.20593006257416, "core_hours": 56.20593006257416} {"step": 107200, "l2_params": 342.29094041564264, "train/loss": 2.304241895675659, "l2_grads": 2.40625, "lr": 6.8290332555212965e-06, "uptime": 202514.538209702, "examples_seen": 109772800.0, "progress": 0.9520172641936716, "epoch": 85.68188222144342, "img/sec/core": 540.6057183047819, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 56.23223800150389, "core_hours": 56.23223800150389} {"step": 107250, "l2_params": 342.29094041564264, "train/loss": 2.5425232648849487, "l2_grads": 2.234375, "lr": 6.703529729519084e-06, "uptime": 202608.802480116, "examples_seen": 109824000.0, "progress": 0.952461302096747, "epoch": 85.72184578591238, "img/sec/core": 543.1538352245375, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 56.25842252106333, "core_hours": 56.25842252106333} {"step": 107300, "l2_params": 342.29094041564264, "train/loss": 3.124502658843994, "l2_grads": 2.046875, "lr": 6.5791823891237354e-06, "uptime": 202701.840603454, "examples_seen": 109875200.0, "progress": 0.9529053399998224, "epoch": 85.76180935038133, "img/sec/core": 550.3120458909606, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 56.28426644421278, "core_hours": 56.28426644421278} {"step": 107350, "l2_params": 342.29094041564264, "train/loss": 2.1891385316848755, "l2_grads": 2.28125, "lr": 6.455991525779844e-06, "uptime": 202795.04754077, "examples_seen": 109926400.0, "progress": 0.9533493779028978, "epoch": 85.80177291485029, "img/sec/core": 549.315335042302, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 56.31015726013389, "core_hours": 56.31015726013389} {"step": 107400, "l2_params": 342.29094041564264, "train/loss": 2.5953309535980225, "l2_grads": 2.15625, "lr": 6.33395742822172e-06, "uptime": 202888.281949692, "examples_seen": 109977600.0, "progress": 0.9537934158059732, "epoch": 85.84173647931925, "img/sec/core": 549.1534787637759, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 56.336055707056666, "core_hours": 56.336055707056666} {"step": 107450, "l2_params": 342.29094041564264, "train/loss": 4.432282328605652, "l2_grads": 1.96875, "lr": 6.213080382471957e-06, "uptime": 202982.91226702, "examples_seen": 110028800.0, "progress": 0.9542374537090486, "epoch": 85.8817000437882, "img/sec/core": 541.0528194947614, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 56.36234190631444, "core_hours": 56.36234190631444} {"step": 107500, "l2_params": 342.29094041564264, "train/loss": 2.125524401664734, "l2_grads": 2.328125, "lr": 6.093360671841717e-06, "uptime": 203076.231545965, "examples_seen": 110080000.0, "progress": 0.954681491612124, "epoch": 85.92166360825716, "img/sec/core": 548.6540463966696, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 56.38826392824362, "core_hours": 56.38826392824362, "val/acc@1": 0.6650988520408163, "val/loss": 1.3747515766596308, "z/secs/eval/val": 31.712590751005337} {"step": 107550, "l2_params": 342.29094041564264, "train/loss": 2.1154284477233887, "l2_grads": 2.3125, "lr": 5.974798576929316e-06, "uptime": 203200.862109535, "examples_seen": 110131200.0, "progress": 0.9551255295151995, "epoch": 85.96162717272611, "img/sec/core": 410.81415772664855, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 56.42288352923528, "core_hours": 56.42288352923528} {"step": 107600, "l2_params": 342.29094041564264, "train/loss": 2.2066676020622253, "l2_grads": 2.328125, "lr": 5.857394375620027e-06, "uptime": 203293.962824975, "examples_seen": 110182400.0, "progress": 0.9555695674182748, "epoch": 86.00159073719507, "img/sec/core": 549.9420682002901, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 56.44874483907972, "core_hours": 56.44874483907972} {"step": 107650, "l2_params": 342.29094041564264, "train/loss": 3.580696702003479, "l2_grads": 1.96875, "lr": 5.741148343085121e-06, "uptime": 203387.118238952, "examples_seen": 110233600.0, "progress": 0.9560136053213503, "epoch": 86.04155430166404, "img/sec/core": 549.6191559261649, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 56.47462134296222, "core_hours": 56.47462134296222} {"step": 107700, "l2_params": 342.29094041564264, "train/loss": 2.871168553829193, "l2_grads": 2.140625, "lr": 5.6260607517813776e-06, "uptime": 203481.637717436, "examples_seen": 110284800.0, "progress": 0.9564576432244256, "epoch": 86.08151786613298, "img/sec/core": 541.6872883896382, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 56.50087675365223, "core_hours": 56.50087675365223} {"step": 107750, "l2_params": 342.29094041564264, "train/loss": 2.1378660798072815, "l2_grads": 2.25, "lr": 5.512131871450583e-06, "uptime": 203574.73239371402, "examples_seen": 110336000.0, "progress": 0.9569016811275011, "epoch": 86.12148143060195, "img/sec/core": 549.9777435940802, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 56.52673638595167, "core_hours": 56.52673638595167} {"step": 107800, "l2_params": 342.29094041564264, "train/loss": 3.1383556127548218, "l2_grads": 2.09375, "lr": 5.399361969118581e-06, "uptime": 203667.930662452, "examples_seen": 110387200.0, "progress": 0.9573457190305764, "epoch": 86.1614449950709, "img/sec/core": 549.3664280818106, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 56.55262479393445, "core_hours": 56.55262479393445} {"step": 107850, "l2_params": 342.29094041564264, "train/loss": 2.588127553462982, "l2_grads": 2.203125, "lr": 5.287751309094891e-06, "uptime": 203762.054076492, "examples_seen": 110438400.0, "progress": 0.9577897569336519, "epoch": 86.20140855953986, "img/sec/core": 543.9666688911931, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 56.57877018672333, "core_hours": 56.57877018672333} {"step": 107900, "l2_params": 342.29094041564264, "train/loss": 2.173121154308319, "l2_grads": 2.34375, "lr": 5.1773001529719314e-06, "uptime": 203855.338056663, "examples_seen": 110489600.0, "progress": 0.9582337948367272, "epoch": 86.24137212400882, "img/sec/core": 548.8616577696279, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 56.6046824034375, "core_hours": 56.6046824034375} {"step": 107950, "l2_params": 342.29094041564264, "train/loss": 2.0736621022224426, "l2_grads": 2.265625, "lr": 5.068008759624456e-06, "uptime": 203948.578772051, "examples_seen": 110540800.0, "progress": 0.9586778327398027, "epoch": 86.28133568847777, "img/sec/core": 549.1163360012863, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 56.63058260215639, "core_hours": 56.63058260215639} {"step": 108000, "l2_params": 342.29094041564264, "train/loss": 2.168838620185852, "l2_grads": 2.359375, "lr": 4.959877385209223e-06, "uptime": 204041.814908306, "examples_seen": 110592000.0, "progress": 0.9591218706428781, "epoch": 86.32129925294673, "img/sec/core": 549.1433049088225, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 56.656481528893885, "core_hours": 56.656481528893885} {"step": 108050, "l2_params": 342.29094041564264, "train/loss": 2.159307539463043, "l2_grads": 2.328125, "lr": 4.852906283163787e-06, "uptime": 204135.872548688, "examples_seen": 110643200.0, "progress": 0.9595659085459535, "epoch": 86.36126281741568, "img/sec/core": 544.3470598673181, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 56.682608651222225, "core_hours": 56.682608651222225} {"step": 108100, "l2_params": 342.29094041564264, "train/loss": 2.4194626808166504, "l2_grads": 2.328125, "lr": 4.747095704206642e-06, "uptime": 204229.814068673, "examples_seen": 110694400.0, "progress": 0.9600099464490289, "epoch": 86.40122638188464, "img/sec/core": 545.0199231199667, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 56.70870351788472, "core_hours": 56.70870351788472} {"step": 108150, "l2_params": 342.29094041564264, "train/loss": 2.203447699546814, "l2_grads": 2.5, "lr": 4.642445896335857e-06, "uptime": 204324.103733483, "examples_seen": 110745600.0, "progress": 0.9604539843521043, "epoch": 86.4411899463536, "img/sec/core": 543.0075512854107, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 56.73489509144306, "core_hours": 56.73489509144306} {"step": 108200, "l2_params": 342.29094041564264, "train/loss": 3.2876943349838257, "l2_grads": 1.953125, "lr": 4.538957104829124e-06, "uptime": 204417.357679919, "examples_seen": 110796800.0, "progress": 0.9608980222551797, "epoch": 86.48115351082255, "img/sec/core": 549.0384263270358, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 56.760798965453056, "core_hours": 56.760798965453056} {"step": 108250, "l2_params": 342.29094041564264, "train/loss": 3.181031823158264, "l2_grads": 2.09375, "lr": 4.436629572243023e-06, "uptime": 204511.655076388, "examples_seen": 110848000.0, "progress": 0.9613420601582551, "epoch": 86.52111707529151, "img/sec/core": 542.9630288554413, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 56.78699268669445, "core_hours": 56.78699268669445} {"step": 108300, "l2_params": 342.29094041564264, "train/loss": 2.161801815032959, "l2_grads": 2.421875, "lr": 4.335463538412158e-06, "uptime": 204605.21482197, "examples_seen": 110899200.0, "progress": 0.9617860980613305, "epoch": 86.56108063976046, "img/sec/core": 547.2438994089463, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 56.81298150491167, "core_hours": 56.81298150491167} {"step": 108350, "l2_params": 342.29094041564264, "train/loss": 2.274304211139679, "l2_grads": 2.21875, "lr": 4.235459240449071e-06, "uptime": 204698.799119065, "examples_seen": 110950400.0, "progress": 0.9622301359644059, "epoch": 86.60104420422942, "img/sec/core": 547.1003318861449, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 56.838977142993606, "core_hours": 56.838977142993606} {"step": 108400, "l2_params": 342.29094041564264, "train/loss": 3.819781243801117, "l2_grads": 2.109375, "lr": 4.1366169127431095e-06, "uptime": 204793.055470975, "examples_seen": 111001600.0, "progress": 0.9626741738674813, "epoch": 86.64100776869839, "img/sec/core": 543.1994657387525, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 56.865159462968606, "core_hours": 56.865159462968606} {"step": 108450, "l2_params": 342.29094041564264, "train/loss": 2.085258364677429, "l2_grads": 2.328125, "lr": 4.0389367869605165e-06, "uptime": 204886.349235288, "examples_seen": 111052800.0, "progress": 0.9631182117705568, "epoch": 86.68097133316734, "img/sec/core": 548.8040961474862, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 56.891074397500006, "core_hours": 56.891074397500006} {"step": 108500, "l2_params": 342.29094041564264, "train/loss": 2.5735133290290833, "l2_grads": 2.125, "lr": 3.942419092043431e-06, "uptime": 204981.569262214, "examples_seen": 111104000.0, "progress": 0.9635622496736321, "epoch": 86.7209348976363, "img/sec/core": 537.7020113614782, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 56.917524404979446, "core_hours": 56.917524404979446} {"step": 108550, "l2_params": 342.29094041564264, "train/loss": 2.276002824306488, "l2_grads": 2.375, "lr": 3.847064054209455e-06, "uptime": 205074.70533384001, "examples_seen": 111155200.0, "progress": 0.9640062875767076, "epoch": 86.76089846210525, "img/sec/core": 549.7332999570236, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 56.943395535986674, "core_hours": 56.943395535986674} {"step": 108600, "l2_params": 342.29094041564264, "train/loss": 3.4310620427131653, "l2_grads": 2.03125, "lr": 3.752871896951259e-06, "uptime": 205168.494397971, "examples_seen": 111206400.0, "progress": 0.9644503254797829, "epoch": 86.80086202657421, "img/sec/core": 545.9058630598764, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 56.96944805380083, "core_hours": 56.96944805380083} {"step": 108650, "l2_params": 342.29094041564264, "train/loss": 2.5541895627975464, "l2_grads": 2.21875, "lr": 3.6598428410359082e-06, "uptime": 205262.165779408, "examples_seen": 111257600.0, "progress": 0.9648943633828584, "epoch": 86.84082559104317, "img/sec/core": 546.591704045985, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 56.99546788197778, "core_hours": 56.99546788197778} {"step": 108700, "l2_params": 342.29094041564264, "train/loss": 4.572780609130859, "l2_grads": 2.109375, "lr": 3.567977104504382e-06, "uptime": 205356.483231415, "examples_seen": 111308800.0, "progress": 0.9653384012859337, "epoch": 86.88078915551212, "img/sec/core": 542.8475739166358, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 57.02166717420195, "core_hours": 57.02166717420195} {"step": 108750, "l2_params": 342.29094041564264, "train/loss": 4.014870345592499, "l2_grads": 1.9921875, "lr": 3.4772749026711092e-06, "uptime": 205450.011304712, "examples_seen": 111360000.0, "progress": 0.9657824391890092, "epoch": 86.92075271998108, "img/sec/core": 547.4292177217666, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 57.04764719456223, "core_hours": 57.04764719456223} {"step": 108800, "l2_params": 342.29094041564264, "train/loss": 2.0480165779590607, "l2_grads": 2.34375, "lr": 3.387736448123376e-06, "uptime": 205543.64560353901, "examples_seen": 111411200.0, "progress": 0.9662264770920845, "epoch": 86.96071628445004, "img/sec/core": 546.8081743699007, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 57.07365672201417, "core_hours": 57.07365672201417} {"step": 108850, "l2_params": 342.29094041564264, "train/loss": 2.027504861354828, "l2_grads": 2.453125, "lr": 3.2993619507210312e-06, "uptime": 205638.054815831, "examples_seen": 111462400.0, "progress": 0.96667051499516, "epoch": 87.00067984891899, "img/sec/core": 542.3199575232551, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 57.09988150320639, "core_hours": 57.09988150320639} {"step": 108900, "l2_params": 342.29094041564264, "train/loss": 3.0051870346069336, "l2_grads": 2.15625, "lr": 3.2121516175956662e-06, "uptime": 205731.856122417, "examples_seen": 111513600.0, "progress": 0.9671145528982354, "epoch": 87.04064341338795, "img/sec/core": 545.8346142872372, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 57.125937421702496, "core_hours": 57.125937421702496} {"step": 108950, "l2_params": 342.29094041564264, "train/loss": 2.1993273496627808, "l2_grads": 2.375, "lr": 3.12610565315044e-06, "uptime": 205825.765518831, "examples_seen": 111564800.0, "progress": 0.9675585908013108, "epoch": 87.0806069778569, "img/sec/core": 545.2063579908659, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 57.15202336515083, "core_hours": 57.15202336515083} {"step": 109000, "l2_params": 342.29094041564264, "train/loss": 2.2025639414787292, "l2_grads": 2.421875, "lr": 3.041224259059364e-06, "uptime": 205920.090508685, "examples_seen": 111616000.0, "progress": 0.9680026287043862, "epoch": 87.12057054232586, "img/sec/core": 542.8041930271563, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 57.17822475122139, "core_hours": 57.17822475122139} {"step": 109050, "l2_params": 342.29094041564264, "train/loss": 4.222482442855835, "l2_grads": 2.015625, "lr": 2.957507634266968e-06, "uptime": 206014.26964265, "examples_seen": 111667200.0, "progress": 0.9684466666074616, "epoch": 87.16053410679483, "img/sec/core": 543.6448377092859, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 57.20438562176722, "core_hours": 57.20438562176722} {"step": 109100, "l2_params": 342.29094041564264, "train/loss": 4.667453408241272, "l2_grads": 2.078125, "lr": 2.87495597498796e-06, "uptime": 206107.797611732, "examples_seen": 111718400.0, "progress": 0.968890704510537, "epoch": 87.20049767126378, "img/sec/core": 547.4298277032977, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 57.2303656131789, "core_hours": 57.2303656131789} {"step": 109150, "l2_params": 342.29094041564264, "train/loss": 2.2451117634773254, "l2_grads": 2.359375, "lr": 2.7935694747063474e-06, "uptime": 206202.07559589, "examples_seen": 111769600.0, "progress": 0.9693347424136124, "epoch": 87.24046123573274, "img/sec/core": 543.0748276734404, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 57.256553942111665, "core_hours": 57.256553942111665} {"step": 109200, "l2_params": 342.29094041564264, "train/loss": 4.296654105186462, "l2_grads": 2.203125, "lr": 2.7133483241754344e-06, "uptime": 206296.15352451502, "examples_seen": 111820800.0, "progress": 0.9697787803166878, "epoch": 87.28042480020169, "img/sec/core": 544.2296694698315, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 57.28268670006306, "core_hours": 57.28268670006306} {"step": 109250, "l2_params": 342.29094041564264, "train/loss": 3.7598201632499695, "l2_grads": 2.015625, "lr": 2.6342927114170945e-06, "uptime": 206389.386069538, "examples_seen": 111872000.0, "progress": 0.9702228182197632, "epoch": 87.32038836467065, "img/sec/core": 549.1644574045489, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 57.30858462923611, "core_hours": 57.30858462923611} {"step": 109300, "l2_params": 342.29094041564264, "train/loss": 3.7515920996665955, "l2_grads": 2.15625, "lr": 2.5564028217213927e-06, "uptime": 206482.848218814, "examples_seen": 111923200.0, "progress": 0.9706668561228387, "epoch": 87.36035192913961, "img/sec/core": 547.8153498140523, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 57.33454633736834, "core_hours": 57.33454633736834} {"step": 109350, "l2_params": 342.29094041564264, "train/loss": 3.082898795604706, "l2_grads": 1.9765625, "lr": 2.4796788376463488e-06, "uptime": 206576.486822598, "examples_seen": 111974400.0, "progress": 0.9711108940259141, "epoch": 87.40031549360856, "img/sec/core": 546.783035318489, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 57.36055706064167, "core_hours": 57.36055706064167} {"step": 109400, "l2_params": 342.29094041564264, "train/loss": 2.115805447101593, "l2_grads": 2.375, "lr": 2.4041209390172293e-06, "uptime": 206670.139006682, "examples_seen": 112025600.0, "progress": 0.9715549319289895, "epoch": 87.44027905807752, "img/sec/core": 546.7037474969842, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 57.38657155622056, "core_hours": 57.38657155622056} {"step": 109450, "l2_params": 342.29094041564264, "train/loss": 2.0880287289619446, "l2_grads": 2.171875, "lr": 2.329729302926042e-06, "uptime": 206764.494913053, "examples_seen": 112076800.0, "progress": 0.9719989698320649, "epoch": 87.48024262254647, "img/sec/core": 542.6263386065801, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 57.412781530212506, "core_hours": 57.412781530212506} {"step": 109500, "l2_params": 342.29094041564264, "train/loss": 2.209841102361679, "l2_grads": 2.390625, "lr": 2.2565041037317023e-06, "uptime": 206858.797907227, "examples_seen": 112128000.0, "progress": 0.9724430077351403, "epoch": 87.52020618701543, "img/sec/core": 542.9307992652365, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 57.43897680637194, "core_hours": 57.43897680637194} {"step": 109550, "l2_params": 342.29094041564264, "train/loss": 4.085643172264099, "l2_grads": 1.984375, "lr": 2.1844455130589277e-06, "uptime": 206951.906911848, "examples_seen": 112179200.0, "progress": 0.9728870456382157, "epoch": 87.5601697514844, "img/sec/core": 549.8931087107729, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 57.46484041876667, "core_hours": 57.46484041876667} {"step": 109600, "l2_params": 342.29094041564264, "train/loss": 2.7042278051376343, "l2_grads": 2.140625, "lr": 2.1135536997983407e-06, "uptime": 207045.125378035, "examples_seen": 112230400.0, "progress": 0.973331083541291, "epoch": 87.60013331595334, "img/sec/core": 549.2473980132213, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 57.49073443715194, "core_hours": 57.49073443715194} {"step": 109650, "l2_params": 342.29094041564264, "train/loss": 4.000117123126984, "l2_grads": 2.0625, "lr": 2.0438288301056953e-06, "uptime": 207139.315310492, "examples_seen": 112281600.0, "progress": 0.9737751214443665, "epoch": 87.6400968804223, "img/sec/core": 543.5825110435853, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 57.51689830727889, "core_hours": 57.51689830727889} {"step": 109700, "l2_params": 342.29094041564264, "train/loss": 2.4599740505218506, "l2_grads": 2.25, "lr": 1.9752710674018254e-06, "uptime": 207233.499476391, "examples_seen": 112332800.0, "progress": 0.9742191593474419, "epoch": 87.68006044489125, "img/sec/core": 543.6157926471883, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 57.543060575584164, "core_hours": 57.543060575584164} {"step": 109750, "l2_params": 342.29094041564264, "train/loss": 2.15575248003006, "l2_grads": 2.296875, "lr": 1.907880572372029e-06, "uptime": 207326.634360939, "examples_seen": 112384000.0, "progress": 0.9746631972505173, "epoch": 87.72002400936022, "img/sec/core": 549.7403067441944, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 57.568931376847495, "core_hours": 57.568931376847495} {"step": 109800, "l2_params": 342.29094041564264, "train/loss": 2.339510202407837, "l2_grads": 2.21875, "lr": 1.8416575029657945e-06, "uptime": 207419.828564353, "examples_seen": 112435200.0, "progress": 0.9751072351535927, "epoch": 87.75998757382918, "img/sec/core": 549.3903925822057, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 57.59481865557361, "core_hours": 57.59481865557361} {"step": 109850, "l2_params": 342.29094041564264, "train/loss": 2.85246878862381, "l2_grads": 2.0625, "lr": 1.776602014396351e-06, "uptime": 207513.071852989, "examples_seen": 112486400.0, "progress": 0.9755512730566681, "epoch": 87.79995113829813, "img/sec/core": 549.1011819614247, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 57.62071956908361, "core_hours": 57.62071956908361} {"step": 109900, "l2_params": 342.29094041564264, "train/loss": 2.1430035829544067, "l2_grads": 2.296875, "lr": 1.7127142591404525e-06, "uptime": 207607.773548831, "examples_seen": 112537600.0, "progress": 0.9759953109597436, "epoch": 87.83991470276709, "img/sec/core": 540.6450174389954, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 57.64702559570639, "core_hours": 57.64702559570639} {"step": 109950, "l2_params": 342.29094041564264, "train/loss": 2.8588370084762573, "l2_grads": 2.078125, "lr": 1.64999438693782e-06, "uptime": 207701.130194526, "examples_seen": 112588800.0, "progress": 0.9764393488628189, "epoch": 87.87987826723604, "img/sec/core": 548.434443191938, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 57.67295799728833, "core_hours": 57.67295799728833} {"step": 110000, "l2_params": 342.29094041564264, "train/loss": 2.1468923091888428, "l2_grads": 2.203125, "lr": 1.5884425447910856e-06, "uptime": 207794.595539896, "examples_seen": 112640000.0, "progress": 0.9768833867658944, "epoch": 87.919841831705, "img/sec/core": 547.7966169954716, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 57.69892059322444, "core_hours": 57.69892059322444, "val/acc@1": 0.6653778698979592, "val/loss": 1.374728994101894, "z/secs/eval/val": 31.709822231990984} {"step": 110050, "l2_params": 342.29094041564264, "train/loss": 4.638709783554077, "l2_grads": 2.21875, "lr": 1.5280588769649606e-06, "uptime": 207919.419260799, "examples_seen": 112691200.0, "progress": 0.9773274246689697, "epoch": 87.95980539617396, "img/sec/core": 410.1784470900314, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 57.73359384903084, "core_hours": 57.73359384903084} {"step": 110100, "l2_params": 342.29094041564264, "train/loss": 3.86029452085495, "l2_grads": 2.078125, "lr": 1.468843524986456e-06, "uptime": 208012.592550626, "examples_seen": 112742400.0, "progress": 0.9777714625720452, "epoch": 87.99976896064291, "img/sec/core": 549.5137082212592, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 57.75947531842722, "core_hours": 57.75947531842722} {"step": 110150, "l2_params": 342.29094041564264, "train/loss": 2.0620584189891815, "l2_grads": 2.3125, "lr": 1.4107966276441656e-06, "uptime": 208105.837717186, "examples_seen": 112793600.0, "progress": 0.9782155004751205, "epoch": 88.03973252511187, "img/sec/core": 549.0901232618584, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 57.785376753582774, "core_hours": 57.785376753582774} {"step": 110200, "l2_params": 342.29094041564264, "train/loss": 2.21158504486084, "l2_grads": 2.265625, "lr": 1.3539183209880375e-06, "uptime": 208199.104852102, "examples_seen": 112844800.0, "progress": 0.978659538378196, "epoch": 88.07969608958082, "img/sec/core": 548.960789308133, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 57.811284291059444, "core_hours": 57.811284291059444} {"step": 110250, "l2_params": 342.29094041564264, "train/loss": 2.1760764718055725, "l2_grads": 2.328125, "lr": 1.2982087383292674e-06, "uptime": 208293.430845849, "examples_seen": 112896000.0, "progress": 0.9791035762812713, "epoch": 88.11965965404978, "img/sec/core": 542.7984160688567, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 57.83748595598917, "core_hours": 57.83748595598917} {"step": 110300, "l2_params": 342.29094041564264, "train/loss": 2.183889329433441, "l2_grads": 2.265625, "lr": 1.2436680102395749e-06, "uptime": 208386.666119509, "examples_seen": 112947200.0, "progress": 0.9795476141843468, "epoch": 88.15962321851875, "img/sec/core": 549.1483854782059, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 57.86338464311694, "core_hours": 57.86338464311694} {"step": 110350, "l2_params": 342.29094041564264, "train/loss": 2.282764196395874, "l2_grads": 2.296875, "lr": 1.1902962645512601e-06, "uptime": 208480.73952307, "examples_seen": 112998400.0, "progress": 0.9799916520874222, "epoch": 88.1995867829877, "img/sec/core": 544.2558476881745, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 57.88951614410611, "core_hours": 57.88951614410611} {"step": 110400, "l2_params": 342.29094041564264, "train/loss": 4.602721810340881, "l2_grads": 2.0, "lr": 1.1380936263567045e-06, "uptime": 208575.056452521, "examples_seen": 113049600.0, "progress": 0.9804356899904976, "epoch": 88.23955034745666, "img/sec/core": 542.8505815235574, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 57.915715291175836, "core_hours": 57.915715291175836} {"step": 110450, "l2_params": 342.29094041564264, "train/loss": 2.7384443283081055, "l2_grads": 2.15625, "lr": 1.0870602180082599e-06, "uptime": 208668.24976089, "examples_seen": 113100800.0, "progress": 0.980879727893573, "epoch": 88.2795139119256, "img/sec/core": 549.3956690246038, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 57.94160232127833, "core_hours": 57.94160232127833} {"step": 110500, "l2_params": 342.29094041564264, "train/loss": 2.08848237991333, "l2_grads": 2.3125, "lr": 1.0371961591176346e-06, "uptime": 208763.134083056, "examples_seen": 113152000.0, "progress": 0.9813237657966484, "epoch": 88.31947747639457, "img/sec/core": 539.6044239049551, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 57.96795907743556, "core_hours": 57.96795907743556} {"step": 110550, "l2_params": 342.29094041564264, "train/loss": 2.062107414007187, "l2_grads": 2.265625, "lr": 9.885015665560086e-07, "uptime": 208856.276571298, "examples_seen": 113203200.0, "progress": 0.9817678036997238, "epoch": 88.35944104086353, "img/sec/core": 549.6954286531823, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 57.993831990836114, "core_hours": 57.993831990836114} {"step": 110600, "l2_params": 342.29094041564264, "train/loss": 2.2910197973251343, "l2_grads": 2.390625, "lr": 9.409765544535298e-07, "uptime": 208950.660458452, "examples_seen": 113254400.0, "progress": 0.9822118416027992, "epoch": 88.39940460533248, "img/sec/core": 542.4654731209458, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 58.020049737267776, "core_hours": 58.020049737267776} {"step": 110650, "l2_params": 342.29094041564264, "train/loss": 4.459449529647827, "l2_grads": 2.203125, "lr": 8.946212341989309e-07, "uptime": 209043.853181037, "examples_seen": 113305600.0, "progress": 0.9826558795058746, "epoch": 88.43936816980144, "img/sec/core": 549.3991223757236, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 58.0459366046525, "core_hours": 58.0459366046525} {"step": 110700, "l2_params": 342.29094041564264, "train/loss": 2.2438840866088867, "l2_grads": 2.21875, "lr": 8.494357144397472e-07, "uptime": 209138.396793158, "examples_seen": 113356800.0, "progress": 0.98309991740895, "epoch": 88.47933173427039, "img/sec/core": 541.5490148025681, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 58.072198719130554, "core_hours": 58.072198719130554} {"step": 110750, "l2_params": 342.29094041564264, "train/loss": 2.181984931230545, "l2_grads": 2.390625, "lr": 8.054201010814298e-07, "uptime": 209231.64342399, "examples_seen": 113408000.0, "progress": 0.9835439553120254, "epoch": 88.51929529873935, "img/sec/core": 549.0815007809315, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 58.09810056102833, "core_hours": 58.09810056102833} {"step": 110800, "l2_params": 342.29094041564264, "train/loss": 2.757455348968506, "l2_grads": 2.234375, "lr": 7.625744972875673e-07, "uptime": 209325.55343688402, "examples_seen": 113459200.0, "progress": 0.9839879932151009, "epoch": 88.55925886320831, "img/sec/core": 545.2027789388244, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 58.12418667572112, "core_hours": 58.12418667572112} {"step": 110850, "l2_params": 342.29094041564264, "train/loss": 2.0920573472976685, "l2_grads": 2.328125, "lr": 7.208990034794984e-07, "uptime": 209419.642540768, "examples_seen": 113510400.0, "progress": 0.9844320311181762, "epoch": 88.59922242767726, "img/sec/core": 544.1650295993468, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 58.1503225379111, "core_hours": 58.1503225379111} {"step": 110900, "l2_params": 342.29094041564264, "train/loss": 3.3859331011772156, "l2_grads": 2.171875, "lr": 6.803937173359206e-07, "uptime": 209512.84089279, "examples_seen": 113561600.0, "progress": 0.9848760690212517, "epoch": 88.63918599214622, "img/sec/core": 549.3659371563662, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 58.17621096902833, "core_hours": 58.17621096902833} {"step": 110950, "l2_params": 342.29094041564264, "train/loss": 2.336913824081421, "l2_grads": 2.3125, "lr": 6.410587337930041e-07, "uptime": 209607.512716273, "examples_seen": 113612800.0, "progress": 0.985320106924327, "epoch": 88.67914955661519, "img/sec/core": 540.8156103510514, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 58.20250869777361, "core_hours": 58.20250869777361} {"step": 111000, "l2_params": 342.29094041564264, "train/loss": 4.280592679977417, "l2_grads": 2.125, "lr": 6.028941450438361e-07, "uptime": 209700.742701293, "examples_seen": 113664000.0, "progress": 0.9857641448274025, "epoch": 88.71911312108413, "img/sec/core": 549.179536916289, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 58.22840591583472, "core_hours": 58.22840591583472} {"step": 111050, "l2_params": 342.29094041564264, "train/loss": 2.7854822278022766, "l2_grads": 2.140625, "lr": 5.659000405383638e-07, "uptime": 209794.526681573, "examples_seen": 113715200.0, "progress": 0.9862081827304778, "epoch": 88.7590766855531, "img/sec/core": 545.9354555770577, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 58.254457021468056, "core_hours": 58.254457021468056} {"step": 111100, "l2_params": 342.29094041564264, "train/loss": 2.1427004039287567, "l2_grads": 2.21875, "lr": 5.30076506983173e-07, "uptime": 209888.371433222, "examples_seen": 113766400.0, "progress": 0.9866522206335533, "epoch": 88.79904025002205, "img/sec/core": 545.5819222742302, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 58.28052500803722, "core_hours": 58.28052500803722} {"step": 111150, "l2_params": 342.29094041564264, "train/loss": 2.623774826526642, "l2_grads": 2.171875, "lr": 4.954236283412671e-07, "uptime": 209981.640496831, "examples_seen": 113817600.0, "progress": 0.9870962585366286, "epoch": 88.83900381449101, "img/sec/core": 548.949437453695, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 58.30643308126195, "core_hours": 58.30643308126195} {"step": 111200, "l2_params": 342.29094041564264, "train/loss": 2.220647931098938, "l2_grads": 2.375, "lr": 4.6194148583190023e-07, "uptime": 210076.105937511, "examples_seen": 113868800.0, "progress": 0.9875402964397041, "epoch": 88.87896737895997, "img/sec/core": 541.9971540009952, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 58.332673481450826, "core_hours": 58.332673481450826} {"step": 111250, "l2_params": 342.29094041564264, "train/loss": 4.7924946546554565, "l2_grads": 2.1875, "lr": 4.296301579303537e-07, "uptime": 210170.00265509, "examples_seen": 113920000.0, "progress": 0.9879843343427795, "epoch": 88.91893094342892, "img/sec/core": 545.2799769801727, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 58.35875590300056, "core_hours": 58.35875590300056} {"step": 111300, "l2_params": 342.29094041564264, "train/loss": 2.1775166392326355, "l2_grads": 2.3125, "lr": 3.9848972036766e-07, "uptime": 210264.250463781, "examples_seen": 113971200.0, "progress": 0.9884283722458549, "epoch": 88.95889450789788, "img/sec/core": 543.2487047827824, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 58.38493584985917, "core_hours": 58.38493584985917} {"step": 111350, "l2_params": 342.29094041564264, "train/loss": 4.0815078020095825, "l2_grads": 2.046875, "lr": 3.6852024613065813e-07, "uptime": 210358.541287557, "examples_seen": 114022400.0, "progress": 0.9888724101489303, "epoch": 88.99885807236683, "img/sec/core": 543.0008769638173, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 58.411127745352495, "core_hours": 58.411127745352495} {"step": 111400, "l2_params": 342.29094041564264, "train/loss": 2.6741024255752563, "l2_grads": 2.1875, "lr": 3.397218054616601e-07, "uptime": 210451.704315459, "examples_seen": 114073600.0, "progress": 0.9893164480520057, "epoch": 89.03882163683579, "img/sec/core": 549.5742372591061, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 58.43700636421417, "core_hours": 58.43700636421417} {"step": 111450, "l2_params": 342.29094041564264, "train/loss": 2.1593473851680756, "l2_grads": 2.265625, "lr": 3.120944658582289e-07, "uptime": 210546.79128379602, "examples_seen": 114124800.0, "progress": 0.9897604859550811, "epoch": 89.07878520130475, "img/sec/core": 538.4544369795753, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 58.463419410974446, "core_hours": 58.463419410974446} {"step": 111500, "l2_params": 342.29094041564264, "train/loss": 2.6156850457191467, "l2_grads": 2.203125, "lr": 2.856382920732896e-07, "uptime": 210639.986830232, "examples_seen": 114176000.0, "progress": 0.9902045238581565, "epoch": 89.1187487657737, "img/sec/core": 549.3824754294728, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 58.48930706276222, "core_hours": 58.48930706276222} {"step": 111550, "l2_params": 342.29094041564264, "train/loss": 2.646580159664154, "l2_grads": 2.1875, "lr": 2.6035334611457464e-07, "uptime": 210734.091228128, "examples_seen": 114227200.0, "progress": 0.990648561761232, "epoch": 89.15871233024266, "img/sec/core": 544.076590942962, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 58.51544717328889, "core_hours": 58.51544717328889} {"step": 111600, "l2_params": 342.29094041564264, "train/loss": 2.1885318756103516, "l2_grads": 2.296875, "lr": 2.3623968724484547e-07, "uptime": 210827.22586194202, "examples_seen": 114278400.0, "progress": 0.9910925996643073, "epoch": 89.19867589471161, "img/sec/core": 549.7417867368695, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 58.54131790490389, "core_hours": 58.54131790490389} {"step": 111650, "l2_params": 342.29094041564264, "train/loss": 2.208272099494934, "l2_grads": 2.296875, "lr": 2.1329737198150412e-07, "uptime": 210921.653758308, "examples_seen": 114329600.0, "progress": 0.9915366375673828, "epoch": 89.23863945918058, "img/sec/core": 542.2126508204327, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 58.56754787611667, "core_hours": 58.56754787611667} {"step": 111700, "l2_params": 342.29094041564264, "train/loss": 2.188948094844818, "l2_grads": 2.421875, "lr": 1.9152645409675932e-07, "uptime": 211015.381190384, "examples_seen": 114380800.0, "progress": 0.9919806754704582, "epoch": 89.27860302364954, "img/sec/core": 546.2648326744032, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 58.593583273915556, "core_hours": 58.593583273915556} {"step": 111750, "l2_params": 342.29094041564264, "train/loss": 4.32533073425293, "l2_grads": 2.09375, "lr": 1.7092698461707176e-07, "uptime": 211109.152385916, "examples_seen": 114432000.0, "progress": 0.9924247133735336, "epoch": 89.31856658811849, "img/sec/core": 546.0098883193733, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 58.61963082823, "core_hours": 58.61963082823} {"step": 111800, "l2_params": 342.29094041564264, "train/loss": 3.8392317295074463, "l2_grads": 2.015625, "lr": 1.5149901182337641e-07, "uptime": 211203.370766843, "examples_seen": 114483200.0, "progress": 0.992868751276609, "epoch": 89.35853015258745, "img/sec/core": 543.4183807475315, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 58.64580260070972, "core_hours": 58.64580260070972} {"step": 111850, "l2_params": 342.29094041564264, "train/loss": 2.196939468383789, "l2_grads": 2.21875, "lr": 1.3324258125085988e-07, "uptime": 211297.052800779, "examples_seen": 114534400.0, "progress": 0.9933127891796844, "epoch": 89.3984937170564, "img/sec/core": 546.529551599817, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 58.67182538791417, "core_hours": 58.67182538791417} {"step": 111900, "l2_params": 342.29094041564264, "train/loss": 2.2707661390304565, "l2_grads": 2.40625, "lr": 1.1615773568890532e-07, "uptime": 211390.219106083, "examples_seen": 114585600.0, "progress": 0.9937568270827598, "epoch": 89.43845728152536, "img/sec/core": 549.5549043501267, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 58.69770491716528, "core_hours": 58.69770491716528} {"step": 111950, "l2_params": 342.29094041564264, "train/loss": 4.648118495941162, "l2_grads": 2.046875, "lr": 1.0024451518075941e-07, "uptime": 211485.643436864, "examples_seen": 114636800.0, "progress": 0.9942008649858352, "epoch": 89.47842084599432, "img/sec/core": 536.5507893109018, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 58.72421167571555, "core_hours": 58.72421167571555} {"step": 112000, "l2_params": 342.29094041564264, "train/loss": 4.072975754737854, "l2_grads": 2.046875, "lr": 8.550295702386487e-08, "uptime": 211578.922442507, "examples_seen": 114688000.0, "progress": 0.9946449028889106, "epoch": 89.51838441046327, "img/sec/core": 548.8909283183065, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 58.750122510616386, "core_hours": 58.750122510616386} {"step": 112050, "l2_params": 342.29094041564264, "train/loss": 2.111414611339569, "l2_grads": 2.421875, "lr": 7.193309576930607e-08, "uptime": 211673.783503319, "examples_seen": 114739200.0, "progress": 0.995088940791986, "epoch": 89.55834797493223, "img/sec/core": 539.7367429979995, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 58.77647280528639, "core_hours": 58.77647280528639} {"step": 112100, "l2_params": 342.29094041564264, "train/loss": 2.9602622985839844, "l2_grads": 2.21875, "lr": 5.9534963222085965e-08, "uptime": 211766.821787431, "examples_seen": 114790400.0, "progress": 0.9955329786950614, "epoch": 89.59831153940118, "img/sec/core": 550.3110949291014, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 58.80231677309528, "core_hours": 58.80231677309528} {"step": 112150, "l2_params": 342.29094041564264, "train/loss": 2.594558596611023, "l2_grads": 2.15625, "lr": 4.8308588440904485e-08, "uptime": 211861.143765357, "examples_seen": 114841600.0, "progress": 0.9959770165981369, "epoch": 89.63827510387014, "img/sec/core": 542.8215260727777, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 58.82851732251916, "core_hours": 58.82851732251916} {"step": 112200, "l2_params": 342.29094041564264, "train/loss": 2.199849009513855, "l2_grads": 2.25, "lr": 3.825399773810282e-08, "uptime": 211954.914593876, "examples_seen": 114892800.0, "progress": 0.9964210545012122, "epoch": 89.6782386683391, "img/sec/core": 546.0120253670644, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 58.85456477488555, "core_hours": 58.85456477488555} {"step": 112250, "l2_params": 342.29094041564264, "train/loss": 2.216042935848236, "l2_grads": 2.4375, "lr": 2.9371214679496948e-08, "uptime": 212048.605026271, "examples_seen": 114944000.0, "progress": 0.9968650924042877, "epoch": 89.71820223280805, "img/sec/core": 546.4805604070654, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 58.880589894995275, "core_hours": 58.880589894995275} {"step": 112300, "l2_params": 342.29094041564264, "train/loss": 2.0094719529151917, "l2_grads": 2.34375, "lr": 2.1660260084544132e-08, "uptime": 212142.315790895, "examples_seen": 114995200.0, "progress": 0.997309130307363, "epoch": 89.75816579727702, "img/sec/core": 546.3619916605103, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 58.90662066294639, "core_hours": 58.90662066294639} {"step": 112350, "l2_params": 342.29094041564264, "train/loss": 3.213792085647583, "l2_grads": 2.046875, "lr": 1.5121152026120887e-08, "uptime": 212235.990262303, "examples_seen": 115046400.0, "progress": 0.9977531682104385, "epoch": 89.79812936174596, "img/sec/core": 546.5736740268457, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 58.932641349448616, "core_hours": 58.932641349448616} {"step": 112400, "l2_params": 342.29094041564264, "train/loss": 4.742911219596863, "l2_grads": 2.203125, "lr": 9.753905830634049e-09, "uptime": 212329.643585274, "examples_seen": 115097600.0, "progress": 0.9981972061135138, "epoch": 89.83809292621493, "img/sec/core": 546.6970992140879, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 58.958656161384994, "core_hours": 58.958656161384994} {"step": 112450, "l2_params": 342.29094041564264, "train/loss": 2.6904194355010986, "l2_grads": 2.078125, "lr": 5.5585340776876375e-09, "uptime": 212423.944206413, "examples_seen": 115148800.0, "progress": 0.9986412440165893, "epoch": 89.87805649068389, "img/sec/core": 542.9444618877919, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 58.98485077836805, "core_hours": 58.98485077836805} {"step": 112500, "l2_params": 342.29094041564264, "train/loss": 2.9611271023750305, "l2_grads": 2.078125, "lr": 2.5350466004714607e-09, "uptime": 212517.061204017, "examples_seen": 115200000.0, "progress": 0.9990852819196646, "epoch": 89.91802005515284, "img/sec/core": 549.8459069496736, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 59.01071661103583, "core_hours": 59.01071661103583} {"step": 112550, "l2_params": 342.29094041564264, "train/loss": 2.003170132637024, "l2_grads": 2.21875, "lr": 6.834504853170453e-10, "uptime": 212611.447955518, "examples_seen": 115251200.0, "progress": 0.9995293198227401, "epoch": 89.9579836196218, "img/sec/core": 542.4490109658478, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 59.036935153119444, "core_hours": 59.036935153119444} {"step": 112603, "l2_params": 342.29094041564264, "train/loss": 2.5168460607528687, "l2_grads": 2.265625, "lr": 2.3437951579552636e-13, "uptime": 212711.46330443, "examples_seen": 115305472.0, "progress": 1.0, "epoch": 90.00034499795889, "img/sec/core": 542.6367111686525, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 59.0647171944839, "core_hours": 59.0647171944839, "val/acc@1": 0.6655970982142857, "val/loss": 1.374718103785904, "z/secs/eval/val": 31.63136170897633} {"step": 112603, "l2_params": 342.29094041564264, "train/loss": 2.5168460607528687, "l2_grads": 2.265625, "lr": 2.3437951579552636e-13, "uptime": 212711.46330443, "examples_seen": 115305472.0, "progress": 1.0, "epoch": 90.00034499795889, "img/sec/core": 542.6367111686525, "core_hours_NVIDIA GeForce RTX 3080 Laptop GPU": 59.0647171944839, "core_hours": 59.0647171944839, "val/acc@1": 0.6655970982142857, "val/loss": 1.374718103785904, "z/secs/eval/val": 31.63136170897633}