{"step": 1, "z/secs/update0": 38.605508919001295, "global_schedule": 0.0, "l2_grads": 0.5865829586982727, "l2_params": 207.7718963623047, "l2_updates": 0.0, "train/loss": 6.907753944396973, "uptime": 212.13397713300037, "examples_seen": 1024.0, "progress": 8.88075806150813e-06, "epoch": 0.0007992712893791364} {"step": 2, "global_schedule": 9.999999747378752e-05, "l2_grads": 0.5653113126754761, "l2_params": 207.7718963623047, "l2_updates": 4.5738121116301045e-05, "train/loss": 6.907756328582764, "uptime": 213.31079859800047, "examples_seen": 2048.0, "progress": 1.776151612301626e-05, "epoch": 0.0015985425787582727} {"step": 50, "global_schedule": 0.004900000058114529, "l2_grads": 0.5577670335769653, "l2_params": 207.77073669433594, "l2_updates": 0.016196411103010178, "train/loss": 6.9073615074157715, "uptime": 223.0159139770003, "examples_seen": 51200.0, "progress": 0.0004440379030754065, "epoch": 0.03996356446895682, "img/sec/core": 633.0682078540289, "core_hours_NVIDIA A100-SXM4-40GB": 0.021566923064444077, "core_hours": 0.021566923064444077} {"step": 100, "global_schedule": 0.00989999994635582, "l2_grads": 0.5222258567810059, "l2_params": 207.76840209960938, "l2_updates": 0.023266982287168503, "train/loss": 6.905587196350098, "uptime": 233.43224744800136, "examples_seen": 102400.0, "progress": 0.000888075806150813, "epoch": 0.07992712893791364, "img/sec/core": 614.4196533086737, "core_hours_NVIDIA A100-SXM4-40GB": 0.044714330777779754, "core_hours": 0.044714330777779754} {"step": 150, "global_schedule": 0.01489999983459711, "l2_grads": 0.640091061592102, "l2_params": 207.76898193359375, "l2_updates": 0.03736286237835884, "train/loss": 6.890203952789307, "uptime": 243.82809590600118, "examples_seen": 153600.0, "progress": 0.0013321137092262196, "epoch": 0.11989069340687046, "img/sec/core": 615.6303668581345, "core_hours_NVIDIA A100-SXM4-40GB": 0.06781621624000157, "core_hours": 0.06781621624000157} {"step": 200, "global_schedule": 0.019899999722838402, "l2_grads": 0.6705377101898193, "l2_params": 207.7796173095703, "l2_updates": 0.056803371757268906, "train/loss": 6.872468948364258, "uptime": 254.20368234200032, "examples_seen": 204800.0, "progress": 0.001776151612301626, "epoch": 0.15985425787582727, "img/sec/core": 616.832604063184, "core_hours_NVIDIA A100-SXM4-40GB": 0.09087307498666633, "core_hours": 0.09087307498666633} {"step": 250, "global_schedule": 0.024899998679757118, "l2_grads": 0.7111495137214661, "l2_params": 207.78944396972656, "l2_updates": 0.05303599312901497, "train/loss": 6.850142478942871, "uptime": 264.66288094800075, "examples_seen": 256000.0, "progress": 0.0022201895153770327, "epoch": 0.1998178223447841, "img/sec/core": 611.9015654151867, "core_hours_NVIDIA A100-SXM4-40GB": 0.11411573855555616, "core_hours": 0.11411573855555616} {"step": 300, "global_schedule": 0.029899999499320984, "l2_grads": 0.5904300212860107, "l2_params": 207.79898071289062, "l2_updates": 0.05759379640221596, "train/loss": 6.835823059082031, "uptime": 275.0690463150004, "examples_seen": 307200.0, "progress": 0.0026642274184524393, "epoch": 0.23978138681374092, "img/sec/core": 615.0200169118865, "core_hours_NVIDIA A100-SXM4-40GB": 0.137240550482222, "core_hours": 0.137240550482222} {"step": 350, "global_schedule": 0.0348999984562397, "l2_grads": 0.6441176533699036, "l2_params": 207.8090057373047, "l2_updates": 0.06642083078622818, "train/loss": 6.837291717529297, "uptime": 285.51449228599995, "examples_seen": 358400.0, "progress": 0.003108265321527846, "epoch": 0.2797449512826977, "img/sec/core": 612.7072044380653, "core_hours_NVIDIA A100-SXM4-40GB": 0.16045265263999883, "core_hours": 0.16045265263999883} {"step": 400, "global_schedule": 0.03989999741315842, "l2_grads": 0.7254522442817688, "l2_params": 207.81951904296875, "l2_updates": 0.06559193879365921, "train/loss": 6.766262531280518, "uptime": 296.0862381980005, "examples_seen": 409600.0, "progress": 0.003552303224603252, "epoch": 0.31970851575165454, "img/sec/core": 605.3872324660224, "core_hours_NVIDIA A100-SXM4-40GB": 0.18394542133333341, "core_hours": 0.18394542133333341} {"step": 450, "global_schedule": 0.04490000009536743, "l2_grads": 0.657137930393219, "l2_params": 207.82806396484375, "l2_updates": 0.09094572812318802, "train/loss": 6.795753002166748, "uptime": 306.65117916300005, "examples_seen": 460800.0, "progress": 0.003996341127678659, "epoch": 0.35967208022061137, "img/sec/core": 605.7771663090663, "core_hours_NVIDIA A100-SXM4-40GB": 0.20742306792222126, "core_hours": 0.20742306792222126} {"step": 500, "global_schedule": 0.04989999905228615, "l2_grads": 0.9686818718910217, "l2_params": 207.8369140625, "l2_updates": 0.09892964363098145, "train/loss": 6.796996116638184, "uptime": 317.25585022000087, "examples_seen": 512000.0, "progress": 0.0044403790307540655, "epoch": 0.3996356446895682, "img/sec/core": 603.5076397560634, "core_hours_NVIDIA A100-SXM4-40GB": 0.23098900360444533, "core_hours": 0.23098900360444533} {"step": 550, "global_schedule": 0.054899998009204865, "l2_grads": 1.4972199201583862, "l2_params": 207.84521484375, "l2_updates": 0.08984144777059555, "train/loss": 6.665750026702881, "uptime": 327.7813402740012, "examples_seen": 563200.0, "progress": 0.004884416933829472, "epoch": 0.439599209158525, "img/sec/core": 608.0476982226219, "core_hours_NVIDIA A100-SXM4-40GB": 0.2543789815022238, "core_hours": 0.2543789815022238} {"step": 600, "global_schedule": 0.05989999696612358, "l2_grads": 1.278633713722229, "l2_params": 207.84339904785156, "l2_updates": 0.09109123051166534, "train/loss": 6.624872207641602, "uptime": 338.46725385600075, "examples_seen": 614400.0, "progress": 0.0053284548369048786, "epoch": 0.47956277362748184, "img/sec/core": 598.9193110059222, "core_hours_NVIDIA A100-SXM4-40GB": 0.2781254561288895, "core_hours": 0.2781254561288895} {"step": 650, "global_schedule": 0.0648999959230423, "l2_grads": 1.1237664222717285, "l2_params": 207.84339904785156, "l2_updates": 0.08300457894802094, "train/loss": 6.7081193923950195, "uptime": 349.03674676300034, "examples_seen": 665600.0, "progress": 0.005772492739980285, "epoch": 0.5195263380964387, "img/sec/core": 605.5162774896833, "core_hours_NVIDIA A100-SXM4-40GB": 0.30161321814444414, "core_hours": 0.30161321814444414} {"step": 700, "global_schedule": 0.06989999860525131, "l2_grads": 1.7115908861160278, "l2_params": 207.8311309814453, "l2_updates": 0.0902533158659935, "train/loss": 6.6014723777771, "uptime": 359.7347034890008, "examples_seen": 716800.0, "progress": 0.006216530643055692, "epoch": 0.5594899025653954, "img/sec/core": 598.2450821141703, "core_hours_NVIDIA A100-SXM4-40GB": 0.32538645531333416, "core_hours": 0.32538645531333416} {"step": 750, "global_schedule": 0.07490000128746033, "l2_grads": 0.8147153854370117, "l2_params": 207.82066345214844, "l2_updates": 0.09375308454036713, "train/loss": 6.7318549156188965, "uptime": 370.3128130900004, "examples_seen": 768000.0, "progress": 0.006660568546131097, "epoch": 0.5994534670343523, "img/sec/core": 605.023037329394, "core_hours_NVIDIA A100-SXM4-40GB": 0.3488933655377776, "core_hours": 0.3488933655377776} {"step": 800, "global_schedule": 0.07989999651908875, "l2_grads": 1.259162187576294, "l2_params": 207.8129119873047, "l2_updates": 0.10623602569103241, "train/loss": 6.537596225738525, "uptime": 380.84645218600053, "examples_seen": 819200.0, "progress": 0.007104606449206504, "epoch": 0.6394170315033091, "img/sec/core": 607.577299893466, "core_hours_NVIDIA A100-SXM4-40GB": 0.3723014524177779, "core_hours": 0.3723014524177779} {"step": 850, "global_schedule": 0.08489999920129776, "l2_grads": 1.2817261219024658, "l2_params": 207.80137634277344, "l2_updates": 0.10764996707439423, "train/loss": 6.505598545074463, "uptime": 391.43153740300113, "examples_seen": 870400.0, "progress": 0.00754864435228191, "epoch": 0.679380595972266, "img/sec/core": 604.6243245846548, "core_hours_NVIDIA A100-SXM4-40GB": 0.3958238640111126, "core_hours": 0.3958238640111126} {"step": 900, "global_schedule": 0.08989999443292618, "l2_grads": 1.5574201345443726, "l2_params": 207.77993774414062, "l2_updates": 0.11691944301128387, "train/loss": 6.470272541046143, "uptime": 402.1706101150012, "examples_seen": 921600.0, "progress": 0.007992682255357318, "epoch": 0.7193441604412227, "img/sec/core": 595.9546202577168, "core_hours_NVIDIA A100-SXM4-40GB": 0.4196884700377793, "core_hours": 0.4196884700377793} {"step": 950, "global_schedule": 0.09489999711513519, "l2_grads": 1.08329176902771, "l2_params": 207.75526428222656, "l2_updates": 0.14020879566669464, "train/loss": 6.480486869812012, "uptime": 412.35153096199974, "examples_seen": 972800.0, "progress": 0.008436720158432724, "epoch": 0.7593077249101795, "img/sec/core": 628.6268301444251, "core_hours_NVIDIA A100-SXM4-40GB": 0.44231273858666503, "core_hours": 0.44231273858666503} {"step": 1000, "global_schedule": 0.09989999979734421, "l2_grads": 1.3083912134170532, "l2_params": 207.73338317871094, "l2_updates": 0.11800455302000046, "train/loss": 6.468853950500488, "uptime": 421.6471941110012, "examples_seen": 1024000.0, "progress": 0.008880758061508131, "epoch": 0.7992712893791364, "img/sec/core": 688.4931066685082, "core_hours_NVIDIA A100-SXM4-40GB": 0.4629697678066683, "core_hours": 0.4629697678066683} {"step": 1050, "global_schedule": 0.10489999502897263, "l2_grads": 0.9634691476821899, "l2_params": 207.7014617919922, "l2_updates": 0.1372220814228058, "train/loss": 6.427849769592285, "uptime": 431.4349229520012, "examples_seen": 1075200.0, "progress": 0.009324795964583537, "epoch": 0.8392348538480932, "img/sec/core": 712.95738015606, "core_hours_NVIDIA A100-SXM4-40GB": 0.4829179759577771, "core_hours": 0.4829179759577771} {"step": 1100, "global_schedule": 0.10989999771118164, "l2_grads": 1.8411287069320679, "l2_params": 207.6746368408203, "l2_updates": 0.12977157533168793, "train/loss": 6.747613430023193, "uptime": 440.9499605150013, "examples_seen": 1126400.0, "progress": 0.009768833867658944, "epoch": 0.87919841831705, "img/sec/core": 672.6195201674105, "core_hours_NVIDIA A100-SXM4-40GB": 0.504062503875555, "core_hours": 0.504062503875555} {"step": 1150, "global_schedule": 0.11490000039339066, "l2_grads": 2.1191017627716064, "l2_params": 207.63949584960938, "l2_updates": 0.11844266951084137, "train/loss": 6.339458465576172, "uptime": 450.2215731190008, "examples_seen": 1177600.0, "progress": 0.01021287177073435, "epoch": 0.9191619827860068, "img/sec/core": 690.2790564436665, "core_hours_NVIDIA A100-SXM4-40GB": 0.5246660874399984, "core_hours": 0.5246660874399984} {"step": 1200, "global_schedule": 0.11989999562501907, "l2_grads": 1.6981121301651, "l2_params": 207.6151123046875, "l2_updates": 0.1465073525905609, "train/loss": 6.393484115600586, "uptime": 459.78423140000086, "examples_seen": 1228800.0, "progress": 0.010656909673809757, "epoch": 0.9591255472549637, "img/sec/core": 669.2699678201512, "core_hours_NVIDIA A100-SXM4-40GB": 0.5459164391755541, "core_hours": 0.5459164391755541} {"step": 1250, "global_schedule": 0.12489999830722809, "l2_grads": 2.5395119190216064, "l2_params": 207.59507751464844, "l2_updates": 0.12699146568775177, "train/loss": 6.3393354415893555, "uptime": 469.2894221890001, "examples_seen": 1280000.0, "progress": 0.011100947576885163, "epoch": 0.9990891117239205, "img/sec/core": 673.316311273519, "core_hours_NVIDIA A100-SXM4-40GB": 0.5670390853733301, "core_hours": 0.5670390853733301} {"step": 1300, "global_schedule": 0.1298999935388565, "l2_grads": 1.9179892539978027, "l2_params": 207.5568389892578, "l2_updates": 0.15819358825683594, "train/loss": 6.3552632331848145, "uptime": 479.5368690940013, "examples_seen": 1331200.0, "progress": 0.01154498547996057, "epoch": 1.0390526761928773, "img/sec/core": 624.5458072953296, "core_hours_NVIDIA A100-SXM4-40GB": 0.5898111896066661, "core_hours": 0.5898111896066661} {"step": 1350, "global_schedule": 0.13490000367164612, "l2_grads": 1.5064588785171509, "l2_params": 207.5205841064453, "l2_updates": 0.1689976304769516, "train/loss": 6.594691276550293, "uptime": 488.74166599900127, "examples_seen": 1382400.0, "progress": 0.011989023383035976, "epoch": 1.079016240661834, "img/sec/core": 695.2896480012041, "core_hours_NVIDIA A100-SXM4-40GB": 0.6102662938399993, "core_hours": 0.6102662938399993} {"step": 1400, "global_schedule": 0.13989999890327454, "l2_grads": 1.530970811843872, "l2_params": 207.48435974121094, "l2_updates": 0.1419948935508728, "train/loss": 6.259324550628662, "uptime": 497.55591239000023, "examples_seen": 1433600.0, "progress": 0.012433061286111383, "epoch": 1.1189798051307909, "img/sec/core": 726.097242588502, "core_hours_NVIDIA A100-SXM4-40GB": 0.6298535080422193, "core_hours": 0.6298535080422193} {"step": 1450, "global_schedule": 0.14489999413490295, "l2_grads": 1.9207345247268677, "l2_params": 207.46621704101562, "l2_updates": 0.1371823102235794, "train/loss": 6.545238971710205, "uptime": 506.244358594, "examples_seen": 1484800.0, "progress": 0.012877099189186789, "epoch": 1.1589433695997478, "img/sec/core": 736.6104191395839, "core_hours_NVIDIA A100-SXM4-40GB": 0.64916116627333, "core_hours": 0.64916116627333} {"step": 1500, "global_schedule": 0.14989998936653137, "l2_grads": 1.8604434728622437, "l2_params": 207.44520568847656, "l2_updates": 0.17030999064445496, "train/loss": 6.173192977905273, "uptime": 515.2977974920013, "examples_seen": 1536000.0, "progress": 0.013321137092262195, "epoch": 1.1989069340687046, "img/sec/core": 706.913701202853, "core_hours_NVIDIA A100-SXM4-40GB": 0.6692799193799995, "core_hours": 0.6692799193799995} {"step": 1550, "global_schedule": 0.15489999949932098, "l2_grads": 1.6682862043380737, "l2_params": 207.40240478515625, "l2_updates": 0.15580937266349792, "train/loss": 6.308918476104736, "uptime": 523.922089093001, "examples_seen": 1587200.0, "progress": 0.013765174995337602, "epoch": 1.2388704985376613, "img/sec/core": 742.0899357412934, "core_hours_NVIDIA A100-SXM4-40GB": 0.6884450118266654, "core_hours": 0.6884450118266654} {"step": 1600, "global_schedule": 0.1598999947309494, "l2_grads": 1.5370688438415527, "l2_params": 207.3639678955078, "l2_updates": 0.17708253860473633, "train/loss": 6.2307047843933105, "uptime": 532.5466877859999, "examples_seen": 1638400.0, "progress": 0.014209212898413008, "epoch": 1.2788340630066182, "img/sec/core": 742.0635124965581, "core_hours_NVIDIA A100-SXM4-40GB": 0.7076107866999963, "core_hours": 0.7076107866999963} {"step": 1650, "global_schedule": 0.16489998996257782, "l2_grads": 1.621561884880066, "l2_params": 207.32652282714844, "l2_updates": 0.17671437561511993, "train/loss": 6.448636054992676, "uptime": 541.5437051440003, "examples_seen": 1689600.0, "progress": 0.014653250801488415, "epoch": 1.318797627475575, "img/sec/core": 711.3468547783679, "core_hours_NVIDIA A100-SXM4-40GB": 0.7276041586066639, "core_hours": 0.7276041586066639} {"step": 1700, "global_schedule": 0.16990000009536743, "l2_grads": 1.226978063583374, "l2_params": 207.2808074951172, "l2_updates": 0.1985219419002533, "train/loss": 6.711350440979004, "uptime": 550.011184242001, "examples_seen": 1740800.0, "progress": 0.01509728870456382, "epoch": 1.358761191944532, "img/sec/core": 755.8329847558928, "core_hours_NVIDIA A100-SXM4-40GB": 0.7464207788244434, "core_hours": 0.7464207788244434} {"step": 1750, "global_schedule": 0.17489999532699585, "l2_grads": 1.4367767572402954, "l2_params": 207.24612426757812, "l2_updates": 0.19266347587108612, "train/loss": 6.511279582977295, "uptime": 558.6970191270011, "examples_seen": 1792000.0, "progress": 0.015541326607639228, "epoch": 1.3987247564134886, "img/sec/core": 736.8318745101201, "core_hours_NVIDIA A100-SXM4-40GB": 0.7657226341244435, "core_hours": 0.7657226341244435} {"step": 1800, "global_schedule": 0.17989999055862427, "l2_grads": 1.6059099435806274, "l2_params": 207.2095184326172, "l2_updates": 0.20982380211353302, "train/loss": 6.134070873260498, "uptime": 567.8784460349998, "examples_seen": 1843200.0, "progress": 0.015985364510714636, "epoch": 1.4386883208824455, "img/sec/core": 697.0594074461827, "core_hours_NVIDIA A100-SXM4-40GB": 0.7861258050311072, "core_hours": 0.7861258050311072} {"step": 1850, "global_schedule": 0.18490000069141388, "l2_grads": 1.2044209241867065, "l2_params": 207.1824951171875, "l2_updates": 0.21917115151882172, "train/loss": 6.256562232971191, "uptime": 577.3723501430013, "examples_seen": 1894400.0, "progress": 0.01642940241379004, "epoch": 1.4786518853514024, "img/sec/core": 674.116772951819, "core_hours_NVIDIA A100-SXM4-40GB": 0.807223369715555, "core_hours": 0.807223369715555} {"step": 1900, "global_schedule": 0.1898999959230423, "l2_grads": 1.3524847030639648, "l2_params": 207.15829467773438, "l2_updates": 0.22725936770439148, "train/loss": 6.190034866333008, "uptime": 586.8749335230004, "examples_seen": 1945600.0, "progress": 0.016873440316865447, "epoch": 1.518615449820359, "img/sec/core": 673.5010621922678, "core_hours_NVIDIA A100-SXM4-40GB": 0.8283402216711087, "core_hours": 0.8283402216711087} {"step": 1950, "global_schedule": 0.19489999115467072, "l2_grads": 1.366194248199463, "l2_params": 207.1477508544922, "l2_updates": 0.2316821664571762, "train/loss": 6.671849250793457, "uptime": 596.3951751240002, "examples_seen": 1996800.0, "progress": 0.017317478219940854, "epoch": 1.558579014289316, "img/sec/core": 672.251846983372, "core_hours_NVIDIA A100-SXM4-40GB": 0.8494963141177746, "core_hours": 0.8494963141177746} {"step": 2000, "global_schedule": 0.19990000128746033, "l2_grads": 1.592488169670105, "l2_params": 207.13682556152344, "l2_updates": 0.2495422512292862, "train/loss": 6.0666069984436035, "uptime": 605.2966644600001, "examples_seen": 2048000.0, "progress": 0.017761516123016262, "epoch": 1.5985425787582728, "img/sec/core": 718.9808085391659, "core_hours_NVIDIA A100-SXM4-40GB": 0.8692774015311079, "core_hours": 0.8692774015311079} {"step": 2050, "global_schedule": 0.20489999651908875, "l2_grads": 1.694317102432251, "l2_params": 207.1298828125, "l2_updates": 0.22725333273410797, "train/loss": 6.077362537384033, "uptime": 614.5707909450011, "examples_seen": 2099200.0, "progress": 0.018205554026091666, "epoch": 1.6385061432272296, "img/sec/core": 755.7846951045467, "core_hours_NVIDIA A100-SXM4-40GB": 0.8880952240066674, "core_hours": 0.8880952240066674} {"step": 2100, "global_schedule": 0.20989999175071716, "l2_grads": 1.4432029724121094, "l2_params": 207.115478515625, "l2_updates": 0.24569854140281677, "train/loss": 6.658808708190918, "uptime": 623.5052457729998, "examples_seen": 2150400.0, "progress": 0.018649591929167073, "epoch": 1.6784697076961863, "img/sec/core": 716.3279823122216, "core_hours_NVIDIA A100-SXM4-40GB": 0.9079495680688867, "core_hours": 0.9079495680688867} {"step": 2150, "global_schedule": 0.21490000188350677, "l2_grads": 1.2065236568450928, "l2_params": 207.0861358642578, "l2_updates": 0.28416305780410767, "train/loss": 6.207632541656494, "uptime": 633.0468416650001, "examples_seen": 2201600.0, "progress": 0.01909362983224248, "epoch": 1.7184332721651432, "img/sec/core": 670.7473333015292, "core_hours_NVIDIA A100-SXM4-40GB": 0.9291531144955539, "core_hours": 0.9291531144955539} {"step": 2200, "global_schedule": 0.2198999971151352, "l2_grads": 1.856994390487671, "l2_params": 207.08822631835938, "l2_updates": 0.2552189528942108, "train/loss": 6.030084133148193, "uptime": 642.7341108540004, "examples_seen": 2252800.0, "progress": 0.019537667735317888, "epoch": 1.7583968366341, "img/sec/core": 660.6609019667874, "core_hours_NVIDIA A100-SXM4-40GB": 0.9506803793599992, "core_hours": 0.9506803793599992} {"step": 2250, "global_schedule": 0.2248999923467636, "l2_grads": 2.1021735668182373, "l2_params": 207.10765075683594, "l2_updates": 0.2386227548122406, "train/loss": 6.065042972564697, "uptime": 651.9592744110014, "examples_seen": 2304000.0, "progress": 0.019981705638393292, "epoch": 1.7983604011030567, "img/sec/core": 693.754637568786, "core_hours_NVIDIA A100-SXM4-40GB": 0.9711807428200013, "core_hours": 0.9711807428200013} {"step": 2300, "global_schedule": 0.22989998757839203, "l2_grads": 1.4236533641815186, "l2_params": 207.10888671875, "l2_updates": 0.2932097315788269, "train/loss": 5.961605548858643, "uptime": 661.4218600229997, "examples_seen": 2355200.0, "progress": 0.0204257435414687, "epoch": 1.8383239655720136, "img/sec/core": 676.3479098022616, "core_hours_NVIDIA A100-SXM4-40GB": 0.9922087108466642, "core_hours": 0.9922087108466642} {"step": 2350, "global_schedule": 0.23489999771118164, "l2_grads": 1.3539894819259644, "l2_params": 207.09078979492188, "l2_updates": 0.2930847406387329, "train/loss": 5.937834739685059, "uptime": 670.9255876250008, "examples_seen": 2406400.0, "progress": 0.020869781444544107, "epoch": 1.8782875300409705, "img/sec/core": 673.4199745637045, "core_hours_NVIDIA A100-SXM4-40GB": 1.0133281055177779, "core_hours": 1.0133281055177779} {"step": 2400, "global_schedule": 0.23989999294281006, "l2_grads": 1.9094294309616089, "l2_params": 207.10482788085938, "l2_updates": 0.2769569754600525, "train/loss": 6.717165946960449, "uptime": 679.5437222020009, "examples_seen": 2457600.0, "progress": 0.021313819347619514, "epoch": 1.9182510945099274, "img/sec/core": 742.6201044806372, "core_hours_NVIDIA A100-SXM4-40GB": 1.032479515688889, "core_hours": 1.032479515688889} {"step": 2450, "global_schedule": 0.24489998817443848, "l2_grads": 1.4950292110443115, "l2_params": 207.12034606933594, "l2_updates": 0.2981712222099304, "train/loss": 5.912501335144043, "uptime": 688.7185884379996, "examples_seen": 2508800.0, "progress": 0.021757857250694918, "epoch": 1.958214658978884, "img/sec/core": 697.5578537471009, "core_hours_NVIDIA A100-SXM4-40GB": 1.052868107324442, "core_hours": 1.052868107324442} {"step": 2500, "global_schedule": 0.2498999983072281, "l2_grads": 1.4590818881988525, "l2_params": 207.1592254638672, "l2_updates": 0.2789834439754486, "train/loss": 6.4360809326171875, "uptime": 698.5002182099997, "examples_seen": 2560000.0, "progress": 0.022201895153770326, "epoch": 1.998178223447841, "img/sec/core": 654.2876953204668, "core_hours_NVIDIA A100-SXM4-40GB": 1.0746050623733308, "core_hours": 1.0746050623733308, "val/acc@1": 0.06344, "val/loss": 5.507733486328125, "z/secs/eval/val": 6.181980656001542} {"step": 2550, "global_schedule": 0.2549000084400177, "l2_grads": 1.4777352809906006, "l2_params": 207.1964874267578, "l2_updates": 0.31919947266578674, "train/loss": 6.517998218536377, "uptime": 713.973116608, "examples_seen": 2611200.0, "progress": 0.022645933056845733, "epoch": 2.0381417879167976, "img/sec/core": 688.9091471306594, "core_hours_NVIDIA A100-SXM4-40GB": 1.0952496165666648, "core_hours": 1.0952496165666648} {"step": 2600, "global_schedule": 0.2599000036716461, "l2_grads": 1.316410779953003, "l2_params": 207.238525390625, "l2_updates": 0.32714763283729553, "train/loss": 5.925455570220947, "uptime": 722.8573966170006, "examples_seen": 2662400.0, "progress": 0.02308997095992114, "epoch": 2.0781053523857547, "img/sec/core": 720.373512937033, "core_hours_NVIDIA A100-SXM4-40GB": 1.1149924610311104, "core_hours": 1.1149924610311104} {"step": 2650, "global_schedule": 0.26489999890327454, "l2_grads": 1.4139888286590576, "l2_params": 207.2888946533203, "l2_updates": 0.3027748763561249, "train/loss": 5.844012260437012, "uptime": 731.9928691639998, "examples_seen": 2713600.0, "progress": 0.023534008862996544, "epoch": 2.1180689168547113, "img/sec/core": 700.5658401439005, "core_hours_NVIDIA A100-SXM4-40GB": 1.135293511135553, "core_hours": 1.135293511135553} {"step": 2700, "global_schedule": 0.26989999413490295, "l2_grads": 1.2960916757583618, "l2_params": 207.29827880859375, "l2_updates": 0.3176978528499603, "train/loss": 6.155135154724121, "uptime": 740.6604243490001, "examples_seen": 2764800.0, "progress": 0.023978046766071952, "epoch": 2.158032481323668, "img/sec/core": 738.3858381514038, "core_hours_NVIDIA A100-SXM4-40GB": 1.1545547448799982, "core_hours": 1.1545547448799982} {"step": 2750, "global_schedule": 0.27489998936653137, "l2_grads": 1.614317774772644, "l2_params": 207.35546875, "l2_updates": 0.29545706510543823, "train/loss": 6.318309783935547, "uptime": 749.3520569800003, "examples_seen": 2816000.0, "progress": 0.02442208466914736, "epoch": 2.197996045792625, "img/sec/core": 736.340371447974, "core_hours_NVIDIA A100-SXM4-40GB": 1.1738694840599986, "core_hours": 1.1738694840599986} {"step": 2800, "global_schedule": 0.2798999845981598, "l2_grads": 1.6128761768341064, "l2_params": 207.3966064453125, "l2_updates": 0.3367685377597809, "train/loss": 5.823238372802734, "uptime": 758.1033666300009, "examples_seen": 2867200.0, "progress": 0.024866122572222767, "epoch": 2.2379596102615817, "img/sec/core": 731.3191117628372, "core_hours_NVIDIA A100-SXM4-40GB": 1.1933168388377777, "core_hours": 1.1933168388377777} {"step": 2850, "global_schedule": 0.2848999798297882, "l2_grads": 1.6141501665115356, "l2_params": 207.44537353515625, "l2_updates": 0.3441261053085327, "train/loss": 5.920030117034912, "uptime": 767.396433201, "examples_seen": 2918400.0, "progress": 0.02531016047529817, "epoch": 2.277923174730539, "img/sec/core": 688.6854786957481, "core_hours_NVIDIA A100-SXM4-40GB": 1.2139680978844425, "core_hours": 1.2139680978844425} {"step": 2900, "global_schedule": 0.289900004863739, "l2_grads": 1.296355128288269, "l2_params": 207.5064239501953, "l2_updates": 0.335824191570282, "train/loss": 6.382574081420898, "uptime": 777.2630501479998, "examples_seen": 2969600.0, "progress": 0.025754198378373578, "epoch": 2.3178867391994955, "img/sec/core": 648.6519173064781, "core_hours_NVIDIA A100-SXM4-40GB": 1.2358939133222195, "core_hours": 1.2358939133222195} {"step": 2950, "global_schedule": 0.29490000009536743, "l2_grads": 1.4815248250961304, "l2_params": 207.58584594726562, "l2_updates": 0.35565492510795593, "train/loss": 5.977816104888916, "uptime": 786.2114829950006, "examples_seen": 3020800.0, "progress": 0.026198236281448985, "epoch": 2.357850303668452, "img/sec/core": 715.2090326235285, "core_hours_NVIDIA A100-SXM4-40GB": 1.255779319648888, "core_hours": 1.255779319648888} {"step": 3000, "global_schedule": 0.29989999532699585, "l2_grads": 1.6113698482513428, "l2_params": 207.6547393798828, "l2_updates": 0.3625665009021759, "train/loss": 5.687808513641357, "uptime": 794.9189868410012, "examples_seen": 3072000.0, "progress": 0.02664227418452439, "epoch": 2.3978138681374093, "img/sec/core": 734.9982398158211, "core_hours_NVIDIA A100-SXM4-40GB": 1.2751293281955562, "core_hours": 1.2751293281955562} {"step": 3050, "global_schedule": 0.30489999055862427, "l2_grads": 1.575883150100708, "l2_params": 207.7259063720703, "l2_updates": 0.3823453187942505, "train/loss": 6.16989803314209, "uptime": 805.1068230290002, "examples_seen": 3123200.0, "progress": 0.027086312087599797, "epoch": 2.437777432606366, "img/sec/core": 699.1908270240194, "core_hours_NVIDIA A100-SXM4-40GB": 1.2954703018933327, "core_hours": 1.2954703018933327} {"step": 3100, "global_schedule": 0.3098999857902527, "l2_grads": 1.2948908805847168, "l2_params": 207.81947326660156, "l2_updates": 0.38082173466682434, "train/loss": 5.8007588386535645, "uptime": 814.1374440520012, "examples_seen": 3174400.0, "progress": 0.027530349990675204, "epoch": 2.4777409970753226, "img/sec/core": 708.6998760881662, "core_hours_NVIDIA A100-SXM4-40GB": 1.3155383486111127, "core_hours": 1.3155383486111127} {"step": 3150, "global_schedule": 0.3148999810218811, "l2_grads": 1.4405272006988525, "l2_params": 207.90223693847656, "l2_updates": 0.39390039443969727, "train/loss": 5.80734395980835, "uptime": 823.6075193380002, "examples_seen": 3225600.0, "progress": 0.02797438789375061, "epoch": 2.5177045615442797, "img/sec/core": 675.813001134434, "core_hours_NVIDIA A100-SXM4-40GB": 1.3365829603577772, "core_hours": 1.3365829603577772} {"step": 3200, "global_schedule": 0.3199000060558319, "l2_grads": 1.6196181774139404, "l2_params": 207.9614715576172, "l2_updates": 0.3928675055503845, "train/loss": 5.739917755126953, "uptime": 832.1527575359996, "examples_seen": 3276800.0, "progress": 0.028418425796826016, "epoch": 2.5576681260132363, "img/sec/core": 748.9551317011083, "core_hours_NVIDIA A100-SXM4-40GB": 1.3555723785755538, "core_hours": 1.3555723785755538} {"step": 3250, "global_schedule": 0.3249000012874603, "l2_grads": 1.2572835683822632, "l2_params": 208.05943298339844, "l2_updates": 0.3606553375720978, "train/loss": 6.551417827606201, "uptime": 840.7448184040004, "examples_seen": 3328000.0, "progress": 0.028862463699901423, "epoch": 2.597631690482193, "img/sec/core": 744.8736802872735, "core_hours_NVIDIA A100-SXM4-40GB": 1.374665847171111, "core_hours": 1.374665847171111} {"step": 3300, "global_schedule": 0.32989999651908875, "l2_grads": 1.6140483617782593, "l2_params": 208.15261840820312, "l2_updates": 0.4250048100948334, "train/loss": 5.780648231506348, "uptime": 849.6884259369999, "examples_seen": 3379200.0, "progress": 0.02930650160297683, "epoch": 2.63759525495115, "img/sec/core": 715.59490690817, "core_hours_NVIDIA A100-SXM4-40GB": 1.3945405305777767, "core_hours": 1.3945405305777767} {"step": 3350, "global_schedule": 0.33489999175071716, "l2_grads": 1.2910959720611572, "l2_params": 208.28501892089844, "l2_updates": 0.4064769148826599, "train/loss": 6.114736557006836, "uptime": 858.6735041250013, "examples_seen": 3430400.0, "progress": 0.029750539506052238, "epoch": 2.6775588194201068, "img/sec/core": 712.2920764948425, "core_hours_NVIDIA A100-SXM4-40GB": 1.4145073709955573, "core_hours": 1.4145073709955573} {"step": 3400, "global_schedule": 0.3398999869823456, "l2_grads": 1.856823205947876, "l2_params": 208.3782196044922, "l2_updates": 0.3918739855289459, "train/loss": 6.26747465133667, "uptime": 867.7631859390003, "examples_seen": 3481600.0, "progress": 0.03019457740912764, "epoch": 2.717522383889064, "img/sec/core": 704.0950531561334, "core_hours_NVIDIA A100-SXM4-40GB": 1.4347066639155552, "core_hours": 1.4347066639155552} {"step": 3450, "global_schedule": 0.344899982213974, "l2_grads": 1.3156996965408325, "l2_params": 208.48941040039062, "l2_updates": 0.4450678825378418, "train/loss": 5.746856689453125, "uptime": 876.8166689990012, "examples_seen": 3532800.0, "progress": 0.03063861531220305, "epoch": 2.7574859483580205, "img/sec/core": 706.910252947376, "core_hours_NVIDIA A100-SXM4-40GB": 1.4548255151600016, "core_hours": 1.4548255151600016} {"step": 3500, "global_schedule": 0.3498999774456024, "l2_grads": 1.1290228366851807, "l2_params": 208.61691284179688, "l2_updates": 0.4082944393157959, "train/loss": 6.237624168395996, "uptime": 885.2807142180009, "examples_seen": 3584000.0, "progress": 0.031082653215278457, "epoch": 2.797449512826977, "img/sec/core": 756.1396276137083, "core_hours_NVIDIA A100-SXM4-40GB": 1.4736345045355566, "core_hours": 1.4736345045355566} {"step": 3550, "global_schedule": 0.3549000024795532, "l2_grads": 1.2374483346939087, "l2_params": 208.7517547607422, "l2_updates": 0.455348938703537, "train/loss": 5.513610363006592, "uptime": 893.8266365010004, "examples_seen": 3635200.0, "progress": 0.031526691118353864, "epoch": 2.8374130772959343, "img/sec/core": 748.8951792519307, "core_hours_NVIDIA A100-SXM4-40GB": 1.492625442942222, "core_hours": 1.492625442942222} {"step": 3600, "global_schedule": 0.35989999771118164, "l2_grads": 1.2032991647720337, "l2_params": 208.875732421875, "l2_updates": 0.4261053204536438, "train/loss": 6.167971611022949, "uptime": 902.6733964249997, "examples_seen": 3686400.0, "progress": 0.03197072902142927, "epoch": 2.877376641764891, "img/sec/core": 723.4286964923945, "core_hours_NVIDIA A100-SXM4-40GB": 1.5122849094399984, "core_hours": 1.5122849094399984} {"step": 3650, "global_schedule": 0.36489999294281006, "l2_grads": 1.4226988554000854, "l2_params": 208.97947692871094, "l2_updates": 0.4091397523880005, "train/loss": 5.726563930511475, "uptime": 911.743025617001, "examples_seen": 3737600.0, "progress": 0.03241476692450468, "epoch": 2.9173402062338476, "img/sec/core": 705.6517818439971, "core_hours_NVIDIA A100-SXM4-40GB": 1.5324396409777787, "core_hours": 1.5324396409777787} {"step": 3700, "global_schedule": 0.3698999881744385, "l2_grads": 1.8060100078582764, "l2_params": 209.1243133544922, "l2_updates": 0.4236809313297272, "train/loss": 5.502999782562256, "uptime": 920.2221581909998, "examples_seen": 3788800.0, "progress": 0.03285880482758008, "epoch": 2.9573037707028047, "img/sec/core": 754.7941896350935, "core_hours_NVIDIA A100-SXM4-40GB": 1.5512821578088876, "core_hours": 1.5512821578088876} {"step": 3750, "global_schedule": 0.3748999834060669, "l2_grads": 1.4139256477355957, "l2_params": 209.29376220703125, "l2_updates": 0.4402444064617157, "train/loss": 5.424935817718506, "uptime": 929.4883860720001, "examples_seen": 3840000.0, "progress": 0.03330284273065549, "epoch": 2.9972673351717614, "img/sec/core": 690.6801863919959, "core_hours_NVIDIA A100-SXM4-40GB": 1.5718737753222214, "core_hours": 1.5718737753222214} {"step": 3800, "global_schedule": 0.3798999786376953, "l2_grads": 1.151553750038147, "l2_params": 209.46951293945312, "l2_updates": 0.43273526430130005, "train/loss": 5.923369407653809, "uptime": 938.8334184530013, "examples_seen": 3891200.0, "progress": 0.033746880633730894, "epoch": 3.037230899640718, "img/sec/core": 684.8558398803921, "core_hours_NVIDIA A100-SXM4-40GB": 1.5926405139466686, "core_hours": 1.5926405139466686} {"step": 3850, "global_schedule": 0.3849000036716461, "l2_grads": 1.5911015272140503, "l2_params": 209.64588928222656, "l2_updates": 0.49186837673187256, "train/loss": 5.437906265258789, "uptime": 947.5261462260005, "examples_seen": 3942400.0, "progress": 0.0341909185368063, "epoch": 3.077194464109675, "img/sec/core": 736.2476045642738, "core_hours_NVIDIA A100-SXM4-40GB": 1.6119576867755554, "core_hours": 1.6119576867755554} {"step": 3900, "global_schedule": 0.38989999890327454, "l2_grads": 1.7020153999328613, "l2_params": 209.83680725097656, "l2_updates": 0.4726259708404541, "train/loss": 5.352508544921875, "uptime": 956.024121081, "examples_seen": 3993600.0, "progress": 0.03463495643988171, "epoch": 3.117158028578632, "img/sec/core": 753.120609227831, "core_hours_NVIDIA A100-SXM4-40GB": 1.6308420753422213, "core_hours": 1.6308420753422213} {"step": 3950, "global_schedule": 0.39489999413490295, "l2_grads": 1.4298309087753296, "l2_params": 210.00857543945312, "l2_updates": 0.4833565950393677, "train/loss": 5.686365127563477, "uptime": 964.644991696001, "examples_seen": 4044800.0, "progress": 0.035078994342957116, "epoch": 3.1571215930475884, "img/sec/core": 742.3844163562222, "core_hours_NVIDIA A100-SXM4-40GB": 1.6499995655977788, "core_hours": 1.6499995655977788} {"step": 4000, "global_schedule": 0.39989998936653137, "l2_grads": 1.468529224395752, "l2_params": 210.16282653808594, "l2_updates": 0.4919097423553467, "train/loss": 5.432093620300293, "uptime": 973.1620774479998, "examples_seen": 4096000.0, "progress": 0.035523032246032524, "epoch": 3.1970851575165455, "img/sec/core": 751.4307342154005, "core_hours_NVIDIA A100-SXM4-40GB": 1.6689264228244427, "core_hours": 1.6689264228244427} {"step": 4050, "global_schedule": 0.4048999845981598, "l2_grads": 1.3110672235488892, "l2_params": 210.35064697265625, "l2_updates": 0.49411070346832275, "train/loss": 5.57602071762085, "uptime": 982.0261610420002, "examples_seen": 4147200.0, "progress": 0.03596707014910793, "epoch": 3.237048721985502, "img/sec/core": 778.1980474703423, "core_hours_NVIDIA A100-SXM4-40GB": 1.6872022618199967, "core_hours": 1.6872022618199967} {"step": 4100, "global_schedule": 0.4098999798297882, "l2_grads": 1.150431752204895, "l2_params": 210.5728302001953, "l2_updates": 0.502150297164917, "train/loss": 6.219711780548096, "uptime": 991.3097380840009, "examples_seen": 4198400.0, "progress": 0.03641110805218333, "epoch": 3.2770122864544593, "img/sec/core": 689.3894423502082, "core_hours_NVIDIA A100-SXM4-40GB": 1.7078324330244423, "core_hours": 1.7078324330244423} {"step": 4150, "global_schedule": 0.4148999750614166, "l2_grads": 1.2499139308929443, "l2_params": 210.78965759277344, "l2_updates": 0.4716930389404297, "train/loss": 6.402318477630615, "uptime": 1000.8287513570012, "examples_seen": 4249600.0, "progress": 0.03685514595525874, "epoch": 3.316975850923416, "img/sec/core": 672.3385939751639, "core_hours_NVIDIA A100-SXM4-40GB": 1.7289857958533321, "core_hours": 1.7289857958533321} {"step": 4200, "global_schedule": 0.41990000009536743, "l2_grads": 1.521246075630188, "l2_params": 211.0115203857422, "l2_updates": 0.4985155463218689, "train/loss": 5.2539191246032715, "uptime": 1010.236390080001, "examples_seen": 4300800.0, "progress": 0.037299183858334146, "epoch": 3.3569394153923726, "img/sec/core": 680.2982330043459, "core_hours_NVIDIA A100-SXM4-40GB": 1.7498916596822205, "core_hours": 1.7498916596822205} {"step": 4250, "global_schedule": 0.42489999532699585, "l2_grads": 1.5953028202056885, "l2_params": 211.22415161132812, "l2_updates": 0.5156526565551758, "train/loss": 5.672638416290283, "uptime": 1019.5532883020005, "examples_seen": 4352000.0, "progress": 0.037743221761409554, "epoch": 3.3969029798613297, "img/sec/core": 686.9238932854297, "core_hours_NVIDIA A100-SXM4-40GB": 1.7705958779533304, "core_hours": 1.7705958779533304} {"step": 4300, "global_schedule": 0.42989999055862427, "l2_grads": 1.5048786401748657, "l2_params": 211.45408630371094, "l2_updates": 0.5028802752494812, "train/loss": 5.554953098297119, "uptime": 1028.984312849001, "examples_seen": 4403200.0, "progress": 0.03818725966448496, "epoch": 3.4368665443302864, "img/sec/core": 678.6113182194456, "core_hours_NVIDIA A100-SXM4-40GB": 1.7915537102799983, "core_hours": 1.7915537102799983} {"step": 4350, "global_schedule": 0.4348999857902527, "l2_grads": 1.0689373016357422, "l2_params": 211.6834716796875, "l2_updates": 0.5484316945075989, "train/loss": 6.42812967300415, "uptime": 1038.3782170260001, "examples_seen": 4454400.0, "progress": 0.03863129756756037, "epoch": 3.476830108799243, "img/sec/core": 681.2928766795789, "core_hours_NVIDIA A100-SXM4-40GB": 1.812429052895552, "core_hours": 1.812429052895552} {"step": 4400, "global_schedule": 0.4398999810218811, "l2_grads": 1.626086950302124, "l2_params": 211.89874267578125, "l2_updates": 0.4996497333049774, "train/loss": 5.288634300231934, "uptime": 1047.9216286770006, "examples_seen": 4505600.0, "progress": 0.039075335470635776, "epoch": 3.5167936732682, "img/sec/core": 670.6197148405568, "core_hours_NVIDIA A100-SXM4-40GB": 1.8336366343422197, "core_hours": 1.8336366343422197} {"step": 4450, "global_schedule": 0.4448999762535095, "l2_grads": 1.3911274671554565, "l2_params": 212.15538024902344, "l2_updates": 0.5432109236717224, "train/loss": 5.317190170288086, "uptime": 1057.2348700410002, "examples_seen": 4556800.0, "progress": 0.03951937337371118, "epoch": 3.556757237737157, "img/sec/core": 687.1936149683856, "core_hours_NVIDIA A100-SXM4-40GB": 1.8543327262622187, "core_hours": 1.8543327262622187} {"step": 4500, "global_schedule": 0.4499000012874603, "l2_grads": 1.2817364931106567, "l2_params": 212.40267944335938, "l2_updates": 0.482883095741272, "train/loss": 6.201126575469971, "uptime": 1066.450962977, "examples_seen": 4608000.0, "progress": 0.039963411276786584, "epoch": 3.5967208022061135, "img/sec/core": 694.4374415974488, "core_hours_NVIDIA A100-SXM4-40GB": 1.8748129327866627, "core_hours": 1.8748129327866627} {"step": 4550, "global_schedule": 0.45489999651908875, "l2_grads": 1.549308180809021, "l2_params": 212.5906982421875, "l2_updates": 0.48361361026763916, "train/loss": 6.514946460723877, "uptime": 1074.9887732780007, "examples_seen": 4659200.0, "progress": 0.04040744917986199, "epoch": 3.6366843666750706, "img/sec/core": 749.6067228443638, "core_hours_NVIDIA A100-SXM4-40GB": 1.8937858445666644, "core_hours": 1.8937858445666644} {"step": 4600, "global_schedule": 0.45989999175071716, "l2_grads": 1.1199519634246826, "l2_params": 212.84043884277344, "l2_updates": 0.474467009305954, "train/loss": 6.331567287445068, "uptime": 1083.6442624070005, "examples_seen": 4710400.0, "progress": 0.0408514870829374, "epoch": 3.676647931144027, "img/sec/core": 739.4151739567365, "core_hours_NVIDIA A100-SXM4-40GB": 1.9130202648533303, "core_hours": 1.9130202648533303} {"step": 4650, "global_schedule": 0.4648999869823456, "l2_grads": 1.5493829250335693, "l2_params": 213.06785583496094, "l2_updates": 0.5560997724533081, "train/loss": 5.172418594360352, "uptime": 1092.243311264001, "examples_seen": 4761600.0, "progress": 0.041295524986012806, "epoch": 3.7166114956129843, "img/sec/core": 744.2683611210942, "core_hours_NVIDIA A100-SXM4-40GB": 1.9321292623133317, "core_hours": 1.9321292623133317} {"step": 4700, "global_schedule": 0.469899982213974, "l2_grads": 1.5784573554992676, "l2_params": 213.3223419189453, "l2_updates": 0.5283311605453491, "train/loss": 5.172364234924316, "uptime": 1100.9163057040005, "examples_seen": 4812800.0, "progress": 0.041739562889088214, "epoch": 3.756575060081941, "img/sec/core": 737.9227606192725, "core_hours_NVIDIA A100-SXM4-40GB": 1.9514025832911082, "core_hours": 1.9514025832911082} {"step": 4750, "global_schedule": 0.4748999774456024, "l2_grads": 1.3699531555175781, "l2_params": 213.5331268310547, "l2_updates": 0.5389734506607056, "train/loss": 6.256735801696777, "uptime": 1109.5718244130003, "examples_seen": 4864000.0, "progress": 0.04218360079216362, "epoch": 3.7965386245508976, "img/sec/core": 739.412647025467, "core_hours_NVIDIA A100-SXM4-40GB": 1.9706370693111077, "core_hours": 1.9706370693111077} {"step": 4800, "global_schedule": 0.4799000024795532, "l2_grads": 1.2643640041351318, "l2_params": 213.777587890625, "l2_updates": 0.5769025087356567, "train/loss": 5.142219543457031, "uptime": 1118.0578299870012, "examples_seen": 4915200.0, "progress": 0.04262763869523903, "epoch": 3.8365021890198547, "img/sec/core": 754.1828654470878, "core_hours_NVIDIA A100-SXM4-40GB": 1.9894948594755542, "core_hours": 1.9894948594755542} {"step": 4850, "global_schedule": 0.48489999771118164, "l2_grads": 1.840379238128662, "l2_params": 214.04135131835938, "l2_updates": 0.5238959789276123, "train/loss": 5.281200408935547, "uptime": 1126.7973065630013, "examples_seen": 4966400.0, "progress": 0.04307167659831443, "epoch": 3.8764657534888114, "img/sec/core": 732.3093030051035, "core_hours_NVIDIA A100-SXM4-40GB": 2.008915918533332, "core_hours": 2.008915918533332} {"step": 4900, "global_schedule": 0.48989999294281006, "l2_grads": 1.6855247020721436, "l2_params": 214.34902954101562, "l2_updates": 0.5252418518066406, "train/loss": 5.185340881347656, "uptime": 1135.794756966001, "examples_seen": 5017600.0, "progress": 0.043515714501389836, "epoch": 3.916429317957768, "img/sec/core": 711.3126178351918, "core_hours_NVIDIA A100-SXM4-40GB": 2.0289102527622203, "core_hours": 2.0289102527622203} {"step": 4950, "global_schedule": 0.4948999881744385, "l2_grads": 1.5029853582382202, "l2_params": 214.62026977539062, "l2_updates": 0.5852479338645935, "train/loss": 5.114703178405762, "uptime": 1145.395345193001, "examples_seen": 5068800.0, "progress": 0.043959752404465244, "epoch": 3.956392882426725, "img/sec/core": 666.6258200722561, "core_hours_NVIDIA A100-SXM4-40GB": 2.050244893266665, "core_hours": 2.050244893266665} {"step": 5000, "global_schedule": 0.4998999834060669, "l2_grads": 1.46238374710083, "l2_params": 214.92263793945312, "l2_updates": 0.5550622344017029, "train/loss": 5.08908748626709, "uptime": 1154.612689171001, "examples_seen": 5120000.0, "progress": 0.04440379030754065, "epoch": 3.996356446895682, "img/sec/core": 694.3431877204114, "core_hours_NVIDIA A100-SXM4-40GB": 2.0707278798844424, "core_hours": 2.0707278798844424, "val/acc@1": 0.16776, "val/loss": 4.3923121875, "z/secs/eval/val": 2.708416223000313} {"step": 5050, "global_schedule": 0.5048999786376953, "l2_grads": 1.377196192741394, "l2_params": 215.24838256835938, "l2_updates": 0.5644378662109375, "train/loss": 5.305618762969971, "uptime": 1165.989069172001, "examples_seen": 5171200.0, "progress": 0.04484782821061606, "epoch": 4.036320011364639, "img/sec/core": 793.1815760928041, "core_hours_NVIDIA A100-SXM4-40GB": 2.0886584807088853, "core_hours": 2.0886584807088853} {"step": 5100, "global_schedule": 0.5098999738693237, "l2_grads": 2.202956199645996, "l2_params": 215.54722595214844, "l2_updates": 0.5297715067863464, "train/loss": 5.12152624130249, "uptime": 1174.5900026609997, "examples_seen": 5222400.0, "progress": 0.045291866113691466, "epoch": 4.076283575833595, "img/sec/core": 744.1052774313595, "core_hours_NVIDIA A100-SXM4-40GB": 2.107771666239993, "core_hours": 2.107771666239993} {"step": 5150, "global_schedule": 0.5148999691009521, "l2_grads": 1.4886540174484253, "l2_params": 215.8461151123047, "l2_updates": 0.5711134672164917, "train/loss": 5.322055816650391, "uptime": 1183.7494792220004, "examples_seen": 5273600.0, "progress": 0.04573590401676687, "epoch": 4.116247140302552, "img/sec/core": 698.7298845492957, "core_hours_NVIDIA A100-SXM4-40GB": 2.1281260585977724, "core_hours": 2.1281260585977724} {"step": 5200, "global_schedule": 0.5198999643325806, "l2_grads": 1.364076018333435, "l2_params": 216.12213134765625, "l2_updates": 0.5871381759643555, "train/loss": 5.111039161682129, "uptime": 1192.9672264399996, "examples_seen": 5324800.0, "progress": 0.04617994191984228, "epoch": 4.156210704771509, "img/sec/core": 694.3128129509695, "core_hours_NVIDIA A100-SXM4-40GB": 2.1486099413044375, "core_hours": 2.1486099413044375} {"step": 5250, "global_schedule": 0.524899959564209, "l2_grads": 1.5114766359329224, "l2_params": 216.37197875976562, "l2_updates": 0.6042847037315369, "train/loss": 4.9805521965026855, "uptime": 1201.9053466510013, "examples_seen": 5376000.0, "progress": 0.04662397982291768, "epoch": 4.1961742692404655, "img/sec/core": 716.0342274343586, "core_hours_NVIDIA A100-SXM4-40GB": 2.1684724306622187, "core_hours": 2.1684724306622187} {"step": 5300, "global_schedule": 0.5299000144004822, "l2_grads": 1.590165138244629, "l2_params": 216.66885375976562, "l2_updates": 0.5838577747344971, "train/loss": 5.328749179840088, "uptime": 1210.3511995420013, "examples_seen": 5427200.0, "progress": 0.04706801772599309, "epoch": 4.236137833709423, "img/sec/core": 757.7683488685846, "core_hours_NVIDIA A100-SXM4-40GB": 2.1872409926422187, "core_hours": 2.1872409926422187} {"step": 5350, "global_schedule": 0.5349000096321106, "l2_grads": 0.9171110987663269, "l2_params": 216.9355926513672, "l2_updates": 0.5683191418647766, "train/loss": 6.233970642089844, "uptime": 1218.8547530630003, "examples_seen": 5478400.0, "progress": 0.047512055629068496, "epoch": 4.27610139817838, "img/sec/core": 752.6265324485298, "core_hours_NVIDIA A100-SXM4-40GB": 2.206137778244439, "core_hours": 2.206137778244439} {"step": 5400, "global_schedule": 0.539900004863739, "l2_grads": 1.0449106693267822, "l2_params": 217.19583129882812, "l2_updates": 0.5964521765708923, "train/loss": 6.079451084136963, "uptime": 1227.383860115, "examples_seen": 5529600.0, "progress": 0.047956093532143904, "epoch": 4.316064962647336, "img/sec/core": 750.3716345662995, "core_hours_NVIDIA A100-SXM4-40GB": 2.2250913494711053, "core_hours": 2.2250913494711053} {"step": 5450, "global_schedule": 0.5449000000953674, "l2_grads": 1.8729268312454224, "l2_params": 217.5164794921875, "l2_updates": 0.6102457046508789, "train/loss": 5.006141662597656, "uptime": 1236.9136667370003, "examples_seen": 5580800.0, "progress": 0.04840013143521931, "epoch": 4.356028527116293, "img/sec/core": 671.5771110428552, "core_hours_NVIDIA A100-SXM4-40GB": 2.2462686975199944, "core_hours": 2.2462686975199944} {"step": 5500, "global_schedule": 0.5498999953269958, "l2_grads": 1.2493343353271484, "l2_params": 217.8810272216797, "l2_updates": 0.6285028457641602, "train/loss": 6.415246963500977, "uptime": 1245.8648867930006, "examples_seen": 5632000.0, "progress": 0.04884416933829472, "epoch": 4.39599209158525, "img/sec/core": 714.9863325848985, "core_hours_NVIDIA A100-SXM4-40GB": 2.2661602976444395, "core_hours": 2.2661602976444395} {"step": 5550, "global_schedule": 0.5548999905586243, "l2_grads": 1.393245816230774, "l2_params": 218.2358856201172, "l2_updates": 0.6089304089546204, "train/loss": 4.944112777709961, "uptime": 1254.8648711320002, "examples_seen": 5683200.0, "progress": 0.049288207241370126, "epoch": 4.435955656054206, "img/sec/core": 711.1123485256386, "core_hours_NVIDIA A100-SXM4-40GB": 2.286160262842216, "core_hours": 2.286160262842216} {"step": 5600, "global_schedule": 0.5598999857902527, "l2_grads": 1.3300431966781616, "l2_params": 218.56204223632812, "l2_updates": 0.6286945939064026, "train/loss": 5.050079345703125, "uptime": 1264.1352608409998, "examples_seen": 5734400.0, "progress": 0.04973224514444553, "epoch": 4.4759192205231635, "img/sec/core": 690.3701139755715, "core_hours_NVIDIA A100-SXM4-40GB": 2.3067611288622154, "core_hours": 2.3067611288622154} {"step": 5650, "global_schedule": 0.5648999810218811, "l2_grads": 1.0970935821533203, "l2_params": 218.89234924316406, "l2_updates": 0.6190263032913208, "train/loss": 6.2973833084106445, "uptime": 1273.509417917001, "examples_seen": 5785600.0, "progress": 0.050176283047520934, "epoch": 4.515882784992121, "img/sec/core": 682.728052038369, "core_hours_NVIDIA A100-SXM4-40GB": 2.327592589031107, "core_hours": 2.327592589031107} {"step": 5700, "global_schedule": 0.5698999762535095, "l2_grads": 1.392694354057312, "l2_params": 219.27268981933594, "l2_updates": 0.6357149481773376, "train/loss": 5.0599589347839355, "uptime": 1282.6601337909997, "examples_seen": 5836800.0, "progress": 0.05062032095059634, "epoch": 4.555846349461078, "img/sec/core": 699.3988326296169, "core_hours_NVIDIA A100-SXM4-40GB": 2.3479275131955486, "core_hours": 2.3479275131955486} {"step": 5750, "global_schedule": 0.5748999714851379, "l2_grads": 1.7924233675003052, "l2_params": 219.59375, "l2_updates": 0.6128847002983093, "train/loss": 4.869146823883057, "uptime": 1291.5519044310004, "examples_seen": 5888000.0, "progress": 0.05106435885367175, "epoch": 4.595809913930034, "img/sec/core": 719.7666538100791, "core_hours_NVIDIA A100-SXM4-40GB": 2.3676870035066613, "core_hours": 2.3676870035066613} {"step": 5800, "global_schedule": 0.5798999667167664, "l2_grads": 1.207354187965393, "l2_params": 219.93780517578125, "l2_updates": 0.6523821949958801, "train/loss": 5.739550590515137, "uptime": 1300.261006136001, "examples_seen": 5939200.0, "progress": 0.051508396756747156, "epoch": 4.635773478398991, "img/sec/core": 734.8633896794668, "core_hours_NVIDIA A100-SXM4-40GB": 2.387040562851107, "core_hours": 2.387040562851107} {"step": 5850, "global_schedule": 0.5848999619483948, "l2_grads": 1.477917194366455, "l2_params": 220.27157592773438, "l2_updates": 0.6447721719741821, "train/loss": 4.8292012214660645, "uptime": 1309.1931493520005, "examples_seen": 5990400.0, "progress": 0.05195243465982256, "epoch": 4.675737042867948, "img/sec/core": 716.5133658555902, "core_hours_NVIDIA A100-SXM4-40GB": 2.4068897699977727, "core_hours": 2.4068897699977727} {"step": 5900, "global_schedule": 0.5898999571800232, "l2_grads": 1.3821122646331787, "l2_params": 220.54931640625, "l2_updates": 0.6293660998344421, "train/loss": 5.261200904846191, "uptime": 1317.5552654900002, "examples_seen": 6041600.0, "progress": 0.05239647256289797, "epoch": 4.715700607336904, "img/sec/core": 765.3565071784508, "core_hours_NVIDIA A100-SXM4-40GB": 2.4254722503044386, "core_hours": 2.4254722503044386} {"step": 5950, "global_schedule": 0.5949000120162964, "l2_grads": 1.4554173946380615, "l2_params": 220.89645385742188, "l2_updates": 0.6638365387916565, "train/loss": 4.799397945404053, "uptime": 1326.0802183790001, "examples_seen": 6092800.0, "progress": 0.05284051046597338, "epoch": 4.755664171805861, "img/sec/core": 750.7372865670825, "core_hours_NVIDIA A100-SXM4-40GB": 2.444416590057772, "core_hours": 2.444416590057772} {"step": 6000, "global_schedule": 0.5999000072479248, "l2_grads": 0.9970159530639648, "l2_params": 221.2620849609375, "l2_updates": 0.6798563003540039, "train/loss": 6.408370494842529, "uptime": 1334.7715057260011, "examples_seen": 6144000.0, "progress": 0.05328454836904878, "epoch": 4.7956277362748185, "img/sec/core": 736.3696244847304, "core_hours_NVIDIA A100-SXM4-40GB": 2.4637305619399963, "core_hours": 2.4637305619399963} {"step": 6050, "global_schedule": 0.6049000024795532, "l2_grads": 1.4427794218063354, "l2_params": 221.6134490966797, "l2_updates": 0.6424261331558228, "train/loss": 4.927013397216797, "uptime": 1344.0722502360004, "examples_seen": 6195200.0, "progress": 0.053728586272124186, "epoch": 4.835591300743775, "img/sec/core": 741.5032505037432, "core_hours_NVIDIA A100-SXM4-40GB": 2.4829108180111064, "core_hours": 2.4829108180111064} {"step": 6100, "global_schedule": 0.6098999977111816, "l2_grads": 1.2525001764297485, "l2_params": 221.90753173828125, "l2_updates": 0.6302354335784912, "train/loss": 5.144436359405518, "uptime": 1352.968055112, "examples_seen": 6246400.0, "progress": 0.054172624175199593, "epoch": 4.875554865212732, "img/sec/core": 719.4402405640498, "core_hours_NVIDIA A100-SXM4-40GB": 2.5026792732911054, "core_hours": 2.5026792732911054} {"step": 6150, "global_schedule": 0.6148999929428101, "l2_grads": 1.4198355674743652, "l2_params": 222.3267364501953, "l2_updates": 0.730038583278656, "train/loss": 4.7280683517456055, "uptime": 1361.537673353001, "examples_seen": 6297600.0, "progress": 0.054616662078275, "epoch": 4.915518429681689, "img/sec/core": 746.8243998757603, "core_hours_NVIDIA A100-SXM4-40GB": 2.5217228693822187, "core_hours": 2.5217228693822187} {"step": 6200, "global_schedule": 0.6198999881744385, "l2_grads": 1.4914637804031372, "l2_params": 222.71803283691406, "l2_updates": 0.6906023621559143, "train/loss": 4.650601387023926, "uptime": 1370.7198705560004, "examples_seen": 6348800.0, "progress": 0.05506069998135041, "epoch": 4.955481994150645, "img/sec/core": 697.0009310962611, "core_hours_NVIDIA A100-SXM4-40GB": 2.5421277520555505, "core_hours": 2.5421277520555505} {"step": 6250, "global_schedule": 0.6248999834060669, "l2_grads": 1.3065630197525024, "l2_params": 223.1219940185547, "l2_updates": 0.7074288725852966, "train/loss": 4.843931674957275, "uptime": 1379.565189764, "examples_seen": 6400000.0, "progress": 0.055504737884425816, "epoch": 4.995445558619602, "img/sec/core": 723.546527773909, "core_hours_NVIDIA A100-SXM4-40GB": 2.5617840169622164, "core_hours": 2.5617840169622164} {"step": 6300, "global_schedule": 0.6298999786376953, "l2_grads": 1.998672366142273, "l2_params": 223.4993438720703, "l2_updates": 0.6122795343399048, "train/loss": 5.31709623336792, "uptime": 1388.7600631740006, "examples_seen": 6451200.0, "progress": 0.05594877578750122, "epoch": 5.035409123088559, "img/sec/core": 696.0400338996723, "core_hours_NVIDIA A100-SXM4-40GB": 2.58221706898444, "core_hours": 2.58221706898444} {"step": 6350, "global_schedule": 0.6348999738693237, "l2_grads": 1.697557806968689, "l2_params": 223.88465881347656, "l2_updates": 0.671107828617096, "train/loss": 4.671871662139893, "uptime": 1397.7736774370005, "examples_seen": 6502400.0, "progress": 0.05639281369057663, "epoch": 5.075372687557516, "img/sec/core": 710.0370409982414, "core_hours_NVIDIA A100-SXM4-40GB": 2.6022473229022176, "core_hours": 2.6022473229022176} {"step": 6400, "global_schedule": 0.6398999691009521, "l2_grads": 1.4407652616500854, "l2_params": 224.25718688964844, "l2_updates": 0.6578227877616882, "train/loss": 4.842389106750488, "uptime": 1407.0357266580013, "examples_seen": 6553600.0, "progress": 0.05683685159365203, "epoch": 5.115336252026473, "img/sec/core": 690.9917932079904, "core_hours_NVIDIA A100-SXM4-40GB": 2.6228296545044416, "core_hours": 2.6228296545044416} {"step": 6450, "global_schedule": 0.6448999643325806, "l2_grads": 1.5028265714645386, "l2_params": 224.6506805419922, "l2_updates": 0.7011168599128723, "train/loss": 4.801886081695557, "uptime": 1415.4610223520012, "examples_seen": 6604800.0, "progress": 0.05728088949672744, "epoch": 5.15529981649543, "img/sec/core": 759.6172564670635, "core_hours_NVIDIA A100-SXM4-40GB": 2.641552533824441, "core_hours": 2.641552533824441} {"step": 6500, "global_schedule": 0.649899959564209, "l2_grads": 1.6830335855484009, "l2_params": 225.12254333496094, "l2_updates": 0.7025181651115417, "train/loss": 4.7799553871154785, "uptime": 1423.9183373150008, "examples_seen": 6656000.0, "progress": 0.057724927399802846, "epoch": 5.195263380964386, "img/sec/core": 756.7413568017439, "core_hours_NVIDIA A100-SXM4-40GB": 2.6603465670755515, "core_hours": 2.6603465670755515} {"step": 6550, "global_schedule": 0.6548999547958374, "l2_grads": 1.355905532836914, "l2_params": 225.53839111328125, "l2_updates": 0.7247837781906128, "train/loss": 4.567618370056152, "uptime": 1432.5742750000009, "examples_seen": 6707200.0, "progress": 0.05816896530287825, "epoch": 5.235226945433343, "img/sec/core": 739.3768570088754, "core_hours_NVIDIA A100-SXM4-40GB": 2.6795819841533297, "core_hours": 2.6795819841533297} {"step": 6600, "global_schedule": 0.6599000096321106, "l2_grads": 1.2980130910873413, "l2_params": 225.91259765625, "l2_updates": 0.7263311147689819, "train/loss": 4.918176651000977, "uptime": 1441.6116796810002, "examples_seen": 6758400.0, "progress": 0.05861300320595366, "epoch": 5.2751905099023, "img/sec/core": 708.1679116854947, "core_hours_NVIDIA A100-SXM4-40GB": 2.699665105666661, "core_hours": 2.699665105666661} {"step": 6650, "global_schedule": 0.664900004863739, "l2_grads": 1.2947412729263306, "l2_params": 226.27976989746094, "l2_updates": 0.6496223211288452, "train/loss": 5.370218753814697, "uptime": 1450.2677193590007, "examples_seen": 6809600.0, "progress": 0.05905704110902907, "epoch": 5.315154074371256, "img/sec/core": 739.368145026612, "core_hours_NVIDIA A100-SXM4-40GB": 2.7189007493955515, "core_hours": 2.7189007493955515} {"step": 6700, "global_schedule": 0.6699000000953674, "l2_grads": 1.384953260421753, "l2_params": 226.7232666015625, "l2_updates": 0.7700015902519226, "train/loss": 4.716605186462402, "uptime": 1458.951321335, "examples_seen": 6860800.0, "progress": 0.059501079012104476, "epoch": 5.3551176388402135, "img/sec/core": 737.0213441022456, "core_hours_NVIDIA A100-SXM4-40GB": 2.73819764267555, "core_hours": 2.73819764267555} {"step": 6750, "global_schedule": 0.6748999953269958, "l2_grads": 1.372406005859375, "l2_params": 227.20547485351562, "l2_updates": 0.783062756061554, "train/loss": 4.446175575256348, "uptime": 1468.0001045110002, "examples_seen": 6912000.0, "progress": 0.05994511691517988, "epoch": 5.395081203309171, "img/sec/core": 707.277417915655, "core_hours_NVIDIA A100-SXM4-40GB": 2.7583060497333283, "core_hours": 2.7583060497333283} {"step": 6800, "global_schedule": 0.6798999905586243, "l2_grads": 1.407589316368103, "l2_params": 227.61598205566406, "l2_updates": 0.7061936259269714, "train/loss": 4.923236846923828, "uptime": 1476.627495367, "examples_seen": 6963200.0, "progress": 0.06038915481825528, "epoch": 5.435044767778128, "img/sec/core": 741.8233515581699, "core_hours_NVIDIA A100-SXM4-40GB": 2.7774780294133277, "core_hours": 2.7774780294133277} {"step": 6850, "global_schedule": 0.6848999857902527, "l2_grads": 1.3563109636306763, "l2_params": 228.03582763671875, "l2_updates": 0.7696581482887268, "train/loss": 4.753300666809082, "uptime": 1485.3218840320005, "examples_seen": 7014400.0, "progress": 0.06083319272133069, "epoch": 5.475008332247084, "img/sec/core": 736.1069589358607, "core_hours_NVIDIA A100-SXM4-40GB": 2.7967988931133285, "core_hours": 2.7967988931133285} {"step": 6900, "global_schedule": 0.6898999810218811, "l2_grads": 1.3611946105957031, "l2_params": 228.49359130859375, "l2_updates": 0.7675113677978516, "train/loss": 5.719525337219238, "uptime": 1493.8093575439998, "examples_seen": 7065600.0, "progress": 0.0612772306244061, "epoch": 5.514971896716041, "img/sec/core": 754.0524269032383, "core_hours_NVIDIA A100-SXM4-40GB": 2.8156599453622158, "core_hours": 2.8156599453622158} {"step": 6950, "global_schedule": 0.6948999762535095, "l2_grads": 1.3623631000518799, "l2_params": 228.9696807861328, "l2_updates": 0.7711731195449829, "train/loss": 5.652544975280762, "uptime": 1502.2732973439997, "examples_seen": 7116800.0, "progress": 0.061721268527481506, "epoch": 5.554935461184998, "img/sec/core": 756.1490453890101, "core_hours_NVIDIA A100-SXM4-40GB": 2.834468700473327, "core_hours": 2.834468700473327} {"step": 7000, "global_schedule": 0.6998999714851379, "l2_grads": 1.394045114517212, "l2_params": 229.37840270996094, "l2_updates": 0.780290424823761, "train/loss": 4.59821081161499, "uptime": 1510.8557621970012, "examples_seen": 7168000.0, "progress": 0.06216530643055691, "epoch": 5.594899025653954, "img/sec/core": 745.7065201684751, "core_hours_NVIDIA A100-SXM4-40GB": 2.8535408445911083, "core_hours": 2.8535408445911083} {"step": 7050, "global_schedule": 0.7048999667167664, "l2_grads": 1.3746843338012695, "l2_params": 229.86302185058594, "l2_updates": 0.7366275787353516, "train/loss": 4.611019134521484, "uptime": 1520.723681597001, "examples_seen": 7219200.0, "progress": 0.06260934433363231, "epoch": 5.6348625901229115, "img/sec/core": 733.4956802856827, "core_hours_NVIDIA A100-SXM4-40GB": 2.8729304914622156, "core_hours": 2.8729304914622156} {"step": 7100, "global_schedule": 0.7098999619483948, "l2_grads": 1.4445910453796387, "l2_params": 230.24810791015625, "l2_updates": 0.7796706557273865, "train/loss": 4.610995292663574, "uptime": 1529.8623264340004, "examples_seen": 7270400.0, "progress": 0.06305338223670773, "epoch": 5.674826154591869, "img/sec/core": 700.3226533203751, "core_hours_NVIDIA A100-SXM4-40GB": 2.8932385910999923, "core_hours": 2.8932385910999923} {"step": 7150, "global_schedule": 0.7148999571800232, "l2_grads": 0.9967826008796692, "l2_params": 230.71632385253906, "l2_updates": 0.7356266379356384, "train/loss": 5.901478290557861, "uptime": 1538.338068223, "examples_seen": 7321600.0, "progress": 0.06349742013978313, "epoch": 5.714789719060825, "img/sec/core": 755.0961507943023, "core_hours_NVIDIA A100-SXM4-40GB": 2.9120735728533247, "core_hours": 2.9120735728533247} {"step": 7200, "global_schedule": 0.7198999524116516, "l2_grads": 1.2914063930511475, "l2_params": 231.1688690185547, "l2_updates": 0.7176058888435364, "train/loss": 4.536174774169922, "uptime": 1547.267207195, "examples_seen": 7372800.0, "progress": 0.06394145804285854, "epoch": 5.754753283529782, "img/sec/core": 716.7544396015136, "core_hours_NVIDIA A100-SXM4-40GB": 2.9319161039022137, "core_hours": 2.9319161039022137} {"step": 7250, "global_schedule": 0.7249000072479248, "l2_grads": 1.3580870628356934, "l2_params": 231.61264038085938, "l2_updates": 0.7655962705612183, "train/loss": 4.917579174041748, "uptime": 1556.7120164290009, "examples_seen": 7424000.0, "progress": 0.06438549594593394, "epoch": 5.794716847998739, "img/sec/core": 677.6208858682246, "core_hours_NVIDIA A100-SXM4-40GB": 2.9529045688666598, "core_hours": 2.9529045688666598} {"step": 7300, "global_schedule": 0.7299000024795532, "l2_grads": 1.1633144617080688, "l2_params": 232.06910705566406, "l2_updates": 0.7933735847473145, "train/loss": 6.265371322631836, "uptime": 1566.1841444029997, "examples_seen": 7475200.0, "progress": 0.06482953384900936, "epoch": 5.834680412467695, "img/sec/core": 675.6665469014084, "core_hours_NVIDIA A100-SXM4-40GB": 2.973953742142213, "core_hours": 2.973953742142213} {"step": 7350, "global_schedule": 0.7348999977111816, "l2_grads": 0.9706376194953918, "l2_params": 232.44735717773438, "l2_updates": 0.722855269908905, "train/loss": 6.1451215744018555, "uptime": 1574.630689566, "examples_seen": 7526400.0, "progress": 0.06527357175208476, "epoch": 5.874643976936652, "img/sec/core": 757.706242788457, "core_hours_NVIDIA A100-SXM4-40GB": 2.9927238425044362, "core_hours": 2.9927238425044362} {"step": 7400, "global_schedule": 0.7398999929428101, "l2_grads": 1.099764108657837, "l2_params": 232.88967895507812, "l2_updates": 0.7972134351730347, "train/loss": 5.578461647033691, "uptime": 1583.6192040200003, "examples_seen": 7577600.0, "progress": 0.06571760965516016, "epoch": 5.914607541405609, "img/sec/core": 712.0197706476058, "core_hours_NVIDIA A100-SXM4-40GB": 3.012698319068881, "core_hours": 3.012698319068881} {"step": 7450, "global_schedule": 0.7448999881744385, "l2_grads": 1.5119600296020508, "l2_params": 233.43325805664062, "l2_updates": 0.8371706008911133, "train/loss": 4.486956596374512, "uptime": 1592.8299525990005, "examples_seen": 7628800.0, "progress": 0.06616164755823557, "epoch": 5.954571105874566, "img/sec/core": 694.8403753622699, "core_hours_NVIDIA A100-SXM4-40GB": 3.033166649244437, "core_hours": 3.033166649244437} {"step": 7500, "global_schedule": 0.7498999834060669, "l2_grads": 1.4754236936569214, "l2_params": 233.9635467529297, "l2_updates": 0.8387309908866882, "train/loss": 4.578578948974609, "uptime": 1601.9252501520004, "examples_seen": 7680000.0, "progress": 0.06660568546131097, "epoch": 5.994534670343523, "img/sec/core": 703.6603214689862, "core_hours_NVIDIA A100-SXM4-40GB": 3.0533784215844366, "core_hours": 3.0533784215844366, "val/acc@1": 0.26632, "val/loss": 3.5986194287109377, "z/secs/eval/val": 7.61311389399998} {"step": 7550, "global_schedule": 0.7548999786376953, "l2_grads": 1.3960282802581787, "l2_params": 234.5211181640625, "l2_updates": 0.824013352394104, "train/loss": 4.55387544631958, "uptime": 1619.4228473700005, "examples_seen": 7731200.0, "progress": 0.06704972336438639, "epoch": 6.03449823481248, "img/sec/core": 647.5439806205242, "core_hours_NVIDIA A100-SXM4-40GB": 3.0753417517177715, "core_hours": 3.0753417517177715} {"step": 7600, "global_schedule": 0.7598999738693237, "l2_grads": 1.7837345600128174, "l2_params": 235.0823516845703, "l2_updates": 0.7883622050285339, "train/loss": 4.543320178985596, "uptime": 1627.9959333450006, "examples_seen": 7782400.0, "progress": 0.06749376126746179, "epoch": 6.074461799281436, "img/sec/core": 746.5223163121137, "core_hours_NVIDIA A100-SXM4-40GB": 3.0943930538844384, "core_hours": 3.0943930538844384} {"step": 7650, "global_schedule": 0.7648999691009521, "l2_grads": 1.5726687908172607, "l2_params": 235.56991577148438, "l2_updates": 0.7842307686805725, "train/loss": 4.509238243103027, "uptime": 1637.118668514, "examples_seen": 7833600.0, "progress": 0.0679377991705372, "epoch": 6.114425363750393, "img/sec/core": 701.5439866925235, "core_hours_NVIDIA A100-SXM4-40GB": 3.1146657987044373, "core_hours": 3.1146657987044373} {"step": 7700, "global_schedule": 0.7698999643325806, "l2_grads": 1.553638219833374, "l2_params": 236.04640197753906, "l2_updates": 0.7919045090675354, "train/loss": 5.0907182693481445, "uptime": 1646.4514912579998, "examples_seen": 7884800.0, "progress": 0.0683818370736126, "epoch": 6.15438892821935, "img/sec/core": 685.7518004523023, "core_hours_NVIDIA A100-SXM4-40GB": 3.1354054048022144, "core_hours": 3.1354054048022144} {"step": 7750, "global_schedule": 0.774899959564209, "l2_grads": 0.888221800327301, "l2_params": 236.4922637939453, "l2_updates": 0.815305233001709, "train/loss": 6.208433628082275, "uptime": 1655.7839539640008, "examples_seen": 7936000.0, "progress": 0.068825874976688, "epoch": 6.1943524926883065, "img/sec/core": 685.7782561386105, "core_hours_NVIDIA A100-SXM4-40GB": 3.15614421081555, "core_hours": 3.15614421081555} {"step": 7800, "global_schedule": 0.7798999547958374, "l2_grads": 1.2751126289367676, "l2_params": 236.98788452148438, "l2_updates": 0.8355690836906433, "train/loss": 4.318458080291748, "uptime": 1664.6351549200008, "examples_seen": 7987200.0, "progress": 0.06926991287976342, "epoch": 6.234316057157264, "img/sec/core": 723.0657208908625, "core_hours_NVIDIA A100-SXM4-40GB": 3.1758135462733277, "core_hours": 3.1758135462733277} {"step": 7850, "global_schedule": 0.7849000096321106, "l2_grads": 1.3189517259597778, "l2_params": 237.5470733642578, "l2_updates": 0.8718035817146301, "train/loss": 4.382920265197754, "uptime": 1673.12592434, "examples_seen": 8038400.0, "progress": 0.06971395078283882, "epoch": 6.274279621626221, "img/sec/core": 753.7597222844623, "core_hours_NVIDIA A100-SXM4-40GB": 3.1946819227622147, "core_hours": 3.1946819227622147} {"step": 7900, "global_schedule": 0.789900004863739, "l2_grads": 1.5082616806030273, "l2_params": 238.01954650878906, "l2_updates": 0.8072781562805176, "train/loss": 4.552950382232666, "uptime": 1681.5580473850005, "examples_seen": 8089600.0, "progress": 0.07015798868591423, "epoch": 6.314243186095177, "img/sec/core": 759.0022068990853, "core_hours_NVIDIA A100-SXM4-40GB": 3.2134199739733273, "core_hours": 3.2134199739733273} {"step": 7950, "global_schedule": 0.7949000000953674, "l2_grads": 0.7897986769676208, "l2_params": 238.537841796875, "l2_updates": 0.7352026104927063, "train/loss": 6.1368513107299805, "uptime": 1690.0254545059997, "examples_seen": 8140800.0, "progress": 0.07060202658898963, "epoch": 6.354206750564134, "img/sec/core": 755.8394096969691, "core_hours_NVIDIA A100-SXM4-40GB": 3.2322364342422145, "core_hours": 3.2322364342422145} {"step": 8000, "global_schedule": 0.7998999953269958, "l2_grads": 1.2817658185958862, "l2_params": 239.08203125, "l2_updates": 0.811672568321228, "train/loss": 4.97573709487915, "uptime": 1698.416439863, "examples_seen": 8192000.0, "progress": 0.07104606449206505, "epoch": 6.394170315033091, "img/sec/core": 762.7232950252612, "core_hours_NVIDIA A100-SXM4-40GB": 3.2508830683688816, "core_hours": 3.2508830683688816} {"step": 8050, "global_schedule": 0.8048999905586243, "l2_grads": 1.2649024724960327, "l2_params": 239.62623596191406, "l2_updates": 0.7801791429519653, "train/loss": 4.693783760070801, "uptime": 1708.0663188010003, "examples_seen": 8243200.0, "progress": 0.07149010239514045, "epoch": 6.434133879502048, "img/sec/core": 738.5356398325913, "core_hours_NVIDIA A100-SXM4-40GB": 3.2701403952399937, "core_hours": 3.2701403952399937} {"step": 8100, "global_schedule": 0.8098999857902527, "l2_grads": 1.5173996686935425, "l2_params": 240.1874237060547, "l2_updates": 0.8693198561668396, "train/loss": 4.446563243865967, "uptime": 1717.1755733380014, "examples_seen": 8294400.0, "progress": 0.07193414029821586, "epoch": 6.474097443971004, "img/sec/core": 702.582189794311, "core_hours_NVIDIA A100-SXM4-40GB": 3.2903831830999963, "core_hours": 3.2903831830999963} {"step": 8150, "global_schedule": 0.8148999810218811, "l2_grads": 1.1673698425292969, "l2_params": 240.75546264648438, "l2_updates": 0.881807267665863, "train/loss": 5.1699934005737305, "uptime": 1725.8388147370006, "examples_seen": 8345600.0, "progress": 0.07237817820129126, "epoch": 6.5140610084399615, "img/sec/core": 738.753510982549, "core_hours_NVIDIA A100-SXM4-40GB": 3.309634830653328, "core_hours": 3.309634830653328} {"step": 8200, "global_schedule": 0.8198999762535095, "l2_grads": 1.4129856824874878, "l2_params": 241.30833435058594, "l2_updates": 0.8221450448036194, "train/loss": 4.394895553588867, "uptime": 1734.3514449289996, "examples_seen": 8396800.0, "progress": 0.07282221610436666, "epoch": 6.554024572908919, "img/sec/core": 751.8240374185767, "core_hours_NVIDIA A100-SXM4-40GB": 3.3285517866355483, "core_hours": 3.3285517866355483} {"step": 8250, "global_schedule": 0.8248999714851379, "l2_grads": 1.1863548755645752, "l2_params": 241.89454650878906, "l2_updates": 0.9083573222160339, "train/loss": 4.610891342163086, "uptime": 1743.7496676980008, "examples_seen": 8448000.0, "progress": 0.07326625400744208, "epoch": 6.593988137377875, "img/sec/core": 680.9798147272633, "core_hours_NVIDIA A100-SXM4-40GB": 3.3494367261222178, "core_hours": 3.3494367261222178} {"step": 8300, "global_schedule": 0.8298999667167664, "l2_grads": 1.3117239475250244, "l2_params": 242.50747680664062, "l2_updates": 0.9179877638816833, "train/loss": 4.349735260009766, "uptime": 1752.8017529150002, "examples_seen": 8499200.0, "progress": 0.07371029191051748, "epoch": 6.633951701846832, "img/sec/core": 707.019415590691, "core_hours_NVIDIA A100-SXM4-40GB": 3.3695524710488827, "core_hours": 3.3695524710488827} {"step": 8350, "global_schedule": 0.8348999619483948, "l2_grads": 1.2522531747817993, "l2_params": 243.08453369140625, "l2_updates": 0.8196004629135132, "train/loss": 5.9647088050842285, "uptime": 1761.7788742539997, "examples_seen": 8550400.0, "progress": 0.07415432981359289, "epoch": 6.673915266315789, "img/sec/core": 712.923414791816, "core_hours_NVIDIA A100-SXM4-40GB": 3.3895016295799922, "core_hours": 3.3895016295799922} {"step": 8400, "global_schedule": 0.8398999571800232, "l2_grads": 1.4468697309494019, "l2_params": 243.55807495117188, "l2_updates": 0.7806347608566284, "train/loss": 4.418980598449707, "uptime": 1770.9789338730006, "examples_seen": 8601600.0, "progress": 0.07459836771666829, "epoch": 6.713878830784745, "img/sec/core": 695.6476658892537, "core_hours_NVIDIA A100-SXM4-40GB": 3.409946206511106, "core_hours": 3.409946206511106} {"step": 8450, "global_schedule": 0.8448999524116516, "l2_grads": 0.9128408432006836, "l2_params": 244.17893981933594, "l2_updates": 0.8732742667198181, "train/loss": 5.9602370262146, "uptime": 1780.105503097, "examples_seen": 8652800.0, "progress": 0.07504240561974371, "epoch": 6.753842395253702, "img/sec/core": 701.2492693498002, "core_hours_NVIDIA A100-SXM4-40GB": 3.430227471453327, "core_hours": 3.430227471453327} {"step": 8500, "global_schedule": 0.8499000072479248, "l2_grads": 1.28645658493042, "l2_params": 244.7320556640625, "l2_updates": 0.8581956624984741, "train/loss": 4.28877067565918, "uptime": 1789.300674131, "examples_seen": 8704000.0, "progress": 0.07548644352281911, "epoch": 6.793805959722659, "img/sec/core": 696.017504876793, "core_hours_NVIDIA A100-SXM4-40GB": 3.4506611848622155, "core_hours": 3.4506611848622155} {"step": 8550, "global_schedule": 0.8549000024795532, "l2_grads": 1.258067011833191, "l2_params": 245.25521850585938, "l2_updates": 0.9392905235290527, "train/loss": 4.279814720153809, "uptime": 1798.3295197480002, "examples_seen": 8755200.0, "progress": 0.07593048142589451, "epoch": 6.833769524191616, "img/sec/core": 708.8392327751901, "core_hours_NVIDIA A100-SXM4-40GB": 3.4707252862333267, "core_hours": 3.4707252862333267} {"step": 8600, "global_schedule": 0.8598999977111816, "l2_grads": 0.8337072134017944, "l2_params": 245.70089721679688, "l2_updates": 0.8098618388175964, "train/loss": 6.000248908996582, "uptime": 1807.3368004130007, "examples_seen": 8806400.0, "progress": 0.07637451932896992, "epoch": 6.873733088660573, "img/sec/core": 710.5363136810437, "core_hours_NVIDIA A100-SXM4-40GB": 3.4907414654888833, "core_hours": 3.4907414654888833} {"step": 8650, "global_schedule": 0.8648999929428101, "l2_grads": 1.0826945304870605, "l2_params": 246.2244873046875, "l2_updates": 0.9263608455657959, "train/loss": 5.262657165527344, "uptime": 1816.4425605060005, "examples_seen": 8857600.0, "progress": 0.07681855723204532, "epoch": 6.91369665312953, "img/sec/core": 702.8518140863465, "core_hours_NVIDIA A100-SXM4-40GB": 3.5109764879177723, "core_hours": 3.5109764879177723} {"step": 8700, "global_schedule": 0.8698999881744385, "l2_grads": 1.5291556119918823, "l2_params": 246.84115600585938, "l2_updates": 0.9387900829315186, "train/loss": 4.238393783569336, "uptime": 1825.6075998350007, "examples_seen": 8908800.0, "progress": 0.07726259513512074, "epoch": 6.953660217598486, "img/sec/core": 698.3057868337821, "core_hours_NVIDIA A100-SXM4-40GB": 3.5313432419822166, "core_hours": 3.5313432419822166} {"step": 8750, "global_schedule": 0.8748999834060669, "l2_grads": 1.1170363426208496, "l2_params": 247.37628173828125, "l2_updates": 0.9004725217819214, "train/loss": 5.965426445007324, "uptime": 1834.9507362690001, "examples_seen": 8960000.0, "progress": 0.07770663303819614, "epoch": 6.993623782067443, "img/sec/core": 684.9948135949878, "core_hours_NVIDIA A100-SXM4-40GB": 3.5521057673911045, "core_hours": 3.5521057673911045} {"step": 8800, "global_schedule": 0.8798999786376953, "l2_grads": 1.2048345804214478, "l2_params": 248.02325439453125, "l2_updates": 0.905514121055603, "train/loss": 5.035120964050293, "uptime": 1844.6079766190014, "examples_seen": 9011200.0, "progress": 0.07815067094127155, "epoch": 7.0335873465364, "img/sec/core": 662.7152031065621, "core_hours_NVIDIA A100-SXM4-40GB": 3.5735663015022188, "core_hours": 3.5735663015022188} {"step": 8850, "global_schedule": 0.8848999738693237, "l2_grads": 1.462278127670288, "l2_params": 248.71005249023438, "l2_updates": 0.9298979043960571, "train/loss": 4.350156307220459, "uptime": 1853.023712573, "examples_seen": 9062400.0, "progress": 0.07859470884434695, "epoch": 7.0735509110053565, "img/sec/core": 760.4801332864002, "core_hours_NVIDIA A100-SXM4-40GB": 3.592267936955549, "core_hours": 3.592267936955549} {"step": 8900, "global_schedule": 0.8898999691009521, "l2_grads": 1.461405634880066, "l2_params": 249.28660583496094, "l2_updates": 0.933118999004364, "train/loss": 4.198504447937012, "uptime": 1861.4662666920012, "examples_seen": 9113600.0, "progress": 0.07903874674742235, "epoch": 7.113514475474314, "img/sec/core": 758.06443284691, "core_hours_NVIDIA A100-SXM4-40GB": 3.611029168331107, "core_hours": 3.611029168331107} {"step": 8950, "global_schedule": 0.8948999643325806, "l2_grads": 0.9200846552848816, "l2_params": 249.90103149414062, "l2_updates": 0.9290006756782532, "train/loss": 5.607682228088379, "uptime": 1870.0413828649998, "examples_seen": 9164800.0, "progress": 0.07948278465049777, "epoch": 7.153478039943271, "img/sec/core": 746.3455737372249, "core_hours_NVIDIA A100-SXM4-40GB": 3.630084982048882, "core_hours": 3.630084982048882} {"step": 9000, "global_schedule": 0.899899959564209, "l2_grads": 1.2013745307922363, "l2_params": 250.56451416015625, "l2_updates": 0.9091696739196777, "train/loss": 4.418205738067627, "uptime": 1879.087429823001, "examples_seen": 9216000.0, "progress": 0.07992682255357317, "epoch": 7.193441604412227, "img/sec/core": 707.4913528211614, "core_hours_NVIDIA A100-SXM4-40GB": 3.6501873086222174, "core_hours": 3.6501873086222174} {"step": 9050, "global_schedule": 0.9048999547958374, "l2_grads": 1.2147845029830933, "l2_params": 251.1834259033203, "l2_updates": 0.9938790798187256, "train/loss": 4.308413028717041, "uptime": 1887.8958918509998, "examples_seen": 9267200.0, "progress": 0.08037086045664858, "epoch": 7.233405168881184, "img/sec/core": 788.4318774624861, "core_hours_NVIDIA A100-SXM4-40GB": 3.668225927593327, "core_hours": 3.668225927593327} {"step": 9100, "global_schedule": 0.9098999500274658, "l2_grads": 1.4282751083374023, "l2_params": 251.7763671875, "l2_updates": 0.9527028203010559, "train/loss": 4.204559326171875, "uptime": 1897.03699959, "examples_seen": 9318400.0, "progress": 0.08081489835972398, "epoch": 7.273368733350141, "img/sec/core": 700.1339643656722, "core_hours_NVIDIA A100-SXM4-40GB": 3.6885395003466614, "core_hours": 3.6885395003466614} {"step": 9150, "global_schedule": 0.914900004863739, "l2_grads": 0.9485794305801392, "l2_params": 252.37985229492188, "l2_updates": 0.9203898310661316, "train/loss": 5.538987159729004, "uptime": 1906.1959759970014, "examples_seen": 9369600.0, "progress": 0.0812589362627994, "epoch": 7.313332297819097, "img/sec/core": 698.7680408378061, "core_hours_NVIDIA A100-SXM4-40GB": 3.7088927812511083, "core_hours": 3.7088927812511083} {"step": 9200, "global_schedule": 0.9199000000953674, "l2_grads": 1.2135682106018066, "l2_params": 253.07870483398438, "l2_updates": 0.9472148418426514, "train/loss": 4.258012294769287, "uptime": 1915.3687475200004, "examples_seen": 9420800.0, "progress": 0.0817029741658748, "epoch": 7.353295862288054, "img/sec/core": 697.7171494954588, "core_hours_NVIDIA A100-SXM4-40GB": 3.7292767179688844, "core_hours": 3.7292767179688844} {"step": 9250, "global_schedule": 0.9248999953269958, "l2_grads": 1.3498097658157349, "l2_params": 253.69744873046875, "l2_updates": 0.9594866633415222, "train/loss": 4.186370849609375, "uptime": 1924.0993250049996, "examples_seen": 9472000.0, "progress": 0.08214701206895021, "epoch": 7.3932594267570115, "img/sec/core": 733.0557469991419, "core_hours_NVIDIA A100-SXM4-40GB": 3.7486780012688827, "core_hours": 3.7486780012688827} {"step": 9300, "global_schedule": 0.9298999905586243, "l2_grads": 1.2699105739593506, "l2_params": 254.29757690429688, "l2_updates": 0.9928895831108093, "train/loss": 4.319813251495361, "uptime": 1932.739224537001, "examples_seen": 9523200.0, "progress": 0.08259104997202561, "epoch": 7.433222991225969, "img/sec/core": 740.7493543524386, "core_hours_NVIDIA A100-SXM4-40GB": 3.7678777780066635, "core_hours": 3.7678777780066635} {"step": 9350, "global_schedule": 0.9348999857902527, "l2_grads": 1.2497246265411377, "l2_params": 254.94183349609375, "l2_updates": 1.014210820198059, "train/loss": 4.204784393310547, "uptime": 1941.1817577090005, "examples_seen": 9574400.0, "progress": 0.08303508787510101, "epoch": 7.473186555694925, "img/sec/core": 758.0663137014691, "core_hours_NVIDIA A100-SXM4-40GB": 3.786638962833329, "core_hours": 3.786638962833329} {"step": 9400, "global_schedule": 0.9398999810218811, "l2_grads": 1.2373573780059814, "l2_params": 255.58889770507812, "l2_updates": 1.0031955242156982, "train/loss": 4.167064666748047, "uptime": 1949.6589503000014, "examples_seen": 9625600.0, "progress": 0.08347912577817643, "epoch": 7.513150120163882, "img/sec/core": 754.9669222796772, "core_hours_NVIDIA A100-SXM4-40GB": 3.805477168591109, "core_hours": 3.805477168591109} {"step": 9450, "global_schedule": 0.9448999762535095, "l2_grads": 1.4264415502548218, "l2_params": 256.23016357421875, "l2_updates": 0.9689245223999023, "train/loss": 4.152756214141846, "uptime": 1958.035905793, "examples_seen": 9676800.0, "progress": 0.08392316368125183, "epoch": 7.553113684632839, "img/sec/core": 764.000716650467, "core_hours_NVIDIA A100-SXM4-40GB": 3.8240926252422165, "core_hours": 3.8240926252422165} {"step": 9500, "global_schedule": 0.9498999714851379, "l2_grads": 1.2059465646743774, "l2_params": 256.8316955566406, "l2_updates": 0.9984405040740967, "train/loss": 4.130716800689697, "uptime": 1966.3349193860013, "examples_seen": 9728000.0, "progress": 0.08436720158432724, "epoch": 7.593077249101795, "img/sec/core": 771.1759871555381, "core_hours_NVIDIA A100-SXM4-40GB": 3.8425348776711084, "core_hours": 3.8425348776711084} {"step": 9550, "global_schedule": 0.9548999667167664, "l2_grads": 0.9528564214706421, "l2_params": 257.4884338378906, "l2_updates": 0.9501916170120239, "train/loss": 5.509942531585693, "uptime": 1974.6916892650006, "examples_seen": 9779200.0, "progress": 0.08481123948740264, "epoch": 7.633040813570752, "img/sec/core": 765.8461454207662, "core_hours_NVIDIA A100-SXM4-40GB": 3.861105477402218, "core_hours": 3.861105477402218} {"step": 9600, "global_schedule": 0.9598999619483948, "l2_grads": 1.195391297340393, "l2_params": 258.149658203125, "l2_updates": 1.0135891437530518, "train/loss": 4.169358730316162, "uptime": 1982.9873867670012, "examples_seen": 9830400.0, "progress": 0.08525527739047806, "epoch": 7.6730043780397095, "img/sec/core": 771.4842541518121, "core_hours_NVIDIA A100-SXM4-40GB": 3.879540360739997, "core_hours": 3.879540360739997} {"step": 9650, "global_schedule": 0.9648999571800232, "l2_grads": 0.997139573097229, "l2_params": 258.8510437011719, "l2_updates": 0.962028443813324, "train/loss": 4.966435432434082, "uptime": 1991.3454412600004, "examples_seen": 9881600.0, "progress": 0.08569931529355346, "epoch": 7.712967942508666, "img/sec/core": 765.7284366069584, "core_hours_NVIDIA A100-SXM4-40GB": 3.898113815168884, "core_hours": 3.898113815168884} {"step": 9700, "global_schedule": 0.9698999524116516, "l2_grads": 1.3920485973358154, "l2_params": 259.5350341796875, "l2_updates": 0.9788886308670044, "train/loss": 4.047940254211426, "uptime": 2000.2842292490004, "examples_seen": 9932800.0, "progress": 0.08614335319662886, "epoch": 7.752931506977623, "img/sec/core": 715.980735629456, "core_hours_NVIDIA A100-SXM4-40GB": 3.917977788477773, "core_hours": 3.917977788477773} {"step": 9750, "global_schedule": 0.97489994764328, "l2_grads": 1.145172357559204, "l2_params": 260.17620849609375, "l2_updates": 1.065352439880371, "train/loss": 4.483186721801758, "uptime": 2009.3603080560006, "examples_seen": 9984000.0, "progress": 0.08658739109970427, "epoch": 7.79289507144658, "img/sec/core": 705.1503337612975, "core_hours_NVIDIA A100-SXM4-40GB": 3.9381468524933294, "core_hours": 3.9381468524933294} {"step": 9800, "global_schedule": 0.9799000024795532, "l2_grads": 0.8788121938705444, "l2_params": 260.815185546875, "l2_updates": 0.994546115398407, "train/loss": 5.919629096984863, "uptime": 2018.2891783110008, "examples_seen": 10035200.0, "progress": 0.08703142900277967, "epoch": 7.832858635915536, "img/sec/core": 716.7760105390671, "core_hours_NVIDIA A100-SXM4-40GB": 3.9579887863933294, "core_hours": 3.9579887863933294} {"step": 9850, "global_schedule": 0.9848999977111816, "l2_grads": 1.4416025876998901, "l2_params": 261.52349853515625, "l2_updates": 1.061081051826477, "train/loss": 4.032670974731445, "uptime": 2026.8558564650011, "examples_seen": 10086400.0, "progress": 0.08747546690585509, "epoch": 7.872822200384493, "img/sec/core": 747.0807102764135, "core_hours_NVIDIA A100-SXM4-40GB": 3.9770258489577746, "core_hours": 3.9770258489577746} {"step": 9900, "global_schedule": 0.9898999929428101, "l2_grads": 1.6814873218536377, "l2_params": 262.1935119628906, "l2_updates": 0.9920998215675354, "train/loss": 4.257248401641846, "uptime": 2035.9867326149997, "examples_seen": 10137600.0, "progress": 0.08791950480893049, "epoch": 7.91278576485345, "img/sec/core": 700.9184983853922, "core_hours_NVIDIA A100-SXM4-40GB": 3.9973166848466604, "core_hours": 3.9973166848466604} {"step": 9950, "global_schedule": 0.9948999881744385, "l2_grads": 1.3066749572753906, "l2_params": 262.8629455566406, "l2_updates": 0.9425944089889526, "train/loss": 4.910287857055664, "uptime": 2045.1506054250003, "examples_seen": 10188800.0, "progress": 0.0883635427120059, "epoch": 7.9527493293224065, "img/sec/core": 698.3946779592604, "core_hours_NVIDIA A100-SXM4-40GB": 4.017680846646662, "core_hours": 4.017680846646662} {"step": 10000, "global_schedule": 0.9998999834060669, "l2_grads": 1.2037643194198608, "l2_params": 263.56561279296875, "l2_updates": 1.0394872426986694, "train/loss": 4.026905536651611, "uptime": 2053.59687949, "examples_seen": 10240000.0, "progress": 0.0888075806150813, "epoch": 7.992712893791364, "img/sec/core": 757.7305627011109, "core_hours_NVIDIA A100-SXM4-40GB": 4.036450344568883, "core_hours": 4.036450344568883, "val/acc@1": 0.34472, "val/loss": 3.0967336474609377, "z/secs/eval/val": 2.5879256409989466} {"step": 10050, "global_schedule": 0.9999994039535522, "l2_grads": 1.2060045003890991, "l2_params": 264.1851806640625, "l2_updates": 1.0617982149124146, "train/loss": 4.155440807342529, "uptime": 2065.6103467700013, "examples_seen": 10291200.0, "progress": 0.08925161851815672, "epoch": 8.03267645826032, "img/sec/core": 728.6470592928846, "core_hours_NVIDIA A100-SXM4-40GB": 4.055969015564446, "core_hours": 4.055969015564446} {"step": 10100, "global_schedule": 0.9999977350234985, "l2_grads": 1.296430230140686, "l2_params": 264.942138671875, "l2_updates": 1.0443862676620483, "train/loss": 4.21400785446167, "uptime": 2074.095067716, "examples_seen": 10342400.0, "progress": 0.08969565642123212, "epoch": 8.072640022729278, "img/sec/core": 754.2970523996165, "core_hours_NVIDIA A100-SXM4-40GB": 4.074823950999998, "core_hours": 4.074823950999998} {"step": 10150, "global_schedule": 0.9999947547912598, "l2_grads": 1.2846834659576416, "l2_params": 265.6836242675781, "l2_updates": 1.0883591175079346, "train/loss": 4.000758647918701, "uptime": 2083.0986828309997, "examples_seen": 10393600.0, "progress": 0.09013969432430752, "epoch": 8.112603587198235, "img/sec/core": 710.825587084212, "core_hours_NVIDIA A100-SXM4-40GB": 4.094831984588887, "core_hours": 4.094831984588887} {"step": 10200, "global_schedule": 0.999990701675415, "l2_grads": 1.2266631126403809, "l2_params": 266.3954772949219, "l2_updates": 1.0052536725997925, "train/loss": 3.993025779724121, "uptime": 2092.1004688930007, "examples_seen": 10444800.0, "progress": 0.09058373222738293, "epoch": 8.15256715166719, "img/sec/core": 710.9700181629697, "core_hours_NVIDIA A100-SXM4-40GB": 4.114835953615556, "core_hours": 4.114835953615556} {"step": 10250, "global_schedule": 0.9999854564666748, "l2_grads": 0.86759352684021, "l2_params": 266.9893798828125, "l2_updates": 0.9846769571304321, "train/loss": 5.924134254455566, "uptime": 2100.631011804, "examples_seen": 10496000.0, "progress": 0.09102777013045833, "epoch": 8.192530716136147, "img/sec/core": 750.2453321872081, "core_hours_NVIDIA A100-SXM4-40GB": 4.133792715639999, "core_hours": 4.133792715639999} {"step": 10300, "global_schedule": 0.9999790191650391, "l2_grads": 0.9390602707862854, "l2_params": 267.71661376953125, "l2_updates": 1.0237388610839844, "train/loss": 5.476423263549805, "uptime": 2109.0735952100003, "examples_seen": 10547200.0, "progress": 0.09147180803353375, "epoch": 8.232494280605104, "img/sec/core": 758.0618031503753, "core_hours_NVIDIA A100-SXM4-40GB": 4.152554012097777, "core_hours": 4.152554012097777} {"step": 10350, "global_schedule": 0.9999714493751526, "l2_grads": 1.0327210426330566, "l2_params": 268.3476257324219, "l2_updates": 1.0430103540420532, "train/loss": 4.893980503082275, "uptime": 2117.8150468130007, "examples_seen": 10598400.0, "progress": 0.09191584593660915, "epoch": 8.272457845074062, "img/sec/core": 732.1438464297324, "core_hours_NVIDIA A100-SXM4-40GB": 4.171979460104445, "core_hours": 4.171979460104445} {"step": 10400, "global_schedule": 0.9999626874923706, "l2_grads": 1.139664649963379, "l2_params": 269.0352478027344, "l2_updates": 1.0463366508483887, "train/loss": 4.469531059265137, "uptime": 2126.621073139, "examples_seen": 10649600.0, "progress": 0.09235988383968456, "epoch": 8.312421409543019, "img/sec/core": 726.775024633327, "core_hours_NVIDIA A100-SXM4-40GB": 4.191548407495555, "core_hours": 4.191548407495555} {"step": 10450, "global_schedule": 0.9999527931213379, "l2_grads": 1.126116394996643, "l2_params": 269.6680603027344, "l2_updates": 1.0745022296905518, "train/loss": 4.216222763061523, "uptime": 2135.3256408220004, "examples_seen": 10700800.0, "progress": 0.09280392174275996, "epoch": 8.352384974011976, "img/sec/core": 735.2461642062915, "core_hours_NVIDIA A100-SXM4-40GB": 4.210891891235556, "core_hours": 4.210891891235556} {"step": 10500, "global_schedule": 0.9999416470527649, "l2_grads": 1.0084470510482788, "l2_params": 270.2828369140625, "l2_updates": 1.0174007415771484, "train/loss": 6.076140403747559, "uptime": 2144.036524680001, "examples_seen": 10752000.0, "progress": 0.09324795964583536, "epoch": 8.392348538480931, "img/sec/core": 734.7130445461976, "core_hours_NVIDIA A100-SXM4-40GB": 4.230249410920001, "core_hours": 4.230249410920001} {"step": 10550, "global_schedule": 0.9999293684959412, "l2_grads": 1.0073413848876953, "l2_params": 270.87860107421875, "l2_updates": 1.0411139726638794, "train/loss": 5.509415626525879, "uptime": 2153.358708863001, "examples_seen": 10803200.0, "progress": 0.09369199754891078, "epoch": 8.432312102949888, "img/sec/core": 686.5343866162923, "core_hours_NVIDIA A100-SXM4-40GB": 4.250965375771112, "core_hours": 4.250965375771112} {"step": 10600, "global_schedule": 0.9999158978462219, "l2_grads": 0.818238377571106, "l2_params": 271.5255432128906, "l2_updates": 0.9536301493644714, "train/loss": 5.338136672973633, "uptime": 2161.7806444380003, "examples_seen": 10854400.0, "progress": 0.09413603545198618, "epoch": 8.472275667418845, "img/sec/core": 759.9203227104464, "core_hours_NVIDIA A100-SXM4-40GB": 4.26968078816, "core_hours": 4.26968078816} {"step": 10650, "global_schedule": 0.999901294708252, "l2_grads": 0.842587411403656, "l2_params": 272.01556396484375, "l2_updates": 0.973650336265564, "train/loss": 5.8122148513793945, "uptime": 2170.118504879001, "examples_seen": 10905600.0, "progress": 0.09458007335506159, "epoch": 8.512239231887802, "img/sec/core": 767.583008289323, "core_hours_NVIDIA A100-SXM4-40GB": 4.288209366917779, "core_hours": 4.288209366917779} {"step": 10700, "global_schedule": 0.9998854994773865, "l2_grads": 0.9972146153450012, "l2_params": 272.5759582519531, "l2_updates": 1.0544592142105103, "train/loss": 5.114058494567871, "uptime": 2178.5810045690014, "examples_seen": 10956800.0, "progress": 0.09502411125813699, "epoch": 8.55220279635676, "img/sec/core": 756.2777234204967, "core_hours_NVIDIA A100-SXM4-40GB": 4.307014921784446, "core_hours": 4.307014921784446} {"step": 10750, "global_schedule": 0.9998685121536255, "l2_grads": 0.896084189414978, "l2_params": 273.1321105957031, "l2_updates": 0.9280884265899658, "train/loss": 4.913329124450684, "uptime": 2187.643119284001, "examples_seen": 11008000.0, "progress": 0.0954681491612124, "epoch": 8.592166360825717, "img/sec/core": 706.2369216543642, "core_hours_NVIDIA A100-SXM4-40GB": 4.327152954484445, "core_hours": 4.327152954484445} {"step": 10800, "global_schedule": 0.9998503923416138, "l2_grads": 0.7758012413978577, "l2_params": 273.77093505859375, "l2_updates": 1.0158826112747192, "train/loss": 5.697793960571289, "uptime": 2196.640435835001, "examples_seen": 11059200.0, "progress": 0.09591218706428781, "epoch": 8.632129925294672, "img/sec/core": 711.3231999477275, "core_hours_NVIDIA A100-SXM4-40GB": 4.347146991264446, "core_hours": 4.347146991264446} {"step": 10850, "global_schedule": 0.9998310804367065, "l2_grads": 0.9330188632011414, "l2_params": 274.3775939941406, "l2_updates": 1.008656620979309, "train/loss": 4.627009868621826, "uptime": 2205.5429503900014, "examples_seen": 11110400.0, "progress": 0.09635622496736321, "epoch": 8.672093489763629, "img/sec/core": 718.8980102711809, "core_hours_NVIDIA A100-SXM4-40GB": 4.366930356942223, "core_hours": 4.366930356942223} {"step": 10900, "global_schedule": 0.9998105764389038, "l2_grads": 0.795693039894104, "l2_params": 275.02813720703125, "l2_updates": 0.9392260909080505, "train/loss": 5.7788190841674805, "uptime": 2214.205126187, "examples_seen": 11161600.0, "progress": 0.09680026287043862, "epoch": 8.712057054232586, "img/sec/core": 738.8443908304694, "core_hours_NVIDIA A100-SXM4-40GB": 4.38617963649111, "core_hours": 4.38617963649111} {"step": 10950, "global_schedule": 0.9997889399528503, "l2_grads": 1.2915416955947876, "l2_params": 275.6253662109375, "l2_updates": 1.0876842737197876, "train/loss": 3.894700527191162, "uptime": 2222.669652797, "examples_seen": 11212800.0, "progress": 0.09724430077351402, "epoch": 8.752020618701543, "img/sec/core": 756.096624758588, "core_hours_NVIDIA A100-SXM4-40GB": 4.404989695624442, "core_hours": 4.404989695624442} {"step": 11000, "global_schedule": 0.9997661113739014, "l2_grads": 0.8580338954925537, "l2_params": 276.2099914550781, "l2_updates": 1.0204684734344482, "train/loss": 6.013738632202148, "uptime": 2231.203637462, "examples_seen": 11264000.0, "progress": 0.09768833867658944, "epoch": 8.7919841831705, "img/sec/core": 749.9427584218313, "core_hours_NVIDIA A100-SXM4-40GB": 4.42395410599111, "core_hours": 4.42395410599111} {"step": 11050, "global_schedule": 0.9997421503067017, "l2_grads": 1.3180699348449707, "l2_params": 276.7318420410156, "l2_updates": 1.0846426486968994, "train/loss": 4.32362699508667, "uptime": 2240.8154310480004, "examples_seen": 11315200.0, "progress": 0.09813237657966484, "epoch": 8.831947747639457, "img/sec/core": 738.0744408434704, "core_hours_NVIDIA A100-SXM4-40GB": 4.443223466146664, "core_hours": 4.443223466146664} {"step": 11100, "global_schedule": 0.9997169375419617, "l2_grads": 0.958523690700531, "l2_params": 277.2255859375, "l2_updates": 1.0357680320739746, "train/loss": 5.244359970092773, "uptime": 2249.7541305820014, "examples_seen": 11366400.0, "progress": 0.09857641448274025, "epoch": 8.871911312108413, "img/sec/core": 715.9878207848587, "core_hours_NVIDIA A100-SXM4-40GB": 4.463087242888889, "core_hours": 4.463087242888889} {"step": 11150, "global_schedule": 0.999690592288971, "l2_grads": 0.9055464267730713, "l2_params": 277.78240966796875, "l2_updates": 1.0138880014419556, "train/loss": 5.574686050415039, "uptime": 2258.605637898001, "examples_seen": 11417600.0, "progress": 0.09902045238581565, "epoch": 8.91187487657737, "img/sec/core": 723.0406948239842, "core_hours_NVIDIA A100-SXM4-40GB": 4.482757259146666, "core_hours": 4.482757259146666} {"step": 11200, "global_schedule": 0.9996631145477295, "l2_grads": 1.279990792274475, "l2_params": 278.36328125, "l2_updates": 1.0534796714782715, "train/loss": 3.921111583709717, "uptime": 2267.433604089001, "examples_seen": 11468800.0, "progress": 0.09946449028889107, "epoch": 8.951838441046327, "img/sec/core": 724.9687936644633, "core_hours_NVIDIA A100-SXM4-40GB": 4.5023749617933335, "core_hours": 4.5023749617933335} {"step": 11250, "global_schedule": 0.9996343851089478, "l2_grads": 1.378275752067566, "l2_params": 278.8249816894531, "l2_updates": 1.077122449874878, "train/loss": 3.976081609725952, "uptime": 2275.8192757430006, "examples_seen": 11520000.0, "progress": 0.09990852819196647, "epoch": 8.991802005515284, "img/sec/core": 763.206605752038, "core_hours_NVIDIA A100-SXM4-40GB": 4.52100978769111, "core_hours": 4.52100978769111} {"step": 11300, "global_schedule": 0.9996045827865601, "l2_grads": 0.8018187284469604, "l2_params": 279.367431640625, "l2_updates": 0.9419171810150146, "train/loss": 5.6899871826171875, "uptime": 2284.9640011990014, "examples_seen": 11571200.0, "progress": 0.10035256609504187, "epoch": 9.031765569984241, "img/sec/core": 699.8569864992872, "core_hours_NVIDIA A100-SXM4-40GB": 4.541331399815556, "core_hours": 4.541331399815556} {"step": 11350, "global_schedule": 0.9995735287666321, "l2_grads": 1.1891746520996094, "l2_params": 279.9140319824219, "l2_updates": 1.1093050241470337, "train/loss": 3.961397171020508, "uptime": 2293.5906573890006, "examples_seen": 11622400.0, "progress": 0.10079660399811728, "epoch": 9.071729134453198, "img/sec/core": 741.8865269511273, "core_hours_NVIDIA A100-SXM4-40GB": 4.5605017469044435, "core_hours": 4.5605017469044435} {"step": 11400, "global_schedule": 0.9995413422584534, "l2_grads": 1.2332128286361694, "l2_params": 280.530517578125, "l2_updates": 1.0770947933197021, "train/loss": 3.78645658493042, "uptime": 2302.8385143860014, "examples_seen": 11673600.0, "progress": 0.10124064190119268, "epoch": 9.111692698922155, "img/sec/core": 692.0522237828305, "core_hours_NVIDIA A100-SXM4-40GB": 4.581052540231111, "core_hours": 4.581052540231111} {"step": 11450, "global_schedule": 0.9995079636573792, "l2_grads": 1.1789045333862305, "l2_params": 281.1133117675781, "l2_updates": 1.0260510444641113, "train/loss": 3.751701593399048, "uptime": 2312.1050459240014, "examples_seen": 11724800.0, "progress": 0.1016846798042681, "epoch": 9.15165626339111, "img/sec/core": 690.657553341833, "core_hours_NVIDIA A100-SXM4-40GB": 4.601644832537778, "core_hours": 4.601644832537778} {"step": 11500, "global_schedule": 0.9994734525680542, "l2_grads": 1.3425214290618896, "l2_params": 281.6195373535156, "l2_updates": 1.0698778629302979, "train/loss": 3.8049302101135254, "uptime": 2320.7727177550005, "examples_seen": 11776000.0, "progress": 0.1021287177073435, "epoch": 9.191619827860068, "img/sec/core": 738.3759012553998, "core_hours_NVIDIA A100-SXM4-40GB": 4.620906325495554, "core_hours": 4.620906325495554} {"step": 11550, "global_schedule": 0.9994377493858337, "l2_grads": 1.2408291101455688, "l2_params": 282.0204162597656, "l2_updates": 1.0564255714416504, "train/loss": 3.8436169624328613, "uptime": 2329.8423592090003, "examples_seen": 11827200.0, "progress": 0.10257275561041891, "epoch": 9.231583392329025, "img/sec/core": 705.6508278149786, "core_hours_NVIDIA A100-SXM4-40GB": 4.641061084282219, "core_hours": 4.641061084282219} {"step": 11600, "global_schedule": 0.9994008541107178, "l2_grads": 1.192142367362976, "l2_params": 282.5394592285156, "l2_updates": 1.122583031654358, "train/loss": 3.795660972595215, "uptime": 2338.371041057, "examples_seen": 11878400.0, "progress": 0.10301679351349431, "epoch": 9.271546956797982, "img/sec/core": 750.4090449218585, "core_hours_NVIDIA A100-SXM4-40GB": 4.660013710611109, "core_hours": 4.660013710611109} {"step": 11650, "global_schedule": 0.9993628263473511, "l2_grads": 1.1267999410629272, "l2_params": 283.1496887207031, "l2_updates": 1.0670291185379028, "train/loss": 4.641560077667236, "uptime": 2346.993583953001, "examples_seen": 11929600.0, "progress": 0.10346083141656971, "epoch": 9.31151052126694, "img/sec/core": 742.2404361674465, "core_hours_NVIDIA A100-SXM4-40GB": 4.679174917046666, "core_hours": 4.679174917046666} {"step": 11700, "global_schedule": 0.9993236064910889, "l2_grads": 1.1413663625717163, "l2_params": 283.68267822265625, "l2_updates": 1.124226689338684, "train/loss": 3.8281097412109375, "uptime": 2355.6627995119998, "examples_seen": 11980800.0, "progress": 0.10390486931964513, "epoch": 9.351474085735896, "img/sec/core": 738.2444185917778, "core_hours_NVIDIA A100-SXM4-40GB": 4.698439840511108, "core_hours": 4.698439840511108} {"step": 11750, "global_schedule": 0.9992831945419312, "l2_grads": 0.913998544216156, "l2_params": 284.2589111328125, "l2_updates": 1.048657774925232, "train/loss": 4.821071147918701, "uptime": 2364.151979465001, "examples_seen": 12032000.0, "progress": 0.10434890722272053, "epoch": 9.391437650204852, "img/sec/core": 753.9008520766735, "core_hours_NVIDIA A100-SXM4-40GB": 4.717304684851111, "core_hours": 4.717304684851111} {"step": 11800, "global_schedule": 0.9992416501045227, "l2_grads": 1.0807180404663086, "l2_params": 284.7250671386719, "l2_updates": 1.0306848287582397, "train/loss": 4.620946884155273, "uptime": 2372.543242040001, "examples_seen": 12083200.0, "progress": 0.10479294512579594, "epoch": 9.431401214673809, "img/sec/core": 762.6980973122576, "core_hours_NVIDIA A100-SXM4-40GB": 4.735951935017778, "core_hours": 4.735951935017778} {"step": 11850, "global_schedule": 0.9991989135742188, "l2_grads": 1.3129223585128784, "l2_params": 285.260009765625, "l2_updates": 1.0323001146316528, "train/loss": 3.887240409851074, "uptime": 2381.635952509001, "examples_seen": 12134400.0, "progress": 0.10523698302887134, "epoch": 9.471364779142766, "img/sec/core": 703.8605289170615, "core_hours_NVIDIA A100-SXM4-40GB": 4.7561579582822215, "core_hours": 4.7561579582822215} {"step": 11900, "global_schedule": 0.9991550445556641, "l2_grads": 1.5521516799926758, "l2_params": 285.7662048339844, "l2_updates": 0.9801872968673706, "train/loss": 3.7812130451202393, "uptime": 2390.9405701760006, "examples_seen": 12185600.0, "progress": 0.10568102093194676, "epoch": 9.511328343611723, "img/sec/core": 687.8305191086699, "core_hours_NVIDIA A100-SXM4-40GB": 4.776834886431109, "core_hours": 4.776834886431109} {"step": 11950, "global_schedule": 0.9991099834442139, "l2_grads": 1.175847053527832, "l2_params": 286.20501708984375, "l2_updates": 1.1065081357955933, "train/loss": 3.732252597808838, "uptime": 2400.030776582, "examples_seen": 12236800.0, "progress": 0.10612505883502216, "epoch": 9.55129190808068, "img/sec/core": 704.0544201258443, "core_hours_NVIDIA A100-SXM4-40GB": 4.797035345111108, "core_hours": 4.797035345111108} {"step": 12000, "global_schedule": 0.9990637302398682, "l2_grads": 1.4768637418746948, "l2_params": 286.7170104980469, "l2_updates": 0.9757872819900513, "train/loss": 3.7661356925964355, "uptime": 2409.1579381250012, "examples_seen": 12288000.0, "progress": 0.10656909673809756, "epoch": 9.591255472549637, "img/sec/core": 701.2037608677399, "core_hours_NVIDIA A100-SXM4-40GB": 4.817317926317778, "core_hours": 4.817317926317778} {"step": 12050, "global_schedule": 0.999016284942627, "l2_grads": 1.3025976419448853, "l2_params": 287.1568298339844, "l2_updates": 1.0648332834243774, "train/loss": 3.6897788047790527, "uptime": 2418.137821944001, "examples_seen": 12339200.0, "progress": 0.10701313464117297, "epoch": 9.631219037018592, "img/sec/core": 807.3960144375849, "core_hours_NVIDIA A100-SXM4-40GB": 4.834932853773333, "core_hours": 4.834932853773333} {"step": 12100, "global_schedule": 0.9989677667617798, "l2_grads": 1.147552251815796, "l2_params": 287.6923828125, "l2_updates": 1.0224807262420654, "train/loss": 3.7771522998809814, "uptime": 2426.594565728001, "examples_seen": 12390400.0, "progress": 0.10745717254424837, "epoch": 9.67118260148755, "img/sec/core": 756.7924680547803, "core_hours_NVIDIA A100-SXM4-40GB": 4.853725617737776, "core_hours": 4.853725617737776} {"step": 12150, "global_schedule": 0.9989179372787476, "l2_grads": 1.139087200164795, "l2_params": 288.1593322753906, "l2_updates": 1.0098280906677246, "train/loss": 3.7992782592773438, "uptime": 2435.2009042669997, "examples_seen": 12441600.0, "progress": 0.10790121044732379, "epoch": 9.711146165956507, "img/sec/core": 743.6379560249623, "core_hours_NVIDIA A100-SXM4-40GB": 4.872850814491106, "core_hours": 4.872850814491106} {"step": 12200, "global_schedule": 0.9988670349121094, "l2_grads": 1.1799113750457764, "l2_params": 288.6170654296875, "l2_updates": 1.1022077798843384, "train/loss": 3.8146109580993652, "uptime": 2443.6595379130013, "examples_seen": 12492800.0, "progress": 0.10834524835039919, "epoch": 9.751109730425464, "img/sec/core": 756.6233824330866, "core_hours_NVIDIA A100-SXM4-40GB": 4.891647778148888, "core_hours": 4.891647778148888} {"step": 12250, "global_schedule": 0.9988149404525757, "l2_grads": 0.9609447121620178, "l2_params": 289.1090393066406, "l2_updates": 0.9536007642745972, "train/loss": 4.862606525421143, "uptime": 2452.72193935, "examples_seen": 12544000.0, "progress": 0.1087892862534746, "epoch": 9.79107329489442, "img/sec/core": 706.2145772831228, "core_hours_NVIDIA A100-SXM4-40GB": 4.911786448008885, "core_hours": 4.911786448008885} {"step": 12300, "global_schedule": 0.9987617135047913, "l2_grads": 1.309814453125, "l2_params": 289.527099609375, "l2_updates": 1.0693373680114746, "train/loss": 3.832263946533203, "uptime": 2461.859288757001, "examples_seen": 12595200.0, "progress": 0.10923332415655, "epoch": 9.831036859363378, "img/sec/core": 700.4219402068809, "core_hours_NVIDIA A100-SXM4-40GB": 4.9320916689133325, "core_hours": 4.9320916689133325} {"step": 12350, "global_schedule": 0.9987072944641113, "l2_grads": 1.1071279048919678, "l2_params": 289.95196533203125, "l2_updates": 1.0123413801193237, "train/loss": 4.140542030334473, "uptime": 2470.3094505830013, "examples_seen": 12646400.0, "progress": 0.10967736205962542, "epoch": 9.871000423832333, "img/sec/core": 757.3819450780202, "core_hours_NVIDIA A100-SXM4-40GB": 4.950869806304444, "core_hours": 4.950869806304444} {"step": 12400, "global_schedule": 0.9986517429351807, "l2_grads": 1.4426923990249634, "l2_params": 290.3678283691406, "l2_updates": 0.9420751333236694, "train/loss": 3.691215753555298, "uptime": 2478.7462255950013, "examples_seen": 12697600.0, "progress": 0.11012139996270082, "epoch": 9.91096398830129, "img/sec/core": 758.5836994464113, "core_hours_NVIDIA A100-SXM4-40GB": 4.969618195219999, "core_hours": 4.969618195219999} {"step": 12450, "global_schedule": 0.9985949397087097, "l2_grads": 1.1722400188446045, "l2_params": 290.7190246582031, "l2_updates": 1.0568084716796875, "train/loss": 3.7437198162078857, "uptime": 2487.557985839001, "examples_seen": 12748800.0, "progress": 0.11056543786577622, "epoch": 9.950927552770247, "img/sec/core": 726.3021034143546, "core_hours_NVIDIA A100-SXM4-40GB": 4.98919988465111, "core_hours": 4.98919988465111} {"step": 12500, "global_schedule": 0.998537003993988, "l2_grads": 1.2109498977661133, "l2_params": 291.1400146484375, "l2_updates": 1.0632580518722534, "train/loss": 3.654829263687134, "uptime": 2496.1214666120013, "examples_seen": 12800000.0, "progress": 0.11100947576885163, "epoch": 9.990891117239205, "img/sec/core": 747.3596507834189, "core_hours_NVIDIA A100-SXM4-40GB": 5.008229841924444, "core_hours": 5.008229841924444, "val/acc@1": 0.41012, "val/loss": 2.7527794384765625, "z/secs/eval/val": 2.6007621989992913} {"step": 12550, "global_schedule": 0.9984779357910156, "l2_grads": 1.1841248273849487, "l2_params": 291.6455993652344, "l2_updates": 1.0592204332351685, "train/loss": 4.012051105499268, "uptime": 2507.4633927209998, "examples_seen": 12851200.0, "progress": 0.11145351367192703, "epoch": 10.030854681708162, "img/sec/core": 732.2379851216497, "core_hours_NVIDIA A100-SXM4-40GB": 5.027652792537775, "core_hours": 5.027652792537775} {"step": 12600, "global_schedule": 0.9984176158905029, "l2_grads": 1.1955313682556152, "l2_params": 292.0773620605469, "l2_updates": 1.0170068740844727, "train/loss": 3.7716064453125, "uptime": 2515.8646291550012, "examples_seen": 12902400.0, "progress": 0.11189755157500245, "epoch": 10.070818246177119, "img/sec/core": 761.792630201184, "core_hours_NVIDIA A100-SXM4-40GB": 5.046322206835555, "core_hours": 5.046322206835555} {"step": 12650, "global_schedule": 0.9983562231063843, "l2_grads": 0.9026830196380615, "l2_params": 292.50909423828125, "l2_updates": 1.063474178314209, "train/loss": 5.950062274932861, "uptime": 2524.613623856001, "examples_seen": 12953600.0, "progress": 0.11234158947807785, "epoch": 10.110781810646076, "img/sec/core": 731.5126158744341, "core_hours_NVIDIA A100-SXM4-40GB": 5.065764417282222, "core_hours": 5.065764417282222} {"step": 12700, "global_schedule": 0.9982936382293701, "l2_grads": 1.3254598379135132, "l2_params": 292.9806823730469, "l2_updates": 1.063274621963501, "train/loss": 3.660339832305908, "uptime": 2533.216218114001, "examples_seen": 13004800.0, "progress": 0.11278562738115326, "epoch": 10.150745375115031, "img/sec/core": 743.9616246050825, "core_hours_NVIDIA A100-SXM4-40GB": 5.084881293411111, "core_hours": 5.084881293411111} {"step": 12750, "global_schedule": 0.9982298612594604, "l2_grads": 1.3996026515960693, "l2_params": 293.4214782714844, "l2_updates": 0.9669883251190186, "train/loss": 3.8965835571289062, "uptime": 2542.3909698120005, "examples_seen": 13056000.0, "progress": 0.11322966528422866, "epoch": 10.190708939583988, "img/sec/core": 697.5665620896873, "core_hours_NVIDIA A100-SXM4-40GB": 5.1052696305177765, "core_hours": 5.1052696305177765} {"step": 12800, "global_schedule": 0.9981648921966553, "l2_grads": 1.1212836503982544, "l2_params": 293.75616455078125, "l2_updates": 1.0075654983520508, "train/loss": 5.229947090148926, "uptime": 2551.149415578, "examples_seen": 13107200.0, "progress": 0.11367370318730406, "epoch": 10.230672504052945, "img/sec/core": 730.7232551287702, "core_hours_NVIDIA A100-SXM4-40GB": 5.124732843331108, "core_hours": 5.124732843331108} {"step": 12850, "global_schedule": 0.9980987906455994, "l2_grads": 1.2226344347000122, "l2_params": 294.1864929199219, "l2_updates": 1.0584867000579834, "train/loss": 5.034521579742432, "uptime": 2560.3602692269997, "examples_seen": 13158400.0, "progress": 0.11411774109037948, "epoch": 10.270636068521902, "img/sec/core": 694.8324491829428, "core_hours_NVIDIA A100-SXM4-40GB": 5.145201406995552, "core_hours": 5.145201406995552} {"step": 12900, "global_schedule": 0.998031497001648, "l2_grads": 1.159246563911438, "l2_params": 294.63482666015625, "l2_updates": 1.0333704948425293, "train/loss": 3.6043286323547363, "uptime": 2569.150145619, "examples_seen": 13209600.0, "progress": 0.11456177899345488, "epoch": 10.31059963299086, "img/sec/core": 728.1103527035625, "core_hours_NVIDIA A100-SXM4-40GB": 5.164734465644441, "core_hours": 5.164734465644441} {"step": 12950, "global_schedule": 0.9979630708694458, "l2_grads": 1.2037450075149536, "l2_params": 295.0501708984375, "l2_updates": 1.1009801626205444, "train/loss": 3.464799404144287, "uptime": 2577.522136609001, "examples_seen": 13260800.0, "progress": 0.11500581689653029, "epoch": 10.350563197459817, "img/sec/core": 764.4537610759229, "core_hours_NVIDIA A100-SXM4-40GB": 5.183338890066666, "core_hours": 5.183338890066666} {"step": 13000, "global_schedule": 0.9978934526443481, "l2_grads": 1.2019625902175903, "l2_params": 295.42938232421875, "l2_updates": 1.0057014226913452, "train/loss": 3.7232346534729004, "uptime": 2585.975847687001, "examples_seen": 13312000.0, "progress": 0.11544985479960569, "epoch": 10.390526761928772, "img/sec/core": 757.0639617262599, "core_hours_NVIDIA A100-SXM4-40GB": 5.202124914684444, "core_hours": 5.202124914684444} {"step": 13050, "global_schedule": 0.9978227019309998, "l2_grads": 1.2135841846466064, "l2_params": 295.7861633300781, "l2_updates": 1.042748212814331, "train/loss": 3.477708339691162, "uptime": 2595.0340474269997, "examples_seen": 13363200.0, "progress": 0.1158938927026811, "epoch": 10.430490326397729, "img/sec/core": 767.8610325105003, "core_hours_NVIDIA A100-SXM4-40GB": 5.2206467846844395, "core_hours": 5.2206467846844395} {"step": 13100, "global_schedule": 0.9977507591247559, "l2_grads": 1.33875572681427, "l2_params": 296.1610412597656, "l2_updates": 1.0139389038085938, "train/loss": 3.8660662174224854, "uptime": 2603.4792154429997, "examples_seen": 13414400.0, "progress": 0.1163379306057565, "epoch": 10.470453890866686, "img/sec/core": 757.8298013579723, "core_hours_NVIDIA A100-SXM4-40GB": 5.239413824719995, "core_hours": 5.239413824719995} {"step": 13150, "global_schedule": 0.9976776838302612, "l2_grads": 1.2106151580810547, "l2_params": 296.52056884765625, "l2_updates": 1.0229636430740356, "train/loss": 3.827202320098877, "uptime": 2611.9165134760005, "examples_seen": 13465600.0, "progress": 0.11678196850883191, "epoch": 10.510417455335643, "img/sec/core": 758.5366754816115, "core_hours_NVIDIA A100-SXM4-40GB": 5.2581633759044415, "core_hours": 5.2581633759044415} {"step": 13200, "global_schedule": 0.9976033568382263, "l2_grads": 1.1832377910614014, "l2_params": 296.9778747558594, "l2_updates": 1.0625675916671753, "train/loss": 4.0525102615356445, "uptime": 2620.310323044001, "examples_seen": 13516800.0, "progress": 0.11722600641190732, "epoch": 10.5503810198046, "img/sec/core": 762.4666664345766, "core_hours_NVIDIA A100-SXM4-40GB": 5.276816286055554, "core_hours": 5.276816286055554} {"step": 13250, "global_schedule": 0.9975279569625854, "l2_grads": 1.292513132095337, "l2_params": 297.34100341796875, "l2_updates": 1.0429338216781616, "train/loss": 3.6030051708221436, "uptime": 2629.369237653, "examples_seen": 13568000.0, "progress": 0.11767004431498272, "epoch": 10.590344584273558, "img/sec/core": 706.486403309565, "core_hours_NVIDIA A100-SXM4-40GB": 5.296947207408885, "core_hours": 5.296947207408885} {"step": 13300, "global_schedule": 0.9974513053894043, "l2_grads": 1.292931318283081, "l2_params": 297.67413330078125, "l2_updates": 1.0512691736221313, "train/loss": 3.412865161895752, "uptime": 2638.4661657100005, "examples_seen": 13619200.0, "progress": 0.11811408221805814, "epoch": 10.630308148742513, "img/sec/core": 703.5341996658719, "core_hours_NVIDIA A100-SXM4-40GB": 5.317162603091108, "core_hours": 5.317162603091108} {"step": 13350, "global_schedule": 0.9973735809326172, "l2_grads": 0.9827912449836731, "l2_params": 298.1074523925781, "l2_updates": 1.0561693906784058, "train/loss": 4.616840839385986, "uptime": 2647.285766399, "examples_seen": 13670400.0, "progress": 0.11855812012113354, "epoch": 10.67027171321147, "img/sec/core": 725.6564356686462, "core_hours_NVIDIA A100-SXM4-40GB": 5.336761715733329, "core_hours": 5.336761715733329} {"step": 13400, "global_schedule": 0.9972946047782898, "l2_grads": 1.186296820640564, "l2_params": 298.51043701171875, "l2_updates": 1.0505465269088745, "train/loss": 3.5899932384490967, "uptime": 2655.831127229001, "examples_seen": 13721600.0, "progress": 0.11900215802420895, "epoch": 10.710235277680427, "img/sec/core": 748.9443836626178, "core_hours_NVIDIA A100-SXM4-40GB": 5.355751406466665, "core_hours": 5.355751406466665} {"step": 13450, "global_schedule": 0.9972144961357117, "l2_grads": 1.2121775150299072, "l2_params": 298.88446044921875, "l2_updates": 1.1076124906539917, "train/loss": 3.7143986225128174, "uptime": 2664.3544581389997, "examples_seen": 13772800.0, "progress": 0.11944619592728435, "epoch": 10.750198842149384, "img/sec/core": 750.8801509152117, "core_hours_NVIDIA A100-SXM4-40GB": 5.3746921418222176, "core_hours": 5.3746921418222176} {"step": 13500, "global_schedule": 0.9971332550048828, "l2_grads": 1.3058661222457886, "l2_params": 299.2703552246094, "l2_updates": 1.0281846523284912, "train/loss": 3.63372802734375, "uptime": 2673.1116773880003, "examples_seen": 13824000.0, "progress": 0.11989023383035977, "epoch": 10.790162406618341, "img/sec/core": 730.825598631708, "core_hours_NVIDIA A100-SXM4-40GB": 5.394152629042219, "core_hours": 5.394152629042219} {"step": 13550, "global_schedule": 0.9970507621765137, "l2_grads": 0.9830536842346191, "l2_params": 299.6421813964844, "l2_updates": 1.0357558727264404, "train/loss": 5.5979485511779785, "uptime": 2681.941919668001, "examples_seen": 13875200.0, "progress": 0.12033427173343517, "epoch": 10.830125971087298, "img/sec/core": 724.7819252360888, "core_hours_NVIDIA A100-SXM4-40GB": 5.413775389664442, "core_hours": 5.413775389664442} {"step": 13600, "global_schedule": 0.9969671964645386, "l2_grads": 1.1534591913223267, "l2_params": 299.9533996582031, "l2_updates": 1.0509487390518188, "train/loss": 3.529526948928833, "uptime": 2690.747503146, "examples_seen": 13926400.0, "progress": 0.12077830963651057, "epoch": 10.870089535556255, "img/sec/core": 726.811575404477, "core_hours_NVIDIA A100-SXM4-40GB": 5.433343352948884, "core_hours": 5.433343352948884} {"step": 13650, "global_schedule": 0.996882438659668, "l2_grads": 1.3842213153839111, "l2_params": 300.3125, "l2_updates": 1.0685657262802124, "train/loss": 3.5660431385040283, "uptime": 2699.192343531, "examples_seen": 13977600.0, "progress": 0.12122234753958598, "epoch": 10.91005310002521, "img/sec/core": 757.8592025691553, "core_hours_NVIDIA A100-SXM4-40GB": 5.452109664915552, "core_hours": 5.452109664915552} {"step": 13700, "global_schedule": 0.9967964887619019, "l2_grads": 1.167110562324524, "l2_params": 300.63800048828125, "l2_updates": 1.0382777452468872, "train/loss": 3.4184722900390625, "uptime": 2708.060507806, "examples_seen": 14028800.0, "progress": 0.12166638544266138, "epoch": 10.950016664494168, "img/sec/core": 721.6826167781094, "core_hours_NVIDIA A100-SXM4-40GB": 5.471816696637774, "core_hours": 5.471816696637774} {"step": 13750, "global_schedule": 0.996709406375885, "l2_grads": 1.2995738983154297, "l2_params": 300.9784240722656, "l2_updates": 1.03249990940094, "train/loss": 3.550245761871338, "uptime": 2717.187755189001, "examples_seen": 14080000.0, "progress": 0.1221104233457368, "epoch": 10.989980228963125, "img/sec/core": 701.1971661817163, "core_hours_NVIDIA A100-SXM4-40GB": 5.492099468599998, "core_hours": 5.492099468599998} {"step": 13800, "global_schedule": 0.9966211318969727, "l2_grads": 1.2081583738327026, "l2_params": 301.3356018066406, "l2_updates": 1.0395419597625732, "train/loss": 4.605704307556152, "uptime": 2727.099687793001, "examples_seen": 14131200.0, "progress": 0.1225544612488122, "epoch": 11.029943793432082, "img/sec/core": 645.6863919168782, "core_hours_NVIDIA A100-SXM4-40GB": 5.514125985497776, "core_hours": 5.514125985497776} {"step": 13850, "global_schedule": 0.9965317249298096, "l2_grads": 1.268782615661621, "l2_params": 301.643798828125, "l2_updates": 1.0892984867095947, "train/loss": 3.5871331691741943, "uptime": 2736.2075861169997, "examples_seen": 14182400.0, "progress": 0.12299849915188761, "epoch": 11.06990735790104, "img/sec/core": 702.6868079034767, "core_hours_NVIDIA A100-SXM4-40GB": 5.534365759551107, "core_hours": 5.534365759551107} {"step": 13900, "global_schedule": 0.996441125869751, "l2_grads": 1.236779808998108, "l2_params": 302.015625, "l2_updates": 1.0294499397277832, "train/loss": 3.4375078678131104, "uptime": 2745.087126233, "examples_seen": 14233600.0, "progress": 0.12344253705496301, "epoch": 11.109870922369996, "img/sec/core": 720.7580478709153, "core_hours_NVIDIA A100-SXM4-40GB": 5.554098070919996, "core_hours": 5.554098070919996} {"step": 13950, "global_schedule": 0.9963493943214417, "l2_grads": 0.9890816807746887, "l2_params": 302.3282165527344, "l2_updates": 1.086755394935608, "train/loss": 5.072210311889648, "uptime": 2754.0606429010004, "examples_seen": 14284800.0, "progress": 0.12388657495803841, "epoch": 11.149834486838952, "img/sec/core": 713.2097968706684, "core_hours_NVIDIA A100-SXM4-40GB": 5.574039219071108, "core_hours": 5.574039219071108} {"step": 14000, "global_schedule": 0.9962564706802368, "l2_grads": 1.0356388092041016, "l2_params": 302.6903991699219, "l2_updates": 1.0159250497817993, "train/loss": 4.855594635009766, "uptime": 2763.192998460001, "examples_seen": 14336000.0, "progress": 0.12433061286111383, "epoch": 11.189798051307909, "img/sec/core": 700.8049520906251, "core_hours_NVIDIA A100-SXM4-40GB": 5.5943333425355535, "core_hours": 5.5943333425355535} {"step": 14050, "global_schedule": 0.9961624145507812, "l2_grads": 1.089172601699829, "l2_params": 303.0649108886719, "l2_updates": 1.0330191850662231, "train/loss": 4.637333393096924, "uptime": 2772.4888139940012, "examples_seen": 14387200.0, "progress": 0.12477465076418923, "epoch": 11.229761615776866, "img/sec/core": 741.6817142200136, "core_hours_NVIDIA A100-SXM4-40GB": 5.613508983446668, "core_hours": 5.613508983446668} {"step": 14100, "global_schedule": 0.9960671663284302, "l2_grads": 1.1301380395889282, "l2_params": 303.38153076171875, "l2_updates": 1.0647772550582886, "train/loss": 3.5460398197174072, "uptime": 2781.4083814349997, "examples_seen": 14438400.0, "progress": 0.12521868866726463, "epoch": 11.269725180245823, "img/sec/core": 717.5235842247972, "core_hours_NVIDIA A100-SXM4-40GB": 5.633330244426664, "core_hours": 5.633330244426664} {"step": 14150, "global_schedule": 0.9959707260131836, "l2_grads": 1.2962976694107056, "l2_params": 303.68316650390625, "l2_updates": 1.0270421504974365, "train/loss": 3.56337833404541, "uptime": 2789.926770776001, "examples_seen": 14489600.0, "progress": 0.12566272657034006, "epoch": 11.30968874471478, "img/sec/core": 751.3157410163356, "core_hours_NVIDIA A100-SXM4-40GB": 5.652259998517778, "core_hours": 5.652259998517778} {"step": 14200, "global_schedule": 0.995873212814331, "l2_grads": 1.3936890363693237, "l2_params": 303.9241027832031, "l2_updates": 0.9949626326560974, "train/loss": 3.648109197616577, "uptime": 2798.4402351900007, "examples_seen": 14540800.0, "progress": 0.12610676447341546, "epoch": 11.349652309183737, "img/sec/core": 751.7503672741763, "core_hours_NVIDIA A100-SXM4-40GB": 5.671178808326667, "core_hours": 5.671178808326667} {"step": 14250, "global_schedule": 0.995774507522583, "l2_grads": 1.1086581945419312, "l2_params": 304.23248291015625, "l2_updates": 1.0214685201644897, "train/loss": 4.172238826751709, "uptime": 2807.0078784240013, "examples_seen": 14592000.0, "progress": 0.12655080237649086, "epoch": 11.389615873652692, "img/sec/core": 746.9965573031438, "core_hours_NVIDIA A100-SXM4-40GB": 5.690218015513334, "core_hours": 5.690218015513334} {"step": 14300, "global_schedule": 0.9956746101379395, "l2_grads": 0.9151813387870789, "l2_params": 304.5966491699219, "l2_updates": 1.0602220296859741, "train/loss": 4.210476875305176, "uptime": 2815.885640982, "examples_seen": 14643200.0, "progress": 0.12699484027956626, "epoch": 11.42957943812165, "img/sec/core": 720.902362300026, "core_hours_NVIDIA A100-SXM4-40GB": 5.709946376753332, "core_hours": 5.709946376753332} {"step": 14350, "global_schedule": 0.9955735206604004, "l2_grads": 1.241065263748169, "l2_params": 304.82940673828125, "l2_updates": 1.0250896215438843, "train/loss": 3.525347948074341, "uptime": 2824.597462349, "examples_seen": 14694400.0, "progress": 0.12743887818264166, "epoch": 11.469543002590607, "img/sec/core": 734.633979553674, "core_hours_NVIDIA A100-SXM4-40GB": 5.72930597979111, "core_hours": 5.72930597979111} {"step": 14400, "global_schedule": 0.9954713582992554, "l2_grads": 1.1869887113571167, "l2_params": 305.1080017089844, "l2_updates": 1.1133259534835815, "train/loss": 3.5414323806762695, "uptime": 2833.6674308990005, "examples_seen": 14745600.0, "progress": 0.12788291608571709, "epoch": 11.509506567059564, "img/sec/core": 705.6253794837867, "core_hours_NVIDIA A100-SXM4-40GB": 5.7494614654577765, "core_hours": 5.7494614654577765} {"step": 14450, "global_schedule": 0.9953679442405701, "l2_grads": 1.1046531200408936, "l2_params": 305.38787841796875, "l2_updates": 1.0511001348495483, "train/loss": 4.217182636260986, "uptime": 2842.7777315540006, "examples_seen": 14796800.0, "progress": 0.12832695398879249, "epoch": 11.54947013152852, "img/sec/core": 702.501513656124, "core_hours_NVIDIA A100-SXM4-40GB": 5.769706578024444, "core_hours": 5.769706578024444} {"step": 14500, "global_schedule": 0.9952634572982788, "l2_grads": 0.9426921010017395, "l2_params": 305.59344482421875, "l2_updates": 0.9765704870223999, "train/loss": 5.758066654205322, "uptime": 2852.005713407001, "examples_seen": 14848000.0, "progress": 0.1287709918918679, "epoch": 11.589433695997478, "img/sec/core": 693.5427596142275, "core_hours_NVIDIA A100-SXM4-40GB": 5.790213204364445, "core_hours": 5.790213204364445} {"step": 14550, "global_schedule": 0.9951577186584473, "l2_grads": 1.1334084272384644, "l2_params": 305.91851806640625, "l2_updates": 1.037567377090454, "train/loss": 3.7749860286712646, "uptime": 2861.137961196, "examples_seen": 14899200.0, "progress": 0.1292150297949433, "epoch": 11.629397260466433, "img/sec/core": 700.8132223163818, "core_hours_NVIDIA A100-SXM4-40GB": 5.810507088339999, "core_hours": 5.810507088339999} {"step": 14600, "global_schedule": 0.9950509071350098, "l2_grads": 1.4458485841751099, "l2_params": 306.2440185546875, "l2_updates": 0.974534273147583, "train/loss": 3.492818832397461, "uptime": 2869.79824337, "examples_seen": 14950400.0, "progress": 0.12965906769801872, "epoch": 11.66936082493539, "img/sec/core": 739.0059436185925, "core_hours_NVIDIA A100-SXM4-40GB": 5.829752159837776, "core_hours": 5.829752159837776} {"step": 14650, "global_schedule": 0.994942843914032, "l2_grads": 1.3149621486663818, "l2_params": 306.4797668457031, "l2_updates": 1.0305346250534058, "train/loss": 3.525451183319092, "uptime": 2878.3643126260013, "examples_seen": 15001600.0, "progress": 0.13010310560109412, "epoch": 11.709324389404347, "img/sec/core": 747.1338146742374, "core_hours_NVIDIA A100-SXM4-40GB": 5.848787869295557, "core_hours": 5.848787869295557} {"step": 14700, "global_schedule": 0.9948337078094482, "l2_grads": 1.1518898010253906, "l2_params": 306.7629089355469, "l2_updates": 1.0907074213027954, "train/loss": 3.478862762451172, "uptime": 2886.7525743290007, "examples_seen": 15052800.0, "progress": 0.13054714350416952, "epoch": 11.749287953873305, "img/sec/core": 762.9709499539711, "core_hours_NVIDIA A100-SXM4-40GB": 5.867428450857777, "core_hours": 5.867428450857777} {"step": 14750, "global_schedule": 0.9947233200073242, "l2_grads": 1.2070763111114502, "l2_params": 307.09759521484375, "l2_updates": 0.9965167045593262, "train/loss": 3.5557608604431152, "uptime": 2895.537786056, "examples_seen": 15104000.0, "progress": 0.13099118140724492, "epoch": 11.789251518342262, "img/sec/core": 728.4969558936141, "core_hours_NVIDIA A100-SXM4-40GB": 5.886951143584443, "core_hours": 5.886951143584443} {"step": 14800, "global_schedule": 0.9946118593215942, "l2_grads": 0.8422117233276367, "l2_params": 307.365966796875, "l2_updates": 1.0038374662399292, "train/loss": 5.877200603485107, "uptime": 2904.8963836109997, "examples_seen": 15155200.0, "progress": 0.13143521931032032, "epoch": 11.829215082811219, "img/sec/core": 683.863149621283, "core_hours_NVIDIA A100-SXM4-40GB": 5.907748027039998, "core_hours": 5.907748027039998} {"step": 14850, "global_schedule": 0.9944992065429688, "l2_grads": 1.1724146604537964, "l2_params": 307.5762634277344, "l2_updates": 1.062805414199829, "train/loss": 3.4222633838653564, "uptime": 2913.580484895001, "examples_seen": 15206400.0, "progress": 0.13187925721339575, "epoch": 11.869178647280176, "img/sec/core": 736.9789677362069, "core_hours_NVIDIA A100-SXM4-40GB": 5.927046029893334, "core_hours": 5.927046029893334} {"step": 14900, "global_schedule": 0.9943853616714478, "l2_grads": 1.2082290649414062, "l2_params": 307.8558654785156, "l2_updates": 1.0450541973114014, "train/loss": 3.4571735858917236, "uptime": 2922.4720046620005, "examples_seen": 15257600.0, "progress": 0.13232329511647115, "epoch": 11.909142211749131, "img/sec/core": 719.7869619267333, "core_hours_NVIDIA A100-SXM4-40GB": 5.946804962708888, "core_hours": 5.946804962708888} {"step": 14950, "global_schedule": 0.9942704439163208, "l2_grads": 1.0985621213912964, "l2_params": 308.1943054199219, "l2_updates": 1.0521256923675537, "train/loss": 3.5318241119384766, "uptime": 2931.5745811430006, "examples_seen": 15308800.0, "progress": 0.13276733301954655, "epoch": 11.949105776218088, "img/sec/core": 703.0976354177035, "core_hours_NVIDIA A100-SXM4-40GB": 5.967032910444444, "core_hours": 5.967032910444444} {"step": 15000, "global_schedule": 0.9941542744636536, "l2_grads": 0.8980629444122314, "l2_params": 308.4652099609375, "l2_updates": 1.0456337928771973, "train/loss": 5.606868743896484, "uptime": 2940.125762765001, "examples_seen": 15360000.0, "progress": 0.13321137092262195, "epoch": 11.989069340687045, "img/sec/core": 748.4345769868875, "core_hours_NVIDIA A100-SXM4-40GB": 5.986035536271112, "core_hours": 5.986035536271112, "val/acc@1": 0.45348, "val/loss": 2.499212568359375, "z/secs/eval/val": 5.03177665000112} {"step": 15050, "global_schedule": 0.9940370321273804, "l2_grads": 1.2030996084213257, "l2_params": 308.7355651855469, "l2_updates": 1.02852201461792, "train/loss": 3.65271258354187, "uptime": 2955.8911231029997, "examples_seen": 15411200.0, "progress": 0.13365540882569737, "epoch": 12.029032905156003, "img/sec/core": 647.8506466207685, "core_hours_NVIDIA A100-SXM4-40GB": 6.00798846986222, "core_hours": 6.00798846986222} {"step": 15100, "global_schedule": 0.9939185380935669, "l2_grads": 1.2266570329666138, "l2_params": 309.00634765625, "l2_updates": 1.0679404735565186, "train/loss": 3.2967262268066406, "uptime": 2965.073427106001, "examples_seen": 15462400.0, "progress": 0.13409944672877278, "epoch": 12.06899646962496, "img/sec/core": 696.992824231058, "core_hours_NVIDIA A100-SXM4-40GB": 6.028393589868889, "core_hours": 6.028393589868889} {"step": 15150, "global_schedule": 0.9937989711761475, "l2_grads": 1.2320588827133179, "l2_params": 309.29443359375, "l2_updates": 1.0329475402832031, "train/loss": 3.5815749168395996, "uptime": 2974.215030020001, "examples_seen": 15513600.0, "progress": 0.13454348463184818, "epoch": 12.108960034093917, "img/sec/core": 700.0960400717727, "core_hours_NVIDIA A100-SXM4-40GB": 6.048708263011111, "core_hours": 6.048708263011111} {"step": 15200, "global_schedule": 0.9936782121658325, "l2_grads": 1.109619379043579, "l2_params": 309.630615234375, "l2_updates": 1.0510231256484985, "train/loss": 3.5307135581970215, "uptime": 2983.044338036001, "examples_seen": 15564800.0, "progress": 0.13498752253492358, "epoch": 12.148923598562872, "img/sec/core": 724.8586172780653, "core_hours_NVIDIA A100-SXM4-40GB": 6.0683289474911115, "core_hours": 6.0683289474911115} {"step": 15250, "global_schedule": 0.9935562610626221, "l2_grads": 1.3925338983535767, "l2_params": 309.8873291015625, "l2_updates": 1.0374614000320435, "train/loss": 3.415846586227417, "uptime": 2992.3158621889997, "examples_seen": 15616000.0, "progress": 0.13543156043799898, "epoch": 12.18888716303183, "img/sec/core": 690.2856417550402, "core_hours_NVIDIA A100-SXM4-40GB": 6.088932334497775, "core_hours": 6.088932334497775} {"step": 15300, "global_schedule": 0.9934331774711609, "l2_grads": 1.278764009475708, "l2_params": 310.1173095703125, "l2_updates": 1.0723552703857422, "train/loss": 3.294156074523926, "uptime": 3001.6187033530005, "examples_seen": 15667200.0, "progress": 0.1358755983410744, "epoch": 12.228850727500786, "img/sec/core": 687.9618696238884, "core_hours_NVIDIA A100-SXM4-40GB": 6.109605314862222, "core_hours": 6.109605314862222} {"step": 15350, "global_schedule": 0.993308961391449, "l2_grads": 1.101001501083374, "l2_params": 310.3455505371094, "l2_updates": 1.0595202445983887, "train/loss": 3.918752670288086, "uptime": 3010.8673930390014, "examples_seen": 15718400.0, "progress": 0.1363196362441498, "epoch": 12.268814291969743, "img/sec/core": 691.9899161161397, "core_hours_NVIDIA A100-SXM4-40GB": 6.130157958608891, "core_hours": 6.130157958608891} {"step": 15400, "global_schedule": 0.9931836128234863, "l2_grads": 1.2892062664031982, "l2_params": 310.5898742675781, "l2_updates": 0.9999563097953796, "train/loss": 3.425018548965454, "uptime": 3019.8658814870014, "examples_seen": 15769600.0, "progress": 0.1367636741472252, "epoch": 12.3087778564387, "img/sec/core": 711.2305624421253, "core_hours_NVIDIA A100-SXM4-40GB": 6.150154599604446, "core_hours": 6.150154599604446} {"step": 15450, "global_schedule": 0.9930570125579834, "l2_grads": 1.0053704977035522, "l2_params": 310.78936767578125, "l2_updates": 0.9522905945777893, "train/loss": 5.513970851898193, "uptime": 3028.3809223120006, "examples_seen": 15820800.0, "progress": 0.1372077120503006, "epoch": 12.348741420907658, "img/sec/core": 751.6111938313081, "core_hours_NVIDIA A100-SXM4-40GB": 6.1690769125488885, "core_hours": 6.1690769125488885} {"step": 15500, "global_schedule": 0.9929293394088745, "l2_grads": 1.2836124897003174, "l2_params": 311.048828125, "l2_updates": 0.9883063435554504, "train/loss": 3.406122922897339, "uptime": 3037.534227170001, "examples_seen": 15872000.0, "progress": 0.137651749953376, "epoch": 12.388704985376613, "img/sec/core": 699.2010098304663, "core_hours_NVIDIA A100-SXM4-40GB": 6.189417590011112, "core_hours": 6.189417590011112} {"step": 15550, "global_schedule": 0.9928004741668701, "l2_grads": 1.178122878074646, "l2_params": 311.2525634765625, "l2_updates": 1.0571215152740479, "train/loss": 3.463449478149414, "uptime": 3046.910223744, "examples_seen": 15923200.0, "progress": 0.13809578785645144, "epoch": 12.42866854984557, "img/sec/core": 682.5941060759376, "core_hours_NVIDIA A100-SXM4-40GB": 6.210253137953332, "core_hours": 6.210253137953332} {"step": 15600, "global_schedule": 0.9926704168319702, "l2_grads": 1.1582363843917847, "l2_params": 311.4874267578125, "l2_updates": 1.031134009361267, "train/loss": 3.600782871246338, "uptime": 3056.155246624001, "examples_seen": 15974400.0, "progress": 0.13853982575952684, "epoch": 12.468632114314527, "img/sec/core": 692.2643765268294, "core_hours_NVIDIA A100-SXM4-40GB": 6.230797633242222, "core_hours": 6.230797633242222} {"step": 15650, "global_schedule": 0.9925392866134644, "l2_grads": 0.906943678855896, "l2_params": 311.67852783203125, "l2_updates": 1.034419298171997, "train/loss": 5.024080753326416, "uptime": 3065.561014629, "examples_seen": 16025600.0, "progress": 0.13898386366260224, "epoch": 12.508595678783484, "img/sec/core": 680.4335378672356, "core_hours_NVIDIA A100-SXM4-40GB": 6.251699339919998, "core_hours": 6.251699339919998} {"step": 15700, "global_schedule": 0.992406964302063, "l2_grads": 0.9087194800376892, "l2_params": 311.8910217285156, "l2_updates": 1.0325331687927246, "train/loss": 4.58413028717041, "uptime": 3074.6667206439997, "examples_seen": 16076800.0, "progress": 0.13942790156567764, "epoch": 12.548559243252441, "img/sec/core": 702.8559882624579, "core_hours_NVIDIA A100-SXM4-40GB": 6.271934242175553, "core_hours": 6.271934242175553} {"step": 15750, "global_schedule": 0.9922735095024109, "l2_grads": 1.1898897886276245, "l2_params": 312.1784362792969, "l2_updates": 1.0356656312942505, "train/loss": 3.719433307647705, "uptime": 3084.029991577001, "examples_seen": 16128000.0, "progress": 0.13987193946875306, "epoch": 12.588522807721398, "img/sec/core": 683.5218211450947, "core_hours_NVIDIA A100-SXM4-40GB": 6.2927415109155564, "core_hours": 6.2927415109155564} {"step": 15800, "global_schedule": 0.9921388626098633, "l2_grads": 1.2042983770370483, "l2_params": 312.42218017578125, "l2_updates": 1.0685210227966309, "train/loss": 3.352202892303467, "uptime": 3093.4170079940013, "examples_seen": 16179200.0, "progress": 0.14031597737182847, "epoch": 12.628486372190354, "img/sec/core": 681.7927779916673, "core_hours_NVIDIA A100-SXM4-40GB": 6.313601547397779, "core_hours": 6.313601547397779} {"step": 15850, "global_schedule": 0.9920030832290649, "l2_grads": 1.344178318977356, "l2_params": 312.72576904296875, "l2_updates": 1.0311758518218994, "train/loss": 3.393712043762207, "uptime": 3102.7652698130005, "examples_seen": 16230400.0, "progress": 0.14076001527490387, "epoch": 12.66844993665931, "img/sec/core": 684.6192504998959, "core_hours_NVIDIA A100-SXM4-40GB": 6.33437546255111, "core_hours": 6.33437546255111} {"step": 15900, "global_schedule": 0.9918661713600159, "l2_grads": 1.2206408977508545, "l2_params": 312.934326171875, "l2_updates": 1.0507642030715942, "train/loss": 3.285288095474243, "uptime": 3111.723697046, "examples_seen": 16281600.0, "progress": 0.14120405317797927, "epoch": 12.708413501128268, "img/sec/core": 714.4111163201587, "core_hours_NVIDIA A100-SXM4-40GB": 6.354283078624443, "core_hours": 6.354283078624443} {"step": 15950, "global_schedule": 0.9917280673980713, "l2_grads": 1.2511186599731445, "l2_params": 313.13848876953125, "l2_updates": 1.0554227828979492, "train/loss": 3.400506019592285, "uptime": 3120.287441509001, "examples_seen": 16332800.0, "progress": 0.14164809108105467, "epoch": 12.748377065597225, "img/sec/core": 747.3366385055818, "core_hours_NVIDIA A100-SXM4-40GB": 6.373313621875556, "core_hours": 6.373313621875556} {"step": 16000, "global_schedule": 0.991588830947876, "l2_grads": 1.1735320091247559, "l2_params": 313.35992431640625, "l2_updates": 1.079667568206787, "train/loss": 3.383143901824951, "uptime": 3129.0777184670005, "examples_seen": 16384000.0, "progress": 0.1420921289841301, "epoch": 12.788340630066182, "img/sec/core": 728.0771732881155, "core_hours_NVIDIA A100-SXM4-40GB": 6.39284757067111, "core_hours": 6.39284757067111} {"step": 16050, "global_schedule": 0.9914484620094299, "l2_grads": 1.2108447551727295, "l2_params": 313.5644226074219, "l2_updates": 1.0185960531234741, "train/loss": 3.3360633850097656, "uptime": 3138.577745828001, "examples_seen": 16435200.0, "progress": 0.1425361668872055, "epoch": 12.82830419453514, "img/sec/core": 759.0837778669038, "core_hours_NVIDIA A100-SXM4-40GB": 6.411583608295558, "core_hours": 6.411583608295558} {"step": 16100, "global_schedule": 0.9913069009780884, "l2_grads": 1.1916855573654175, "l2_params": 313.7496032714844, "l2_updates": 1.0256850719451904, "train/loss": 3.413973331451416, "uptime": 3147.160904755001, "examples_seen": 16486400.0, "progress": 0.1429802047902809, "epoch": 12.868267759004096, "img/sec/core": 745.6462188842231, "core_hours_NVIDIA A100-SXM4-40GB": 6.430657294800003, "core_hours": 6.430657294800003} {"step": 16150, "global_schedule": 0.9911642074584961, "l2_grads": 1.2775324583053589, "l2_params": 313.935302734375, "l2_updates": 0.9507825970649719, "train/loss": 3.804333448410034, "uptime": 3155.7373393380003, "examples_seen": 16537600.0, "progress": 0.1434242426933563, "epoch": 12.908231323473052, "img/sec/core": 746.2308419732375, "core_hours_NVIDIA A100-SXM4-40GB": 6.449716038317779, "core_hours": 6.449716038317779} {"step": 16200, "global_schedule": 0.9910203218460083, "l2_grads": 0.8278502225875854, "l2_params": 314.04437255859375, "l2_updates": 0.9997682571411133, "train/loss": 5.501415252685547, "uptime": 3164.277238730001, "examples_seen": 16588800.0, "progress": 0.14386828059643172, "epoch": 12.948194887942009, "img/sec/core": 749.4233487100371, "core_hours_NVIDIA A100-SXM4-40GB": 6.468693592522226, "core_hours": 6.468693592522226} {"step": 16250, "global_schedule": 0.9908753633499146, "l2_grads": 1.2950917482376099, "l2_params": 314.25518798828125, "l2_updates": 1.0456669330596924, "train/loss": 3.343764305114746, "uptime": 3172.761184985, "examples_seen": 16640000.0, "progress": 0.14431231849950713, "epoch": 12.988158452410966, "img/sec/core": 754.3659292076443, "core_hours_NVIDIA A100-SXM4-40GB": 6.487546806422222, "core_hours": 6.487546806422222} {"step": 16300, "global_schedule": 0.9907292127609253, "l2_grads": 0.9289043545722961, "l2_params": 314.4764404296875, "l2_updates": 1.030553936958313, "train/loss": 5.605979919433594, "uptime": 3182.1489844940006, "examples_seen": 16691200.0, "progress": 0.14475635640258253, "epoch": 13.028122016879923, "img/sec/core": 681.7359056149375, "core_hours_NVIDIA A100-SXM4-40GB": 6.508408583108891, "core_hours": 6.508408583108891} {"step": 16350, "global_schedule": 0.9905819296836853, "l2_grads": 0.9287495613098145, "l2_params": 314.7276611328125, "l2_updates": 0.9925442934036255, "train/loss": 5.195245742797852, "uptime": 3190.720328733001, "examples_seen": 16742400.0, "progress": 0.14520039430565793, "epoch": 13.06808558134888, "img/sec/core": 746.6740130304485, "core_hours_NVIDIA A100-SXM4-40GB": 6.527456014751114, "core_hours": 6.527456014751114} {"step": 16400, "global_schedule": 0.9904334545135498, "l2_grads": 1.3960767984390259, "l2_params": 314.90472412109375, "l2_updates": 1.0004903078079224, "train/loss": 3.3193342685699463, "uptime": 3199.2819759330014, "examples_seen": 16793600.0, "progress": 0.14564443220873333, "epoch": 13.108049145817837, "img/sec/core": 747.519706254643, "core_hours_NVIDIA A100-SXM4-40GB": 6.546481897417782, "core_hours": 6.546481897417782} {"step": 16450, "global_schedule": 0.9902838468551636, "l2_grads": 0.9176949858665466, "l2_params": 315.14874267578125, "l2_updates": 1.0216916799545288, "train/loss": 4.588683128356934, "uptime": 3208.052277025001, "examples_seen": 16844800.0, "progress": 0.14608847011180875, "epoch": 13.148012710286793, "img/sec/core": 729.7354940115168, "core_hours_NVIDIA A100-SXM4-40GB": 6.565971455400003, "core_hours": 6.565971455400003} {"step": 16500, "global_schedule": 0.9901331663131714, "l2_grads": 1.2758142948150635, "l2_params": 315.358642578125, "l2_updates": 0.9713940620422363, "train/loss": 3.3978593349456787, "uptime": 3217.4837196980006, "examples_seen": 16896000.0, "progress": 0.14653250801488416, "epoch": 13.18797627475575, "img/sec/core": 678.5812332106786, "core_hours_NVIDIA A100-SXM4-40GB": 6.586930216895557, "core_hours": 6.586930216895557} {"step": 16550, "global_schedule": 0.9899812340736389, "l2_grads": 0.9413235187530518, "l2_params": 315.57476806640625, "l2_updates": 1.0582199096679688, "train/loss": 5.129194259643555, "uptime": 3226.3952407960005, "examples_seen": 16947200.0, "progress": 0.14697654591795956, "epoch": 13.227939839224707, "img/sec/core": 718.1714467843698, "core_hours_NVIDIA A100-SXM4-40GB": 6.606733597113335, "core_hours": 6.606733597113335} {"step": 16600, "global_schedule": 0.9898282289505005, "l2_grads": 0.893416702747345, "l2_params": 315.7598571777344, "l2_updates": 1.0228885412216187, "train/loss": 4.496535301208496, "uptime": 3235.099527128001, "examples_seen": 16998400.0, "progress": 0.14742058382103496, "epoch": 13.267903403693664, "img/sec/core": 735.2699297668055, "core_hours_NVIDIA A100-SXM4-40GB": 6.626076455628891, "core_hours": 6.626076455628891} {"step": 16650, "global_schedule": 0.9896739721298218, "l2_grads": 1.3008817434310913, "l2_params": 315.9909973144531, "l2_updates": 1.0823392868041992, "train/loss": 3.2872421741485596, "uptime": 3243.7098585000003, "examples_seen": 17049600.0, "progress": 0.14786462172411036, "epoch": 13.307866968162621, "img/sec/core": 743.293111901887, "core_hours_NVIDIA A100-SXM4-40GB": 6.645210525344447, "core_hours": 6.645210525344447} {"step": 16700, "global_schedule": 0.9895186424255371, "l2_grads": 0.9822441339492798, "l2_params": 316.1866149902344, "l2_updates": 0.9943505525588989, "train/loss": 5.062549591064453, "uptime": 3252.328442524, "examples_seen": 17100800.0, "progress": 0.14830865962718578, "epoch": 13.347830532631578, "img/sec/core": 742.581377889728, "core_hours_NVIDIA A100-SXM4-40GB": 6.664362934286667, "core_hours": 6.664362934286667} {"step": 16750, "global_schedule": 0.9893621802330017, "l2_grads": 1.2772952318191528, "l2_params": 316.3721008300781, "l2_updates": 1.0083222389221191, "train/loss": 3.5182862281799316, "uptime": 3261.1486609270014, "examples_seen": 17152000.0, "progress": 0.14875269753026119, "epoch": 13.387794097100533, "img/sec/core": 725.6056151423758, "core_hours_NVIDIA A100-SXM4-40GB": 6.683963419626671, "core_hours": 6.683963419626671} {"step": 16800, "global_schedule": 0.9892045259475708, "l2_grads": 1.2161297798156738, "l2_params": 316.5960388183594, "l2_updates": 1.0264078378677368, "train/loss": 3.3353607654571533, "uptime": 3270.1719001340007, "examples_seen": 17203200.0, "progress": 0.14919673543333659, "epoch": 13.42775766156949, "img/sec/core": 709.2796559173067, "core_hours_NVIDIA A100-SXM4-40GB": 6.704015062308891, "core_hours": 6.704015062308891} {"step": 16850, "global_schedule": 0.9890457391738892, "l2_grads": 1.3207950592041016, "l2_params": 316.7222595214844, "l2_updates": 0.9874593019485474, "train/loss": 3.2793946266174316, "uptime": 3278.6515411990003, "examples_seen": 17254400.0, "progress": 0.149640773336412, "epoch": 13.467721226038448, "img/sec/core": 754.7489275715292, "core_hours_NVIDIA A100-SXM4-40GB": 6.722858709120001, "core_hours": 6.722858709120001} {"step": 16900, "global_schedule": 0.9888858795166016, "l2_grads": 1.1673091650009155, "l2_params": 316.9383239746094, "l2_updates": 1.0354859828948975, "train/loss": 3.391495943069458, "uptime": 3287.269179182, "examples_seen": 17305600.0, "progress": 0.15008481123948741, "epoch": 13.507684790507405, "img/sec/core": 742.6628981892353, "core_hours_NVIDIA A100-SXM4-40GB": 6.74200901574889, "core_hours": 6.74200901574889} {"step": 16950, "global_schedule": 0.9887247681617737, "l2_grads": 1.323751449584961, "l2_params": 317.1114196777344, "l2_updates": 1.0601918697357178, "train/loss": 3.2693443298339844, "uptime": 3295.7201784110002, "examples_seen": 17356800.0, "progress": 0.15052884914256282, "epoch": 13.547648354976362, "img/sec/core": 757.3068966848042, "core_hours_NVIDIA A100-SXM4-40GB": 6.760789014035557, "core_hours": 6.760789014035557} {"step": 17000, "global_schedule": 0.9885625839233398, "l2_grads": 1.1446449756622314, "l2_params": 317.2537536621094, "l2_updates": 1.0233525037765503, "train/loss": 3.3009839057922363, "uptime": 3304.8832567610007, "examples_seen": 17408000.0, "progress": 0.15097288704563822, "epoch": 13.587611919445319, "img/sec/core": 698.4552303865979, "core_hours_NVIDIA A100-SXM4-40GB": 6.781151410368891, "core_hours": 6.781151410368891} {"step": 17050, "global_schedule": 0.9883992075920105, "l2_grads": 0.9884942173957825, "l2_params": 317.4132385253906, "l2_updates": 0.9931695461273193, "train/loss": 5.493070602416992, "uptime": 3314.3689997640013, "examples_seen": 17459200.0, "progress": 0.15141692494871362, "epoch": 13.627575483914274, "img/sec/core": 726.5926604870492, "core_hours_NVIDIA A100-SXM4-40GB": 6.800725269280003, "core_hours": 6.800725269280003} {"step": 17100, "global_schedule": 0.9882346987724304, "l2_grads": 1.025561809539795, "l2_params": 317.5842590332031, "l2_updates": 1.0318549871444702, "train/loss": 4.055927276611328, "uptime": 3323.4694606619996, "examples_seen": 17510400.0, "progress": 0.15186096285178902, "epoch": 13.667539048383231, "img/sec/core": 703.2610844366889, "core_hours_NVIDIA A100-SXM4-40GB": 6.820948515719999, "core_hours": 6.820948515719999} {"step": 17150, "global_schedule": 0.9880690574645996, "l2_grads": 1.0245094299316406, "l2_params": 317.7586364746094, "l2_updates": 1.026801586151123, "train/loss": 4.240410327911377, "uptime": 3332.105960252, "examples_seen": 17561600.0, "progress": 0.15230500075486444, "epoch": 13.707502612852188, "img/sec/core": 741.040966112032, "core_hours_NVIDIA A100-SXM4-40GB": 6.84014073703111, "core_hours": 6.84014073703111} {"step": 17200, "global_schedule": 0.9879022836685181, "l2_grads": 1.222824215888977, "l2_params": 317.9499816894531, "l2_updates": 0.9793375134468079, "train/loss": 3.876617431640625, "uptime": 3341.2967474590005, "examples_seen": 17612800.0, "progress": 0.15274903865793985, "epoch": 13.747466177321146, "img/sec/core": 696.3494917089558, "core_hours_NVIDIA A100-SXM4-40GB": 6.860564708602223, "core_hours": 6.860564708602223} {"step": 17250, "global_schedule": 0.987734317779541, "l2_grads": 1.1194343566894531, "l2_params": 318.15753173828125, "l2_updates": 1.0868691205978394, "train/loss": 3.4326820373535156, "uptime": 3349.914133837001, "examples_seen": 17664000.0, "progress": 0.15319307656101525, "epoch": 13.787429741790103, "img/sec/core": 742.6845819909769, "core_hours_NVIDIA A100-SXM4-40GB": 6.87971445610889, "core_hours": 6.87971445610889} {"step": 17300, "global_schedule": 0.9875652194023132, "l2_grads": 1.0795888900756836, "l2_params": 318.34521484375, "l2_updates": 1.0200687646865845, "train/loss": 4.014702796936035, "uptime": 3358.633101818001, "examples_seen": 17715200.0, "progress": 0.15363711446409065, "epoch": 13.82739330625906, "img/sec/core": 734.0318273844673, "core_hours_NVIDIA A100-SXM4-40GB": 6.899089940511113, "core_hours": 6.899089940511113} {"step": 17350, "global_schedule": 0.9873949885368347, "l2_grads": 0.9052232503890991, "l2_params": 318.47607421875, "l2_updates": 1.0273405313491821, "train/loss": 5.093371391296387, "uptime": 3367.7384048840013, "examples_seen": 17766400.0, "progress": 0.15408115236716607, "epoch": 13.867356870728017, "img/sec/core": 702.8870926765544, "core_hours_NVIDIA A100-SXM4-40GB": 6.919323947324447, "core_hours": 6.919323947324447} {"step": 17400, "global_schedule": 0.9872236251831055, "l2_grads": 1.0037213563919067, "l2_params": 318.6531677246094, "l2_updates": 1.0066819190979004, "train/loss": 5.07702112197876, "uptime": 3376.3156913090006, "examples_seen": 17817600.0, "progress": 0.15452519027024147, "epoch": 13.907320435196972, "img/sec/core": 746.1567310316912, "core_hours_NVIDIA A100-SXM4-40GB": 6.938384583824445, "core_hours": 6.938384583824445} {"step": 17450, "global_schedule": 0.9870511293411255, "l2_grads": 1.0157235860824585, "l2_params": 318.76947021484375, "l2_updates": 1.0225744247436523, "train/loss": 4.467310905456543, "uptime": 3385.698853183001, "examples_seen": 17868800.0, "progress": 0.15496922817331688, "epoch": 13.94728399966593, "img/sec/core": 682.0728541125937, "core_hours_NVIDIA A100-SXM4-40GB": 6.959236054655558, "core_hours": 6.959236054655558} {"step": 17500, "global_schedule": 0.98687744140625, "l2_grads": 1.0990588665008545, "l2_params": 318.8815612792969, "l2_updates": 1.019816517829895, "train/loss": 3.3859810829162598, "uptime": 3394.4327474380007, "examples_seen": 17920000.0, "progress": 0.15541326607639228, "epoch": 13.987247564134886, "img/sec/core": 732.7773628970203, "core_hours_NVIDIA A100-SXM4-40GB": 6.978644708555556, "core_hours": 6.978644708555556, "val/acc@1": 0.49772, "val/loss": 2.2603321826171876, "z/secs/eval/val": 3.9922575169985066} {"step": 17550, "global_schedule": 0.9867026805877686, "l2_grads": 1.34226393699646, "l2_params": 319.0706481933594, "l2_updates": 1.0562702417373657, "train/loss": 3.1025335788726807, "uptime": 3408.3922348819997, "examples_seen": 17971200.0, "progress": 0.15585730397946768, "epoch": 14.027211128603843, "img/sec/core": 642.1639199249287, "core_hours_NVIDIA A100-SXM4-40GB": 7.000792047857778, "core_hours": 7.000792047857778} {"step": 17600, "global_schedule": 0.9865267276763916, "l2_grads": 1.2796863317489624, "l2_params": 319.285888671875, "l2_updates": 1.06374192237854, "train/loss": 3.255329132080078, "uptime": 3417.539495676001, "examples_seen": 18022400.0, "progress": 0.1563013418825431, "epoch": 14.0671746930728, "img/sec/core": 699.6630077713583, "core_hours_NVIDIA A100-SXM4-40GB": 7.021119294066669, "core_hours": 7.021119294066669} {"step": 17650, "global_schedule": 0.9863497018814087, "l2_grads": 0.987587034702301, "l2_params": 319.50201416015625, "l2_updates": 1.0434659719467163, "train/loss": 4.650845527648926, "uptime": 3426.1825187470004, "examples_seen": 18073600.0, "progress": 0.1567453797856185, "epoch": 14.107138257541758, "img/sec/core": 740.4816517815926, "core_hours_NVIDIA A100-SXM4-40GB": 7.040326012002224, "core_hours": 7.040326012002224} {"step": 17700, "global_schedule": 0.9861714839935303, "l2_grads": 1.073815107345581, "l2_params": 319.6327819824219, "l2_updates": 1.0701185464859009, "train/loss": 4.538064956665039, "uptime": 3434.7408669920005, "examples_seen": 18124800.0, "progress": 0.1571894176886939, "epoch": 14.147101822010713, "img/sec/core": 747.8078499246533, "core_hours_NVIDIA A100-SXM4-40GB": 7.059344563657779, "core_hours": 7.059344563657779} {"step": 17750, "global_schedule": 0.9859920740127563, "l2_grads": 1.435820460319519, "l2_params": 319.7562255859375, "l2_updates": 1.0271813869476318, "train/loss": 3.346264362335205, "uptime": 3444.148274983001, "examples_seen": 18176000.0, "progress": 0.1576334555917693, "epoch": 14.18706538647967, "img/sec/core": 680.3149184262486, "core_hours_NVIDIA A100-SXM4-40GB": 7.080249914748892, "core_hours": 7.080249914748892} {"step": 17800, "global_schedule": 0.9858115911483765, "l2_grads": 1.3593765497207642, "l2_params": 319.9430236816406, "l2_updates": 1.0378988981246948, "train/loss": 3.258021831512451, "uptime": 3453.151372759001, "examples_seen": 18227200.0, "progress": 0.1580774934948447, "epoch": 14.227028950948627, "img/sec/core": 710.8664327806094, "core_hours_NVIDIA A100-SXM4-40GB": 7.1002567986955585, "core_hours": 7.1002567986955585} {"step": 17850, "global_schedule": 0.9856300354003906, "l2_grads": 0.9752908945083618, "l2_params": 320.13421630859375, "l2_updates": 0.993016242980957, "train/loss": 5.360183238983154, "uptime": 3461.6650830750004, "examples_seen": 18278400.0, "progress": 0.15852153139792013, "epoch": 14.266992515417584, "img/sec/core": 751.728654423756, "core_hours_NVIDIA A100-SXM4-40GB": 7.119176154953336, "core_hours": 7.119176154953336} {"step": 17900, "global_schedule": 0.9854472279548645, "l2_grads": 0.8434610962867737, "l2_params": 320.23248291015625, "l2_updates": 1.0087870359420776, "train/loss": 5.624547958374023, "uptime": 3470.9624185480006, "examples_seen": 18329600.0, "progress": 0.15896556930099554, "epoch": 14.306956079886541, "img/sec/core": 688.3692665049928, "core_hours_NVIDIA A100-SXM4-40GB": 7.139836900448892, "core_hours": 7.139836900448892} {"step": 17950, "global_schedule": 0.9852633476257324, "l2_grads": 1.0214965343475342, "l2_params": 320.3723449707031, "l2_updates": 1.071871042251587, "train/loss": 4.709832191467285, "uptime": 3479.4764321029998, "examples_seen": 18380800.0, "progress": 0.15940960720407094, "epoch": 14.346919644355498, "img/sec/core": 751.7018805122949, "core_hours_NVIDIA A100-SXM4-40GB": 7.158756930571112, "core_hours": 7.158756930571112} {"step": 18000, "global_schedule": 0.9850782752037048, "l2_grads": 1.2346612215042114, "l2_params": 320.5058288574219, "l2_updates": 1.030654788017273, "train/loss": 3.236906051635742, "uptime": 3488.1657586889996, "examples_seen": 18432000.0, "progress": 0.15985364510714634, "epoch": 14.386883208824454, "img/sec/core": 736.5357875156391, "core_hours_NVIDIA A100-SXM4-40GB": 7.178066545206667, "core_hours": 7.178066545206667} {"step": 18050, "global_schedule": 0.9848921298980713, "l2_grads": 1.170515537261963, "l2_params": 320.6482238769531, "l2_updates": 1.0793925523757935, "train/loss": 3.272934913635254, "uptime": 3497.847839106, "examples_seen": 18483200.0, "progress": 0.16029768301022176, "epoch": 14.426846773293411, "img/sec/core": 721.4986245314345, "core_hours_NVIDIA A100-SXM4-40GB": 7.197778602497779, "core_hours": 7.197778602497779} {"step": 18100, "global_schedule": 0.9847047924995422, "l2_grads": 1.267221212387085, "l2_params": 320.8786926269531, "l2_updates": 0.9885373711585999, "train/loss": 3.2897777557373047, "uptime": 3507.3534662439997, "examples_seen": 18534400.0, "progress": 0.16074172091329716, "epoch": 14.466810337762368, "img/sec/core": 673.2854031708456, "core_hours_NVIDIA A100-SXM4-40GB": 7.218902218360001, "core_hours": 7.218902218360001} {"step": 18150, "global_schedule": 0.9845163226127625, "l2_grads": 1.2215133905410767, "l2_params": 320.9981994628906, "l2_updates": 1.0452609062194824, "train/loss": 2.9970734119415283, "uptime": 3516.485168813, "examples_seen": 18585600.0, "progress": 0.16118575881637257, "epoch": 14.506773902231325, "img/sec/core": 700.8550652674749, "core_hours_NVIDIA A100-SXM4-40GB": 7.239194890735558, "core_hours": 7.239194890735558} {"step": 18200, "global_schedule": 0.9843267202377319, "l2_grads": 1.3805859088897705, "l2_params": 321.13763427734375, "l2_updates": 1.0011941194534302, "train/loss": 3.179689407348633, "uptime": 3525.1949941780003, "examples_seen": 18636800.0, "progress": 0.16162979671944797, "epoch": 14.546737466700282, "img/sec/core": 734.8023332038294, "core_hours_NVIDIA A100-SXM4-40GB": 7.258550058213335, "core_hours": 7.258550058213335} {"step": 18250, "global_schedule": 0.9841359853744507, "l2_grads": 1.0454667806625366, "l2_params": 321.2415771484375, "l2_updates": 1.0526411533355713, "train/loss": 4.1934814453125, "uptime": 3533.9489403589996, "examples_seen": 18688000.0, "progress": 0.16207383462252337, "epoch": 14.58670103116924, "img/sec/core": 731.0988516117926, "core_hours_NVIDIA A100-SXM4-40GB": 7.27800327194889, "core_hours": 7.27800327194889} {"step": 18300, "global_schedule": 0.9839441776275635, "l2_grads": 1.1814861297607422, "l2_params": 321.3841857910156, "l2_updates": 1.0338295698165894, "train/loss": 3.1566245555877686, "uptime": 3543.359343666001, "examples_seen": 18739200.0, "progress": 0.1625178725255988, "epoch": 14.626664595638195, "img/sec/core": 680.0983752989856, "core_hours_NVIDIA A100-SXM4-40GB": 7.298915279297782, "core_hours": 7.298915279297782} {"step": 18350, "global_schedule": 0.9837511777877808, "l2_grads": 1.2983441352844238, "l2_params": 321.4530334472656, "l2_updates": 1.0293928384780884, "train/loss": 3.385558605194092, "uptime": 3552.456978503, "examples_seen": 18790400.0, "progress": 0.1629619104286742, "epoch": 14.666628160107152, "img/sec/core": 703.4795432734039, "core_hours_NVIDIA A100-SXM4-40GB": 7.319132245602224, "core_hours": 7.319132245602224} {"step": 18400, "global_schedule": 0.9835570454597473, "l2_grads": 1.2170988321304321, "l2_params": 321.5505676269531, "l2_updates": 1.0822337865829468, "train/loss": 3.09713077545166, "uptime": 3562.116620779001, "examples_seen": 18841600.0, "progress": 0.1634059483317496, "epoch": 14.706591724576109, "img/sec/core": 662.5504151329063, "core_hours_NVIDIA A100-SXM4-40GB": 7.34059811732667, "core_hours": 7.34059811732667} {"step": 18450, "global_schedule": 0.9833617806434631, "l2_grads": 1.034273624420166, "l2_params": 321.7391052246094, "l2_updates": 1.0100877285003662, "train/loss": 4.569279670715332, "uptime": 3571.7615519210012, "examples_seen": 18892800.0, "progress": 0.163849986234825, "epoch": 14.746555289045066, "img/sec/core": 663.5609840831679, "core_hours_NVIDIA A100-SXM4-40GB": 7.362031297642227, "core_hours": 7.362031297642227} {"step": 18500, "global_schedule": 0.9831653833389282, "l2_grads": 1.3523645401000977, "l2_params": 321.8953552246094, "l2_updates": 1.041687250137329, "train/loss": 3.2336602210998535, "uptime": 3581.149559061001, "examples_seen": 18944000.0, "progress": 0.16429402413790042, "epoch": 14.786518853514023, "img/sec/core": 681.7208279200423, "core_hours_NVIDIA A100-SXM4-40GB": 7.382893535731116, "core_hours": 7.382893535731116} {"step": 18550, "global_schedule": 0.9829678535461426, "l2_grads": 1.215384840965271, "l2_params": 322.0178527832031, "l2_updates": 1.0312503576278687, "train/loss": 3.2561731338500977, "uptime": 3589.8687944030007, "examples_seen": 18995200.0, "progress": 0.16473806204097582, "epoch": 14.82648241798298, "img/sec/core": 734.0093195067127, "core_hours_NVIDIA A100-SXM4-40GB": 7.402269614268892, "core_hours": 7.402269614268892} {"step": 18600, "global_schedule": 0.982769250869751, "l2_grads": 1.2408881187438965, "l2_params": 322.21343994140625, "l2_updates": 1.0130525827407837, "train/loss": 3.382195472717285, "uptime": 3598.3988181840014, "examples_seen": 19046400.0, "progress": 0.16518209994405122, "epoch": 14.866445982451937, "img/sec/core": 750.2909914805925, "core_hours_NVIDIA A100-SXM4-40GB": 7.421225222671116, "core_hours": 7.421225222671116} {"step": 18650, "global_schedule": 0.9825694561004639, "l2_grads": 0.8529976010322571, "l2_params": 322.32061767578125, "l2_updates": 0.9965255260467529, "train/loss": 4.4449663162231445, "uptime": 3607.274754094, "examples_seen": 19097600.0, "progress": 0.16562613784712663, "epoch": 14.906409546920893, "img/sec/core": 721.050722413454, "core_hours_NVIDIA A100-SXM4-40GB": 7.440949524693335, "core_hours": 7.440949524693335} {"step": 18700, "global_schedule": 0.9823684692382812, "l2_grads": 0.9898074269294739, "l2_params": 322.4766540527344, "l2_updates": 1.036763072013855, "train/loss": 5.464521408081055, "uptime": 3616.9359084690004, "examples_seen": 19148800.0, "progress": 0.16607017575020203, "epoch": 14.94637311138985, "img/sec/core": 662.4467171915658, "core_hours_NVIDIA A100-SXM4-40GB": 7.46241875663778, "core_hours": 7.46241875663778} {"step": 18750, "global_schedule": 0.9821664094924927, "l2_grads": 1.180605173110962, "l2_params": 322.6235656738281, "l2_updates": 1.013117790222168, "train/loss": 3.68304443359375, "uptime": 3626.033369074001, "examples_seen": 19200000.0, "progress": 0.16651421365327745, "epoch": 14.986336675858807, "img/sec/core": 703.4930161150979, "core_hours_NVIDIA A100-SXM4-40GB": 7.482635335760004, "core_hours": 7.482635335760004} {"step": 18800, "global_schedule": 0.9819632768630981, "l2_grads": 1.1895169019699097, "l2_params": 322.75726318359375, "l2_updates": 1.0169754028320312, "train/loss": 5.150554656982422, "uptime": 3635.7345996149998, "examples_seen": 19251200.0, "progress": 0.16695825155635285, "epoch": 15.026300240327764, "img/sec/core": 659.7101236747831, "core_hours_NVIDIA A100-SXM4-40GB": 7.504193625851112, "core_hours": 7.504193625851112} {"step": 18850, "global_schedule": 0.9817589521408081, "l2_grads": 1.0741320848464966, "l2_params": 322.9465637207031, "l2_updates": 1.0320080518722534, "train/loss": 3.871427536010742, "uptime": 3644.995790811001, "examples_seen": 19302400.0, "progress": 0.16740228945942826, "epoch": 15.066263804796721, "img/sec/core": 691.0558117797437, "core_hours_NVIDIA A100-SXM4-40GB": 7.524774050731114, "core_hours": 7.524774050731114} {"step": 18900, "global_schedule": 0.9815535545349121, "l2_grads": 0.9555670022964478, "l2_params": 323.0448303222656, "l2_updates": 1.023938536643982, "train/loss": 4.105163097381592, "uptime": 3654.1228503660004, "examples_seen": 19353600.0, "progress": 0.16784632736250366, "epoch": 15.106227369265678, "img/sec/core": 701.2115962905368, "core_hours_NVIDIA A100-SXM4-40GB": 7.545056405297781, "core_hours": 7.545056405297781} {"step": 18950, "global_schedule": 0.9813469648361206, "l2_grads": 1.2707836627960205, "l2_params": 323.1696472167969, "l2_updates": 1.0147348642349243, "train/loss": 3.167090892791748, "uptime": 3663.408609921, "examples_seen": 19404800.0, "progress": 0.16829036526557906, "epoch": 15.146190933734633, "img/sec/core": 689.2274091411549, "core_hours_NVIDIA A100-SXM4-40GB": 7.565691426531113, "core_hours": 7.565691426531113} {"step": 19000, "global_schedule": 0.9811393022537231, "l2_grads": 1.3330129384994507, "l2_params": 323.3106384277344, "l2_updates": 0.9740881323814392, "train/loss": 3.309436082839966, "uptime": 3672.1140490550006, "examples_seen": 19456000.0, "progress": 0.16873440316865448, "epoch": 15.18615449820359, "img/sec/core": 735.1725629788874, "core_hours_NVIDIA A100-SXM4-40GB": 7.585036846828891, "core_hours": 7.585036846828891} {"step": 19050, "global_schedule": 0.9809304475784302, "l2_grads": 1.2348383665084839, "l2_params": 323.4140625, "l2_updates": 1.039442539215088, "train/loss": 3.1691811084747314, "uptime": 3681.595197394001, "examples_seen": 19507200.0, "progress": 0.16917844107172988, "epoch": 15.226118062672548, "img/sec/core": 757.5285850117415, "core_hours_NVIDIA A100-SXM4-40GB": 7.603811349208894, "core_hours": 7.603811349208894} {"step": 19100, "global_schedule": 0.9807205200195312, "l2_grads": 1.4097105264663696, "l2_params": 323.5343933105469, "l2_updates": 0.9675641059875488, "train/loss": 3.2443723678588867, "uptime": 3690.3064402689997, "examples_seen": 19558400.0, "progress": 0.16962247897480529, "epoch": 15.266081627141505, "img/sec/core": 734.6827647714839, "core_hours_NVIDIA A100-SXM4-40GB": 7.623169666708891, "core_hours": 7.623169666708891} {"step": 19150, "global_schedule": 0.9805094003677368, "l2_grads": 1.3111991882324219, "l2_params": 323.67156982421875, "l2_updates": 1.0388263463974, "train/loss": 3.3000059127807617, "uptime": 3699.4210129010007, "examples_seen": 19609600.0, "progress": 0.17006651687788069, "epoch": 15.306045191610462, "img/sec/core": 702.1722529841702, "core_hours_NVIDIA A100-SXM4-40GB": 7.643424272557782, "core_hours": 7.643424272557782} {"step": 19200, "global_schedule": 0.9802972078323364, "l2_grads": 1.081821084022522, "l2_params": 323.80108642578125, "l2_updates": 1.069698691368103, "train/loss": 3.7125887870788574, "uptime": 3708.805775269, "examples_seen": 19660800.0, "progress": 0.17051055478095611, "epoch": 15.346008756079419, "img/sec/core": 681.9565321997922, "core_hours_NVIDIA A100-SXM4-40GB": 7.664279300042225, "core_hours": 7.664279300042225} {"step": 19250, "global_schedule": 0.9800838828086853, "l2_grads": 1.0548194646835327, "l2_params": 323.9255065917969, "l2_updates": 0.9908636212348938, "train/loss": 3.857985258102417, "uptime": 3718.1725393350007, "examples_seen": 19712000.0, "progress": 0.17095459268403151, "epoch": 15.385972320548374, "img/sec/core": 683.2669163975961, "core_hours_NVIDIA A100-SXM4-40GB": 7.685094331300005, "core_hours": 7.685094331300005} {"step": 19300, "global_schedule": 0.9798694252967834, "l2_grads": 1.1545610427856445, "l2_params": 323.96258544921875, "l2_updates": 1.0196386575698853, "train/loss": 3.3818411827087402, "uptime": 3727.6797614509996, "examples_seen": 19763200.0, "progress": 0.17139863058710691, "epoch": 15.425935885017331, "img/sec/core": 673.1724495244455, "core_hours_NVIDIA A100-SXM4-40GB": 7.70622149155778, "core_hours": 7.70622149155778} {"step": 19350, "global_schedule": 0.9796538352966309, "l2_grads": 1.2699284553527832, "l2_params": 324.02459716796875, "l2_updates": 0.9712222814559937, "train/loss": 3.2958199977874756, "uptime": 3736.899558274001, "examples_seen": 19814400.0, "progress": 0.17184266849018232, "epoch": 15.465899449486288, "img/sec/core": 694.1584638864871, "core_hours_NVIDIA A100-SXM4-40GB": 7.726709928942227, "core_hours": 7.726709928942227} {"step": 19400, "global_schedule": 0.9794371128082275, "l2_grads": 1.1798832416534424, "l2_params": 324.1103820800781, "l2_updates": 1.0572044849395752, "train/loss": 3.272052526473999, "uptime": 3746.5488852360013, "examples_seen": 19865600.0, "progress": 0.17228670639325772, "epoch": 15.505863013955246, "img/sec/core": 663.2586941248346, "core_hours_NVIDIA A100-SXM4-40GB": 7.748152877746673, "core_hours": 7.748152877746673} {"step": 19450, "global_schedule": 0.9792193174362183, "l2_grads": 1.0022472143173218, "l2_params": 324.2184753417969, "l2_updates": 1.00697922706604, "train/loss": 5.202481746673584, "uptime": 3755.270277237001, "examples_seen": 19916800.0, "progress": 0.17273074429633314, "epoch": 15.545826578424203, "img/sec/core": 733.8278108891603, "core_hours_NVIDIA A100-SXM4-40GB": 7.767533748860005, "core_hours": 7.767533748860005} {"step": 19500, "global_schedule": 0.9790003299713135, "l2_grads": 1.351524829864502, "l2_params": 324.2785339355469, "l2_updates": 1.000321388244629, "train/loss": 3.131558895111084, "uptime": 3764.593380716, "examples_seen": 19968000.0, "progress": 0.17317478219940854, "epoch": 15.58579014289316, "img/sec/core": 686.4666915278439, "core_hours_NVIDIA A100-SXM4-40GB": 7.788251756591113, "core_hours": 7.788251756591113} {"step": 19550, "global_schedule": 0.9787802696228027, "l2_grads": 1.217874526977539, "l2_params": 324.4462585449219, "l2_updates": 1.0678825378417969, "train/loss": 3.0925655364990234, "uptime": 3773.791729445, "examples_seen": 20019200.0, "progress": 0.17361882010248395, "epoch": 15.625753707362115, "img/sec/core": 695.7770561386222, "core_hours_NVIDIA A100-SXM4-40GB": 7.808692531544447, "core_hours": 7.808692531544447} {"step": 19600, "global_schedule": 0.978559136390686, "l2_grads": 1.2267199754714966, "l2_params": 324.60198974609375, "l2_updates": 0.9983232617378235, "train/loss": 3.080861806869507, "uptime": 3783.1390034040014, "examples_seen": 20070400.0, "progress": 0.17406285800555935, "epoch": 15.665717271831072, "img/sec/core": 684.6916039982674, "core_hours_NVIDIA A100-SXM4-40GB": 7.82946425145334, "core_hours": 7.82946425145334} {"step": 19650, "global_schedule": 0.9783368110656738, "l2_grads": 1.2169890403747559, "l2_params": 324.6741638183594, "l2_updates": 1.0019816160202026, "train/loss": 3.220850706100464, "uptime": 3792.2420220370004, "examples_seen": 20121600.0, "progress": 0.17450689590863477, "epoch": 15.70568083630003, "img/sec/core": 703.063484545621, "core_hours_NVIDIA A100-SXM4-40GB": 7.849693181748893, "core_hours": 7.849693181748893} {"step": 19700, "global_schedule": 0.9781133532524109, "l2_grads": 1.225382685661316, "l2_params": 324.7662658691406, "l2_updates": 1.0062568187713623, "train/loss": 4.082762241363525, "uptime": 3800.8745174450014, "examples_seen": 20172800.0, "progress": 0.17495093381171017, "epoch": 15.745644400768986, "img/sec/core": 741.3846978786919, "core_hours_NVIDIA A100-SXM4-40GB": 7.868876504877784, "core_hours": 7.868876504877784} {"step": 19750, "global_schedule": 0.977888822555542, "l2_grads": 1.0184621810913086, "l2_params": 324.8125, "l2_updates": 1.0161411762237549, "train/loss": 4.239189147949219, "uptime": 3809.7048481420006, "examples_seen": 20224000.0, "progress": 0.17539497171478557, "epoch": 15.785607965237944, "img/sec/core": 724.7746680851811, "core_hours_NVIDIA A100-SXM4-40GB": 7.888499461982226, "core_hours": 7.888499461982226} {"step": 19800, "global_schedule": 0.9776630997657776, "l2_grads": 1.1629981994628906, "l2_params": 324.9288024902344, "l2_updates": 1.057943344116211, "train/loss": 3.1884751319885254, "uptime": 3818.4076025169998, "examples_seen": 20275200.0, "progress": 0.17583900961786098, "epoch": 15.8255715297069, "img/sec/core": 735.3993602744464, "core_hours_NVIDIA A100-SXM4-40GB": 7.907838916148891, "core_hours": 7.907838916148891} {"step": 19850, "global_schedule": 0.9774363040924072, "l2_grads": 1.1418782472610474, "l2_params": 325.0881042480469, "l2_updates": 1.0477712154388428, "train/loss": 5.593245029449463, "uptime": 3827.122255247001, "examples_seen": 20326400.0, "progress": 0.17628304752093638, "epoch": 15.865535094175858, "img/sec/core": 734.3952993063489, "core_hours_NVIDIA A100-SXM4-40GB": 7.927204811104448, "core_hours": 7.927204811104448} {"step": 19900, "global_schedule": 0.9772083759307861, "l2_grads": 1.050741195678711, "l2_params": 325.1816711425781, "l2_updates": 1.0303764343261719, "train/loss": 5.547584533691406, "uptime": 3835.6303505160013, "examples_seen": 20377600.0, "progress": 0.1767270854240118, "epoch": 15.905498658644813, "img/sec/core": 752.2247691934772, "core_hours_NVIDIA A100-SXM4-40GB": 7.946111689480006, "core_hours": 7.946111689480006} {"step": 19950, "global_schedule": 0.9769793748855591, "l2_grads": 1.1996591091156006, "l2_params": 325.2802734375, "l2_updates": 1.0508407354354858, "train/loss": 3.3319003582000732, "uptime": 3844.3957677430008, "examples_seen": 20428800.0, "progress": 0.1771711233270872, "epoch": 15.94546222311377, "img/sec/core": 730.1420838572906, "core_hours_NVIDIA A100-SXM4-40GB": 7.965590394428893, "core_hours": 7.965590394428893} {"step": 20000, "global_schedule": 0.9767491817474365, "l2_grads": 0.993341863155365, "l2_params": 325.4014892578125, "l2_updates": 1.022772192955017, "train/loss": 5.137252330780029, "uptime": 3853.1746253640013, "examples_seen": 20480000.0, "progress": 0.1776151612301626, "epoch": 15.985425787582727, "img/sec/core": 729.0242394056065, "core_hours_NVIDIA A100-SXM4-40GB": 7.985098966920005, "core_hours": 7.985098966920005, "val/acc@1": 0.5195, "val/loss": 2.1072034521484375, "z/secs/eval/val": 2.638215857999967} {"step": 20050, "global_schedule": 0.976517915725708, "l2_grads": 1.1626245975494385, "l2_params": 325.45269775390625, "l2_updates": 1.0256102085113525, "train/loss": 3.241736888885498, "uptime": 3865.758291084001, "examples_seen": 20531200.0, "progress": 0.178059199133238, "epoch": 16.025389352051683, "img/sec/core": 715.9190014284258, "core_hours_NVIDIA A100-SXM4-40GB": 8.004964653113339, "core_hours": 8.004964653113339} {"step": 20100, "global_schedule": 0.9762855768203735, "l2_grads": 1.0615308284759521, "l2_params": 325.562744140625, "l2_updates": 1.0356947183609009, "train/loss": 3.7913901805877686, "uptime": 3874.5501333760003, "examples_seen": 20582400.0, "progress": 0.17850323703631343, "epoch": 16.06535291652064, "img/sec/core": 727.9475435795873, "core_hours_NVIDIA A100-SXM4-40GB": 8.024502080428894, "core_hours": 8.024502080428894} {"step": 20150, "global_schedule": 0.9760520458221436, "l2_grads": 0.9520306587219238, "l2_params": 325.67364501953125, "l2_updates": 0.9972889423370361, "train/loss": 4.936070442199707, "uptime": 3883.385021115, "examples_seen": 20633600.0, "progress": 0.17894727493938883, "epoch": 16.105316480989597, "img/sec/core": 724.4008287449361, "core_hours_NVIDIA A100-SXM4-40GB": 8.044135164293339, "core_hours": 8.044135164293339} {"step": 20200, "global_schedule": 0.9758174419403076, "l2_grads": 1.1503435373306274, "l2_params": 325.80828857421875, "l2_updates": 1.0224547386169434, "train/loss": 4.302257537841797, "uptime": 3892.8476347840005, "examples_seen": 20684800.0, "progress": 0.17939131284246423, "epoch": 16.145280045458556, "img/sec/core": 676.345904405512, "core_hours_NVIDIA A100-SXM4-40GB": 8.065163194668894, "core_hours": 8.065163194668894} {"step": 20250, "global_schedule": 0.9755816459655762, "l2_grads": 1.301679015159607, "l2_params": 325.9251403808594, "l2_updates": 1.006726622581482, "train/loss": 3.0479724407196045, "uptime": 3901.620635022, "examples_seen": 20736000.0, "progress": 0.17983535074553963, "epoch": 16.18524360992751, "img/sec/core": 729.5109798674108, "core_hours_NVIDIA A100-SXM4-40GB": 8.084658750753338, "core_hours": 8.084658750753338} {"step": 20300, "global_schedule": 0.9753448367118835, "l2_grads": 1.1111423969268799, "l2_params": 326.01763916015625, "l2_updates": 1.0395041704177856, "train/loss": 2.940876007080078, "uptime": 3910.841500919001, "examples_seen": 20787200.0, "progress": 0.18027938864861504, "epoch": 16.22520717439647, "img/sec/core": 694.0779826416734, "core_hours_NVIDIA A100-SXM4-40GB": 8.105149563857784, "core_hours": 8.105149563857784} {"step": 20350, "global_schedule": 0.9751068353652954, "l2_grads": 1.1273605823516846, "l2_params": 326.1114807128906, "l2_updates": 1.055743932723999, "train/loss": 2.937285900115967, "uptime": 3919.81825982, "examples_seen": 20838400.0, "progress": 0.18072342655169046, "epoch": 16.265170738865425, "img/sec/core": 712.952199182695, "core_hours_NVIDIA A100-SXM4-40GB": 8.125097916971116, "core_hours": 8.125097916971116} {"step": 20400, "global_schedule": 0.9748678207397461, "l2_grads": 1.2519522905349731, "l2_params": 326.2327880859375, "l2_updates": 1.0428379774093628, "train/loss": 3.070117473602295, "uptime": 3929.4408021750005, "examples_seen": 20889600.0, "progress": 0.18116746445476586, "epoch": 16.30513430333438, "img/sec/core": 665.1048926455705, "core_hours_NVIDIA A100-SXM4-40GB": 8.146481344426672, "core_hours": 8.146481344426672} {"step": 20450, "global_schedule": 0.9746276140213013, "l2_grads": 1.4089399576187134, "l2_params": 326.2900695800781, "l2_updates": 0.9556027054786682, "train/loss": 3.158996105194092, "uptime": 3939.006590145, "examples_seen": 20940800.0, "progress": 0.18161150235784126, "epoch": 16.34509786780334, "img/sec/core": 669.0509992560993, "core_hours_NVIDIA A100-SXM4-40GB": 8.16773865102667, "core_hours": 8.16773865102667} {"step": 20500, "global_schedule": 0.9743863344192505, "l2_grads": 0.9164873361587524, "l2_params": 326.35516357421875, "l2_updates": 0.9531074166297913, "train/loss": 5.236751556396484, "uptime": 3948.804831818001, "examples_seen": 20992000.0, "progress": 0.18205554026091667, "epoch": 16.385061432272295, "img/sec/core": 653.178418494733, "core_hours_NVIDIA A100-SXM4-40GB": 8.189512521411116, "core_hours": 8.189512521411116} {"step": 20550, "global_schedule": 0.9741438627243042, "l2_grads": 0.9559771418571472, "l2_params": 326.4386291503906, "l2_updates": 1.0019710063934326, "train/loss": 4.717892646789551, "uptime": 3958.546615245001, "examples_seen": 21043200.0, "progress": 0.18249957816399207, "epoch": 16.425024996741254, "img/sec/core": 656.9638965963863, "core_hours_NVIDIA A100-SXM4-40GB": 8.211160929026672, "core_hours": 8.211160929026672} {"step": 20600, "global_schedule": 0.9739003777503967, "l2_grads": 1.260766863822937, "l2_params": 326.500244140625, "l2_updates": 1.003686785697937, "train/loss": 3.0365796089172363, "uptime": 3967.915125716001, "examples_seen": 21094400.0, "progress": 0.1829436160670675, "epoch": 16.46498856121021, "img/sec/core": 683.1395470828438, "core_hours_NVIDIA A100-SXM4-40GB": 8.231979841184451, "core_hours": 8.231979841184451} {"step": 20650, "global_schedule": 0.9736557006835938, "l2_grads": 1.3802566528320312, "l2_params": 326.57037353515625, "l2_updates": 1.0058344602584839, "train/loss": 2.9820303916931152, "uptime": 3976.802477665, "examples_seen": 21145600.0, "progress": 0.1833876539701429, "epoch": 16.504952125679164, "img/sec/core": 720.1245136602143, "core_hours_NVIDIA A100-SXM4-40GB": 8.251729512182227, "core_hours": 8.251729512182227} {"step": 20700, "global_schedule": 0.9734100103378296, "l2_grads": 1.3735136985778809, "l2_params": 326.669189453125, "l2_updates": 1.0014286041259766, "train/loss": 2.976224422454834, "uptime": 3985.5897525180008, "examples_seen": 21196800.0, "progress": 0.1838316918732183, "epoch": 16.544915690148123, "img/sec/core": 728.3259152653513, "core_hours_NVIDIA A100-SXM4-40GB": 8.27125678963334, "core_hours": 8.27125678963334} {"step": 20750, "global_schedule": 0.9731631278991699, "l2_grads": 1.1711537837982178, "l2_params": 326.7825012207031, "l2_updates": 1.018262505531311, "train/loss": 3.8283157348632812, "uptime": 3995.0466328790008, "examples_seen": 21248000.0, "progress": 0.1842757297762937, "epoch": 16.58487925461708, "img/sec/core": 676.7559444225899, "core_hours_NVIDIA A100-SXM4-40GB": 8.29227207932445, "core_hours": 8.29227207932445} {"step": 20800, "global_schedule": 0.9729151725769043, "l2_grads": 0.9455167651176453, "l2_params": 326.88604736328125, "l2_updates": 0.9836435914039612, "train/loss": 5.062387466430664, "uptime": 4004.759147681001, "examples_seen": 21299200.0, "progress": 0.18471976767936912, "epoch": 16.624842819086037, "img/sec/core": 658.9436547043225, "core_hours_NVIDIA A100-SXM4-40GB": 8.313855445551118, "core_hours": 8.313855445551118} {"step": 20850, "global_schedule": 0.9726660847663879, "l2_grads": 1.271501898765564, "l2_params": 326.99029541015625, "l2_updates": 1.0017857551574707, "train/loss": 3.344496726989746, "uptime": 4014.508435775, "examples_seen": 21350400.0, "progress": 0.18516380558244452, "epoch": 16.664806383554993, "img/sec/core": 656.4581883614062, "core_hours_NVIDIA A100-SXM4-40GB": 8.33552053020445, "core_hours": 8.33552053020445} {"step": 20900, "global_schedule": 0.9724159240722656, "l2_grads": 1.2288182973861694, "l2_params": 327.048095703125, "l2_updates": 1.0102057456970215, "train/loss": 3.220324993133545, "uptime": 4024.1571242570008, "examples_seen": 21401600.0, "progress": 0.18560784348551992, "epoch": 16.70476994802395, "img/sec/core": 663.3025837593433, "core_hours_NVIDIA A100-SXM4-40GB": 8.35696206016445, "core_hours": 8.35696206016445} {"step": 20950, "global_schedule": 0.9721646308898926, "l2_grads": 1.2923047542572021, "l2_params": 327.1123352050781, "l2_updates": 1.0157848596572876, "train/loss": 3.1139779090881348, "uptime": 4032.884776645, "examples_seen": 21452800.0, "progress": 0.18605188138859532, "epoch": 16.744733512492907, "img/sec/core": 733.3014326739533, "core_hours_NVIDIA A100-SXM4-40GB": 8.376356843248892, "core_hours": 8.376356843248892} {"step": 21000, "global_schedule": 0.9719122052192688, "l2_grads": 1.1350035667419434, "l2_params": 327.2145080566406, "l2_updates": 0.9709814786911011, "train/loss": 3.9238057136535645, "uptime": 4041.7560387330013, "examples_seen": 21504000.0, "progress": 0.18649591929167073, "epoch": 16.784697076961862, "img/sec/core": 721.4306077887288, "core_hours_NVIDIA A100-SXM4-40GB": 8.396070759000006, "core_hours": 8.396070759000006} {"step": 21050, "global_schedule": 0.9716587066650391, "l2_grads": 1.3635507822036743, "l2_params": 327.25640869140625, "l2_updates": 0.9914308190345764, "train/loss": 3.1517386436462402, "uptime": 4051.8652392410004, "examples_seen": 21555200.0, "progress": 0.18693995719474615, "epoch": 16.82466064143082, "img/sec/core": 678.9232389028655, "core_hours_NVIDIA A100-SXM4-40GB": 8.417018962577787, "core_hours": 8.417018962577787} {"step": 21100, "global_schedule": 0.9714040756225586, "l2_grads": 1.2421386241912842, "l2_params": 327.3128356933594, "l2_updates": 1.0518373250961304, "train/loss": 3.0459179878234863, "uptime": 4061.643548074, "examples_seen": 21606400.0, "progress": 0.18738399509782155, "epoch": 16.864624205899776, "img/sec/core": 654.5099064984871, "core_hours_NVIDIA A100-SXM4-40GB": 8.43874853776223, "core_hours": 8.43874853776223} {"step": 21150, "global_schedule": 0.9711483716964722, "l2_grads": 1.41520094871521, "l2_params": 327.3877868652344, "l2_updates": 1.0251973867416382, "train/loss": 3.097912549972534, "uptime": 4071.425637583001, "examples_seen": 21657600.0, "progress": 0.18782803300089695, "epoch": 16.904587770368735, "img/sec/core": 654.2569452171916, "core_hours_NVIDIA A100-SXM4-40GB": 8.460486514448897, "core_hours": 8.460486514448897} {"step": 21200, "global_schedule": 0.9708915948867798, "l2_grads": 1.2907474040985107, "l2_params": 327.4718322753906, "l2_updates": 1.0002003908157349, "train/loss": 3.070769786834717, "uptime": 4081.2131799140006, "examples_seen": 21708800.0, "progress": 0.18827207090397236, "epoch": 16.94455133483769, "img/sec/core": 653.8924464959423, "core_hours_NVIDIA A100-SXM4-40GB": 8.482236608517786, "core_hours": 8.482236608517786} {"step": 21250, "global_schedule": 0.9706336259841919, "l2_grads": 1.2118737697601318, "l2_params": 327.5638732910156, "l2_updates": 1.0311259031295776, "train/loss": 3.273123025894165, "uptime": 4090.9923529240004, "examples_seen": 21760000.0, "progress": 0.18871610880704778, "epoch": 16.98451489930665, "img/sec/core": 654.4520680282078, "core_hours_NVIDIA A100-SXM4-40GB": 8.503968104095565, "core_hours": 8.503968104095565} {"step": 21300, "global_schedule": 0.9703746438026428, "l2_grads": 1.2224184274673462, "l2_params": 327.65325927734375, "l2_updates": 1.045931100845337, "train/loss": 2.900400161743164, "uptime": 4101.490394079001, "examples_seen": 21811200.0, "progress": 0.18916014671012318, "epoch": 17.024478463775605, "img/sec/core": 609.6375414713943, "core_hours_NVIDIA A100-SXM4-40GB": 8.52729708444001, "core_hours": 8.52729708444001} {"step": 21350, "global_schedule": 0.970114529132843, "l2_grads": 0.9799385666847229, "l2_params": 327.7623596191406, "l2_updates": 1.0259661674499512, "train/loss": 4.727677345275879, "uptime": 4111.320722118, "examples_seen": 21862400.0, "progress": 0.18960418461319858, "epoch": 17.06444202824456, "img/sec/core": 651.0464324903246, "core_hours_NVIDIA A100-SXM4-40GB": 8.549142257860007, "core_hours": 8.549142257860007} {"step": 21400, "global_schedule": 0.9698532819747925, "l2_grads": 1.1745034456253052, "l2_params": 327.81689453125, "l2_updates": 1.005108118057251, "train/loss": 3.2388744354248047, "uptime": 4120.947754165001, "examples_seen": 21913600.0, "progress": 0.19004822251627398, "epoch": 17.10440559271352, "img/sec/core": 664.7947123011386, "core_hours_NVIDIA A100-SXM4-40GB": 8.570535662408899, "core_hours": 8.570535662408899} {"step": 21450, "global_schedule": 0.969590961933136, "l2_grads": 1.204001784324646, "l2_params": 327.8368225097656, "l2_updates": 1.0513739585876465, "train/loss": 3.3707969188690186, "uptime": 4129.643064749, "examples_seen": 21964800.0, "progress": 0.19049226041934939, "epoch": 17.144369157182474, "img/sec/core": 736.0289133061693, "core_hours_NVIDIA A100-SXM4-40GB": 8.589858574817784, "core_hours": 8.589858574817784} {"step": 21500, "global_schedule": 0.9693275690078735, "l2_grads": 1.28041410446167, "l2_params": 327.9288330078125, "l2_updates": 1.0346848964691162, "train/loss": 2.9421916007995605, "uptime": 4138.101454803, "examples_seen": 22016000.0, "progress": 0.1909362983224248, "epoch": 17.184332721651433, "img/sec/core": 756.6451723248833, "core_hours_NVIDIA A100-SXM4-40GB": 8.608654997160007, "core_hours": 8.608654997160007} {"step": 21550, "global_schedule": 0.9690630435943604, "l2_grads": 1.2641133069992065, "l2_params": 328.00848388671875, "l2_updates": 1.0351123809814453, "train/loss": 3.042762279510498, "uptime": 4146.633759905, "examples_seen": 22067200.0, "progress": 0.1913803362255002, "epoch": 17.22429628612039, "img/sec/core": 750.0903827852418, "core_hours_NVIDIA A100-SXM4-40GB": 8.627615675164453, "core_hours": 8.627615675164453} {"step": 21600, "global_schedule": 0.9687973856925964, "l2_grads": 0.9602210521697998, "l2_params": 328.09771728515625, "l2_updates": 0.994950532913208, "train/loss": 4.322782039642334, "uptime": 4155.372779456, "examples_seen": 22118400.0, "progress": 0.19182437412857561, "epoch": 17.264259850589344, "img/sec/core": 732.3476006261883, "core_hours_NVIDIA A100-SXM4-40GB": 8.647035718611118, "core_hours": 8.647035718611118} {"step": 21650, "global_schedule": 0.9685306549072266, "l2_grads": 1.4260687828063965, "l2_params": 328.1282043457031, "l2_updates": 1.00872004032135, "train/loss": 3.122709274291992, "uptime": 4163.898855896001, "examples_seen": 22169600.0, "progress": 0.19226841203165101, "epoch": 17.304223415058303, "img/sec/core": 750.6383557592546, "core_hours_NVIDIA A100-SXM4-40GB": 8.665982555144454, "core_hours": 8.665982555144454} {"step": 21700, "global_schedule": 0.968262791633606, "l2_grads": 0.9599906206130981, "l2_params": 328.2051086425781, "l2_updates": 1.0197696685791016, "train/loss": 4.921281814575195, "uptime": 4172.581907192001, "examples_seen": 22220800.0, "progress": 0.19271244993472642, "epoch": 17.344186979527258, "img/sec/core": 737.0680860710698, "core_hours_NVIDIA A100-SXM4-40GB": 8.685278224691121, "core_hours": 8.685278224691121} {"step": 21750, "global_schedule": 0.9679938554763794, "l2_grads": 0.9104562401771545, "l2_params": 328.25299072265625, "l2_updates": 0.9805992841720581, "train/loss": 4.876222133636475, "uptime": 4181.420907869, "examples_seen": 22272000.0, "progress": 0.19315648783780184, "epoch": 17.384150543996217, "img/sec/core": 724.0637526654356, "core_hours_NVIDIA A100-SXM4-40GB": 8.704920448417786, "core_hours": 8.704920448417786} {"step": 21800, "global_schedule": 0.9677238464355469, "l2_grads": 1.2830828428268433, "l2_params": 328.29803466796875, "l2_updates": 1.0422815084457397, "train/loss": 3.0347487926483154, "uptime": 4190.020768879, "examples_seen": 22323200.0, "progress": 0.19360052574087724, "epoch": 17.424114108465172, "img/sec/core": 744.1980739640243, "core_hours_NVIDIA A100-SXM4-40GB": 8.724031250662229, "core_hours": 8.724031250662229} {"step": 21850, "global_schedule": 0.9674527645111084, "l2_grads": 1.3311116695404053, "l2_params": 328.33990478515625, "l2_updates": 1.0088346004486084, "train/loss": 3.084259510040283, "uptime": 4198.638593515001, "examples_seen": 22374400.0, "progress": 0.19404456364395264, "epoch": 17.46407767293413, "img/sec/core": 742.646812893324, "core_hours_NVIDIA A100-SXM4-40GB": 8.743181972075565, "core_hours": 8.743181972075565} {"step": 21900, "global_schedule": 0.9671805500984192, "l2_grads": 0.9402365684509277, "l2_params": 328.4013366699219, "l2_updates": 0.9752943515777588, "train/loss": 4.85453987121582, "uptime": 4207.60952405, "examples_seen": 22425600.0, "progress": 0.19448860154702804, "epoch": 17.504041237403086, "img/sec/core": 713.4154004460615, "core_hours_NVIDIA A100-SXM4-40GB": 8.763117373264452, "core_hours": 8.763117373264452} {"step": 21950, "global_schedule": 0.966907262802124, "l2_grads": 1.4637542963027954, "l2_params": 328.4921569824219, "l2_updates": 1.0303765535354614, "train/loss": 3.0935633182525635, "uptime": 4216.605535683, "examples_seen": 22476800.0, "progress": 0.19493263945010347, "epoch": 17.544004801872042, "img/sec/core": 711.426381055657, "core_hours_NVIDIA A100-SXM4-40GB": 8.783108510226674, "core_hours": 8.783108510226674} {"step": 22000, "global_schedule": 0.9666328430175781, "l2_grads": 1.1616696119308472, "l2_params": 328.5394287109375, "l2_updates": 1.0247483253479004, "train/loss": 2.8468496799468994, "uptime": 4225.094011012001, "examples_seen": 22528000.0, "progress": 0.19537667735317887, "epoch": 17.583968366341, "img/sec/core": 753.9634330012738, "core_hours_NVIDIA A100-SXM4-40GB": 8.801971788735564, "core_hours": 8.801971788735564} {"step": 22050, "global_schedule": 0.9663573503494263, "l2_grads": 1.2377854585647583, "l2_params": 328.5367126464844, "l2_updates": 0.989515483379364, "train/loss": 3.014307737350464, "uptime": 4234.898246759001, "examples_seen": 22579200.0, "progress": 0.19582071525625427, "epoch": 17.623931930809956, "img/sec/core": 702.5886466573141, "core_hours_NVIDIA A100-SXM4-40GB": 8.822214390562234, "core_hours": 8.822214390562234} {"step": 22100, "global_schedule": 0.9660807847976685, "l2_grads": 1.29132080078125, "l2_params": 328.6191101074219, "l2_updates": 1.0262576341629028, "train/loss": 2.894258975982666, "uptime": 4244.596217125001, "examples_seen": 22630400.0, "progress": 0.19626475315932967, "epoch": 17.663895495278915, "img/sec/core": 659.9318989917443, "core_hours_NVIDIA A100-SXM4-40GB": 8.843765435820012, "core_hours": 8.843765435820012} {"step": 22150, "global_schedule": 0.9658030867576599, "l2_grads": 1.2494958639144897, "l2_params": 328.68743896484375, "l2_updates": 1.0245180130004883, "train/loss": 3.526423454284668, "uptime": 4254.265554347001, "examples_seen": 22681600.0, "progress": 0.19670879106240508, "epoch": 17.70385905974787, "img/sec/core": 661.8861099847338, "core_hours_NVIDIA A100-SXM4-40GB": 8.865252851868899, "core_hours": 8.865252851868899} {"step": 22200, "global_schedule": 0.9655243158340454, "l2_grads": 1.174910306930542, "l2_params": 328.7462463378906, "l2_updates": 1.0038206577301025, "train/loss": 3.424184799194336, "uptime": 4262.9750846080005, "examples_seen": 22732800.0, "progress": 0.1971528289654805, "epoch": 17.743822624216826, "img/sec/core": 734.8272304257964, "core_hours_NVIDIA A100-SXM4-40GB": 8.88460736356001, "core_hours": 8.88460736356001} {"step": 22250, "global_schedule": 0.9652444124221802, "l2_grads": 1.3027539253234863, "l2_params": 328.8001708984375, "l2_updates": 0.9912292957305908, "train/loss": 3.121037006378174, "uptime": 4271.834747683, "examples_seen": 22784000.0, "progress": 0.1975968668685559, "epoch": 17.783786188685784, "img/sec/core": 722.3751000260371, "core_hours_NVIDIA A100-SXM4-40GB": 8.904295503726676, "core_hours": 8.904295503726676} {"step": 22300, "global_schedule": 0.9649634957313538, "l2_grads": 1.220533847808838, "l2_params": 328.88067626953125, "l2_updates": 1.00504469871521, "train/loss": 3.158754348754883, "uptime": 4281.269057472, "examples_seen": 22835200.0, "progress": 0.1980409047716313, "epoch": 17.82374975315474, "img/sec/core": 678.3750102696857, "core_hours_NVIDIA A100-SXM4-40GB": 8.925260636591121, "core_hours": 8.925260636591121} {"step": 22350, "global_schedule": 0.9646814465522766, "l2_grads": 1.170172095298767, "l2_params": 328.911376953125, "l2_updates": 1.0193647146224976, "train/loss": 3.489253520965576, "uptime": 4290.886701888001, "examples_seen": 22886400.0, "progress": 0.1984849426747067, "epoch": 17.8637133176237, "img/sec/core": 665.4436079329619, "core_hours_NVIDIA A100-SXM4-40GB": 8.94663317973779, "core_hours": 8.94663317973779} {"step": 22400, "global_schedule": 0.9643983244895935, "l2_grads": 0.9265945553779602, "l2_params": 328.9757385253906, "l2_updates": 0.9897303581237793, "train/loss": 5.2920331954956055, "uptime": 4300.142670077001, "examples_seen": 22937600.0, "progress": 0.19892898057778213, "epoch": 17.903676882092654, "img/sec/core": 691.445764431869, "core_hours_NVIDIA A100-SXM4-40GB": 8.967201997935566, "core_hours": 8.967201997935566} {"step": 22450, "global_schedule": 0.9641140699386597, "l2_grads": 1.3639050722122192, "l2_params": 329.0124206542969, "l2_updates": 0.9900166392326355, "train/loss": 3.070218801498413, "uptime": 4309.692169249001, "examples_seen": 22988800.0, "progress": 0.19937301848085753, "epoch": 17.943640446561613, "img/sec/core": 670.192214767131, "core_hours_NVIDIA A100-SXM4-40GB": 8.988423107206678, "core_hours": 8.988423107206678} {"step": 22500, "global_schedule": 0.9638288021087646, "l2_grads": 1.2325907945632935, "l2_params": 329.0225524902344, "l2_updates": 1.020062804222107, "train/loss": 2.848306894302368, "uptime": 4319.16937899, "examples_seen": 23040000.0, "progress": 0.19981705638393293, "epoch": 17.983604011030568, "img/sec/core": 675.3042482866482, "core_hours_NVIDIA A100-SXM4-40GB": 9.009483573297786, "core_hours": 9.009483573297786, "val/acc@1": 0.5434, "val/loss": 1.9798643920898438, "z/secs/eval/val": 2.689539174998572} {"step": 22550, "global_schedule": 0.9635424017906189, "l2_grads": 1.2347959280014038, "l2_params": 329.1133117675781, "l2_updates": 1.0366653203964233, "train/loss": 3.0304205417633057, "uptime": 4331.014033451, "examples_seen": 23091200.0, "progress": 0.20026109428700833, "epoch": 18.023567575499523, "img/sec/core": 699.1392710070514, "core_hours_NVIDIA A100-SXM4-40GB": 9.029826046982231, "core_hours": 9.029826046982231} {"step": 22600, "global_schedule": 0.9632549285888672, "l2_grads": 0.9044938683509827, "l2_params": 329.1844787597656, "l2_updates": 0.9417725801467896, "train/loss": 4.806496620178223, "uptime": 4339.981768906, "examples_seen": 23142400.0, "progress": 0.20070513219008373, "epoch": 18.063531139968482, "img/sec/core": 713.6695804771305, "core_hours_NVIDIA A100-SXM4-40GB": 9.049754347993343, "core_hours": 9.049754347993343} {"step": 22650, "global_schedule": 0.9629663228988647, "l2_grads": 1.3431118726730347, "l2_params": 329.1837158203125, "l2_updates": 0.9928632378578186, "train/loss": 3.0338521003723145, "uptime": 4349.245840102001, "examples_seen": 23193600.0, "progress": 0.20114917009315916, "epoch": 18.103494704437438, "img/sec/core": 690.8409774271335, "core_hours_NVIDIA A100-SXM4-40GB": 9.070341172873345, "core_hours": 9.070341172873345} {"step": 22700, "global_schedule": 0.9626767039299011, "l2_grads": 1.380053162574768, "l2_params": 329.2115173339844, "l2_updates": 0.9892403483390808, "train/loss": 2.986790418624878, "uptime": 4358.648233013, "examples_seen": 23244800.0, "progress": 0.20159320799623456, "epoch": 18.143458268906397, "img/sec/core": 680.6777870889915, "core_hours_NVIDIA A100-SXM4-40GB": 9.091235379342232, "core_hours": 9.091235379342232} {"step": 22750, "global_schedule": 0.9623859524726868, "l2_grads": 1.3046338558197021, "l2_params": 329.2612609863281, "l2_updates": 0.9593276977539062, "train/loss": 3.2893121242523193, "uptime": 4367.647759907, "examples_seen": 23296000.0, "progress": 0.20203724589930996, "epoch": 18.183421833375352, "img/sec/core": 711.1484942910478, "core_hours_NVIDIA A100-SXM4-40GB": 9.111234327995565, "core_hours": 9.111234327995565} {"step": 22800, "global_schedule": 0.9620941281318665, "l2_grads": 0.9718397259712219, "l2_params": 329.27752685546875, "l2_updates": 0.9996173977851868, "train/loss": 5.210874557495117, "uptime": 4376.764008872, "examples_seen": 23347200.0, "progress": 0.20248128380238536, "epoch": 18.22338539784431, "img/sec/core": 702.0431346896933, "core_hours_NVIDIA A100-SXM4-40GB": 9.131492659028899, "core_hours": 9.131492659028899} {"step": 22850, "global_schedule": 0.9618012309074402, "l2_grads": 0.9618927836418152, "l2_params": 329.337646484375, "l2_updates": 0.9810810089111328, "train/loss": 5.4489970207214355, "uptime": 4385.362943191001, "examples_seen": 23398400.0, "progress": 0.20292532170546076, "epoch": 18.263348962313266, "img/sec/core": 744.2782747924665, "core_hours_NVIDIA A100-SXM4-40GB": 9.150601401960012, "core_hours": 9.150601401960012} {"step": 22900, "global_schedule": 0.961507260799408, "l2_grads": 1.2386882305145264, "l2_params": 329.3624572753906, "l2_updates": 1.0355141162872314, "train/loss": 2.9097161293029785, "uptime": 4394.477720129, "examples_seen": 23449600.0, "progress": 0.2033693596085362, "epoch": 18.30331252678222, "img/sec/core": 702.1565139261968, "core_hours_NVIDIA A100-SXM4-40GB": 9.17085646182223, "core_hours": 9.17085646182223} {"step": 22950, "global_schedule": 0.961212158203125, "l2_grads": 1.3085209131240845, "l2_params": 329.4681396484375, "l2_updates": 1.012656807899475, "train/loss": 2.9474735260009766, "uptime": 4404.073554547, "examples_seen": 23500800.0, "progress": 0.2038133975116116, "epoch": 18.34327609125118, "img/sec/core": 666.9560687703072, "core_hours_NVIDIA A100-SXM4-40GB": 9.192180538306674, "core_hours": 9.192180538306674} {"step": 23000, "global_schedule": 0.9609160423278809, "l2_grads": 1.171958565711975, "l2_params": 329.54425048828125, "l2_updates": 1.0190246105194092, "train/loss": 3.3153908252716064, "uptime": 4413.066061621001, "examples_seen": 23552000.0, "progress": 0.204257435414687, "epoch": 18.383239655720136, "img/sec/core": 711.7036380770392, "core_hours_NVIDIA A100-SXM4-40GB": 9.212163887360012, "core_hours": 9.212163887360012} {"step": 23050, "global_schedule": 0.960618793964386, "l2_grads": 0.8877196907997131, "l2_params": 329.57220458984375, "l2_updates": 0.9993690252304077, "train/loss": 4.912896633148193, "uptime": 4422.273292897, "examples_seen": 23603200.0, "progress": 0.2047014733177624, "epoch": 18.423203220189095, "img/sec/core": 782.745875142359, "core_hours_NVIDIA A100-SXM4-40GB": 9.230333542000011, "core_hours": 9.230333542000011} {"step": 23100, "global_schedule": 0.9603204727172852, "l2_grads": 1.2957161664962769, "l2_params": 329.6136779785156, "l2_updates": 0.9811895489692688, "train/loss": 3.1257810592651367, "uptime": 4430.937623092001, "examples_seen": 23654400.0, "progress": 0.20514551122083782, "epoch": 18.46316678465805, "img/sec/core": 738.6606761239044, "core_hours_NVIDIA A100-SXM4-40GB": 9.249587609100013, "core_hours": 9.249587609100013} {"step": 23150, "global_schedule": 0.9600211381912231, "l2_grads": 1.2253938913345337, "l2_params": 329.6544494628906, "l2_updates": 1.0353233814239502, "train/loss": 3.453372001647949, "uptime": 4440.036191175001, "examples_seen": 23705600.0, "progress": 0.20558954912391322, "epoch": 18.503130349127005, "img/sec/core": 703.4073869225624, "core_hours_NVIDIA A100-SXM4-40GB": 9.269806649284456, "core_hours": 9.269806649284456} {"step": 23200, "global_schedule": 0.9597206115722656, "l2_grads": 1.3246161937713623, "l2_params": 329.7247619628906, "l2_updates": 0.9877734780311584, "train/loss": 2.969752788543701, "uptime": 4448.661685206, "examples_seen": 23756800.0, "progress": 0.20603358702698862, "epoch": 18.543093913595964, "img/sec/core": 741.9864852956922, "core_hours_NVIDIA A100-SXM4-40GB": 9.28897441379779, "core_hours": 9.28897441379779} {"step": 23250, "global_schedule": 0.9594191312789917, "l2_grads": 1.1701287031173706, "l2_params": 329.7170715332031, "l2_updates": 1.032720923423767, "train/loss": 2.772886276245117, "uptime": 4457.776736267, "examples_seen": 23808000.0, "progress": 0.20647762493006402, "epoch": 18.58305747806492, "img/sec/core": 702.135397505664, "core_hours_NVIDIA A100-SXM4-40GB": 9.309230082822234, "core_hours": 9.309230082822234} {"step": 23300, "global_schedule": 0.9591164588928223, "l2_grads": 1.1017911434173584, "l2_params": 329.7979431152344, "l2_updates": 1.0040934085845947, "train/loss": 4.275134086608887, "uptime": 4467.287552555001, "examples_seen": 23859200.0, "progress": 0.20692166283313942, "epoch": 18.62302104253388, "img/sec/core": 672.9180552120047, "core_hours_NVIDIA A100-SXM4-40GB": 9.330365230128903, "core_hours": 9.330365230128903} {"step": 23350, "global_schedule": 0.9588127732276917, "l2_grads": 1.1863466501235962, "l2_params": 329.8531799316406, "l2_updates": 1.0124709606170654, "train/loss": 3.053398847579956, "uptime": 4477.040241956001, "examples_seen": 23910400.0, "progress": 0.20736570073621485, "epoch": 18.662984607002834, "img/sec/core": 656.229244760253, "core_hours_NVIDIA A100-SXM4-40GB": 9.352037873242237, "core_hours": 9.352037873242237} {"step": 23400, "global_schedule": 0.9585080146789551, "l2_grads": 1.0386228561401367, "l2_params": 329.9232177734375, "l2_updates": 0.9701112508773804, "train/loss": 4.0552077293396, "uptime": 4485.925039, "examples_seen": 23961600.0, "progress": 0.20780973863929025, "epoch": 18.702948171471792, "img/sec/core": 720.3315920787622, "core_hours_NVIDIA A100-SXM4-40GB": 9.371781866673343, "core_hours": 9.371781866673343} {"step": 23450, "global_schedule": 0.9582021236419678, "l2_grads": 1.1209371089935303, "l2_params": 329.92803955078125, "l2_updates": 0.9460447430610657, "train/loss": 5.548792839050293, "uptime": 4494.587638661, "examples_seen": 24012800.0, "progress": 0.20825377654236565, "epoch": 18.742911735940748, "img/sec/core": 738.8082389185637, "core_hours_NVIDIA A100-SXM4-40GB": 9.391032088142232, "core_hours": 9.391032088142232} {"step": 23500, "global_schedule": 0.9578952789306641, "l2_grads": 0.9485580921173096, "l2_params": 329.9344177246094, "l2_updates": 0.9955036044120789, "train/loss": 5.344472885131836, "uptime": 4503.508039561, "examples_seen": 24064000.0, "progress": 0.20869781444544105, "epoch": 18.782875300409703, "img/sec/core": 717.4565439093293, "core_hours_NVIDIA A100-SXM4-40GB": 9.410855201253346, "core_hours": 9.410855201253346} {"step": 23550, "global_schedule": 0.9575872421264648, "l2_grads": 1.254069447517395, "l2_params": 329.9483947753906, "l2_updates": 1.0272142887115479, "train/loss": 2.912797451019287, "uptime": 4512.958377607001, "examples_seen": 24115200.0, "progress": 0.20914185234851648, "epoch": 18.822838864878662, "img/sec/core": 677.2244515325285, "core_hours_NVIDIA A100-SXM4-40GB": 9.431855952466682, "core_hours": 9.431855952466682} {"step": 23600, "global_schedule": 0.9572781324386597, "l2_grads": 1.261633038520813, "l2_params": 329.96661376953125, "l2_updates": 1.0020697116851807, "train/loss": 3.015470266342163, "uptime": 4522.603022551, "examples_seen": 24166400.0, "progress": 0.20958589025159188, "epoch": 18.862802429347617, "img/sec/core": 663.5806747849326, "core_hours_NVIDIA A100-SXM4-40GB": 9.45328849678668, "core_hours": 9.45328849678668} {"step": 23650, "global_schedule": 0.9569680690765381, "l2_grads": 1.3225995302200317, "l2_params": 330.0583190917969, "l2_updates": 1.0254288911819458, "train/loss": 2.9447221755981445, "uptime": 4531.973043363001, "examples_seen": 24217600.0, "progress": 0.21002992815466728, "epoch": 18.902765993816576, "img/sec/core": 683.0294327418247, "core_hours_NVIDIA A100-SXM4-40GB": 9.474110765257793, "core_hours": 9.474110765257793} {"step": 23700, "global_schedule": 0.956656813621521, "l2_grads": 1.3857941627502441, "l2_params": 330.1068420410156, "l2_updates": 1.0037541389465332, "train/loss": 2.900250196456909, "uptime": 4540.763590782, "examples_seen": 24268800.0, "progress": 0.21047396605774268, "epoch": 18.94272955828553, "img/sec/core": 728.0547723532544, "core_hours_NVIDIA A100-SXM4-40GB": 9.49364531507779, "core_hours": 9.49364531507779} {"step": 23750, "global_schedule": 0.9563445448875427, "l2_grads": 1.21437668800354, "l2_params": 330.1401672363281, "l2_updates": 0.9974298477172852, "train/loss": 3.300863742828369, "uptime": 4549.405182739001, "examples_seen": 24320000.0, "progress": 0.21091800396081808, "epoch": 18.98269312275449, "img/sec/core": 740.6042812302815, "core_hours_NVIDIA A100-SXM4-40GB": 9.512848852760015, "core_hours": 9.512848852760015} {"step": 23800, "global_schedule": 0.9560312032699585, "l2_grads": 0.974838137626648, "l2_params": 330.1827087402344, "l2_updates": 0.9754366278648376, "train/loss": 5.029320240020752, "uptime": 4558.973110742001, "examples_seen": 24371200.0, "progress": 0.2113620418638935, "epoch": 19.022656687223446, "img/sec/core": 668.9013543991299, "core_hours_NVIDIA A100-SXM4-40GB": 9.534110914988903, "core_hours": 9.534110914988903} {"step": 23850, "global_schedule": 0.9557167887687683, "l2_grads": 1.1366995573043823, "l2_params": 330.204833984375, "l2_updates": 0.9916428327560425, "train/loss": 3.2651939392089844, "uptime": 4567.473321284, "examples_seen": 24422400.0, "progress": 0.2118060797669689, "epoch": 19.0626202516924, "img/sec/core": 752.9225268454271, "core_hours_NVIDIA A100-SXM4-40GB": 9.553000271748902, "core_hours": 9.553000271748902} {"step": 23900, "global_schedule": 0.9554013013839722, "l2_grads": 1.0756791830062866, "l2_params": 330.2409973144531, "l2_updates": 1.022942304611206, "train/loss": 3.365732192993164, "uptime": 4576.776661150001, "examples_seen": 24473600.0, "progress": 0.2122501176700443, "epoch": 19.10258381616136, "img/sec/core": 687.9249916891495, "core_hours_NVIDIA A100-SXM4-40GB": 9.573674360340014, "core_hours": 9.573674360340014} {"step": 23950, "global_schedule": 0.9550847411155701, "l2_grads": 1.354775309562683, "l2_params": 330.3694763183594, "l2_updates": 0.9955761432647705, "train/loss": 3.029754161834717, "uptime": 4586.2593332060005, "examples_seen": 24524800.0, "progress": 0.21269415557311971, "epoch": 19.142547380630315, "img/sec/core": 674.9152519674922, "core_hours_NVIDIA A100-SXM4-40GB": 9.594746964908902, "core_hours": 9.594746964908902} {"step": 24000, "global_schedule": 0.954767107963562, "l2_grads": 1.1018584966659546, "l2_params": 330.4258728027344, "l2_updates": 1.0245305299758911, "train/loss": 3.7859079837799072, "uptime": 4595.727278039001, "examples_seen": 24576000.0, "progress": 0.21313819347619511, "epoch": 19.182510945099274, "img/sec/core": 675.9650708665581, "core_hours_NVIDIA A100-SXM4-40GB": 9.61578684231557, "core_hours": 9.61578684231557} {"step": 24050, "global_schedule": 0.9544484615325928, "l2_grads": 1.3351974487304688, "l2_params": 330.4460754394531, "l2_updates": 0.9693443179130554, "train/loss": 2.900634527206421, "uptime": 4605.478748501, "examples_seen": 24627200.0, "progress": 0.21358223137927054, "epoch": 19.22247450956823, "img/sec/core": 731.1455981950103, "core_hours_NVIDIA A100-SXM4-40GB": 9.6352388122889, "core_hours": 9.6352388122889} {"step": 24100, "global_schedule": 0.9541286826133728, "l2_grads": 1.0568839311599731, "l2_params": 330.45068359375, "l2_updates": 0.9937491416931152, "train/loss": 4.252491474151611, "uptime": 4614.334147192001, "examples_seen": 24678400.0, "progress": 0.21402626928234594, "epoch": 19.262438074037185, "img/sec/core": 722.7229652013029, "core_hours_NVIDIA A100-SXM4-40GB": 9.65491747604668, "core_hours": 9.65491747604668} {"step": 24150, "global_schedule": 0.9538078904151917, "l2_grads": 1.2955483198165894, "l2_params": 330.5135498046875, "l2_updates": 0.9860426187515259, "train/loss": 2.9003844261169434, "uptime": 4623.076964399001, "examples_seen": 24729600.0, "progress": 0.21447030718542134, "epoch": 19.302401638506144, "img/sec/core": 732.0294875748045, "core_hours_NVIDIA A100-SXM4-40GB": 9.674345958728901, "core_hours": 9.674345958728901} {"step": 24200, "global_schedule": 0.9534859657287598, "l2_grads": 1.1966979503631592, "l2_params": 330.5052795410156, "l2_updates": 0.9900702834129333, "train/loss": 4.204549312591553, "uptime": 4631.487907959001, "examples_seen": 24780800.0, "progress": 0.21491434508849674, "epoch": 19.3423652029751, "img/sec/core": 760.9134402513774, "core_hours_NVIDIA A100-SXM4-40GB": 9.693036944417791, "core_hours": 9.693036944417791} {"step": 24250, "global_schedule": 0.9531630277633667, "l2_grads": 1.1009619235992432, "l2_params": 330.5238342285156, "l2_updates": 0.9970617294311523, "train/loss": 4.732241630554199, "uptime": 4640.2175207380005, "examples_seen": 24832000.0, "progress": 0.21535838299157217, "epoch": 19.382328767444058, "img/sec/core": 733.136756695117, "core_hours_NVIDIA A100-SXM4-40GB": 9.71243608392668, "core_hours": 9.71243608392668} {"step": 24300, "global_schedule": 0.9528390169143677, "l2_grads": 1.1328229904174805, "l2_params": 330.594482421875, "l2_updates": 1.017040729522705, "train/loss": 3.3002686500549316, "uptime": 4648.946685869001, "examples_seen": 24883200.0, "progress": 0.21580242089464757, "epoch": 19.422292331913013, "img/sec/core": 733.1743533263146, "core_hours_NVIDIA A100-SXM4-40GB": 9.731834228662235, "core_hours": 9.731834228662235} {"step": 24350, "global_schedule": 0.9525139927864075, "l2_grads": 1.2309964895248413, "l2_params": 330.6044006347656, "l2_updates": 1.0007027387619019, "train/loss": 3.077965497970581, "uptime": 4657.559846215001, "examples_seen": 24934400.0, "progress": 0.21624645879772297, "epoch": 19.462255896381972, "img/sec/core": 743.0489788771088, "core_hours_NVIDIA A100-SXM4-40GB": 9.75097458498668, "core_hours": 9.75097458498668} {"step": 24400, "global_schedule": 0.9521878957748413, "l2_grads": 1.3438254594802856, "l2_params": 330.64837646484375, "l2_updates": 1.0025238990783691, "train/loss": 2.9183363914489746, "uptime": 4667.073731420001, "examples_seen": 24985600.0, "progress": 0.21669049670079837, "epoch": 19.502219460850927, "img/sec/core": 672.7009904046585, "core_hours_NVIDIA A100-SXM4-40GB": 9.772116552108905, "core_hours": 9.772116552108905} {"step": 24450, "global_schedule": 0.9518606662750244, "l2_grads": 1.2770429849624634, "l2_params": 330.6410827636719, "l2_updates": 0.9935330152511597, "train/loss": 3.1783640384674072, "uptime": 4676.625994339001, "examples_seen": 25036800.0, "progress": 0.21713453460387377, "epoch": 19.542183025319883, "img/sec/core": 669.998308701286, "core_hours_NVIDIA A100-SXM4-40GB": 9.793343803040015, "core_hours": 9.793343803040015} {"step": 24500, "global_schedule": 0.9515324234962463, "l2_grads": 1.4396165609359741, "l2_params": 330.68878173828125, "l2_updates": 0.924547553062439, "train/loss": 3.2185497283935547, "uptime": 4686.243013968, "examples_seen": 25088000.0, "progress": 0.2175785725069492, "epoch": 19.58214658978884, "img/sec/core": 665.4868396755487, "core_hours_NVIDIA A100-SXM4-40GB": 9.814714957771121, "core_hours": 9.814714957771121} {"step": 24550, "global_schedule": 0.9512031078338623, "l2_grads": 1.227728247642517, "l2_params": 330.66064453125, "l2_updates": 1.0167367458343506, "train/loss": 2.9753313064575195, "uptime": 4695.231724078001, "examples_seen": 25139200.0, "progress": 0.2180226104100246, "epoch": 19.622110154257797, "img/sec/core": 712.0042722124399, "core_hours_NVIDIA A100-SXM4-40GB": 9.83468986912668, "core_hours": 9.83468986912668} {"step": 24600, "global_schedule": 0.9508727788925171, "l2_grads": 1.2641593217849731, "l2_params": 330.72119140625, "l2_updates": 0.9780160188674927, "train/loss": 2.8851706981658936, "uptime": 4704.134221677001, "examples_seen": 25190400.0, "progress": 0.2184666483131, "epoch": 19.662073718726756, "img/sec/core": 718.8993795088667, "core_hours_NVIDIA A100-SXM4-40GB": 9.854473197124458, "core_hours": 9.854473197124458} {"step": 24650, "global_schedule": 0.9505413770675659, "l2_grads": 1.3409188985824585, "l2_params": 330.7165832519531, "l2_updates": 1.0049601793289185, "train/loss": 2.8899741172790527, "uptime": 4713.797988347, "examples_seen": 25241600.0, "progress": 0.2189106862161754, "epoch": 19.70203728319571, "img/sec/core": 662.2676455826199, "core_hours_NVIDIA A100-SXM4-40GB": 9.8759482341689, "core_hours": 9.8759482341689} {"step": 24700, "global_schedule": 0.9502089023590088, "l2_grads": 1.2601038217544556, "l2_params": 330.73504638671875, "l2_updates": 0.9849534630775452, "train/loss": 2.9282331466674805, "uptime": 4723.077726855001, "examples_seen": 25292800.0, "progress": 0.21935472411925083, "epoch": 19.742000847664666, "img/sec/core": 689.6746060766468, "core_hours_NVIDIA A100-SXM4-40GB": 9.896569875297791, "core_hours": 9.896569875297791} {"step": 24750, "global_schedule": 0.9498753547668457, "l2_grads": 1.0368709564208984, "l2_params": 330.7854919433594, "l2_updates": 0.9567162990570068, "train/loss": 4.676680088043213, "uptime": 4732.13998493, "examples_seen": 25344000.0, "progress": 0.21979876202232623, "epoch": 19.781964412133625, "img/sec/core": 706.2257493699694, "core_hours_NVIDIA A100-SXM4-40GB": 9.916708226575567, "core_hours": 9.916708226575567} {"step": 24800, "global_schedule": 0.9495407342910767, "l2_grads": 1.1528762578964233, "l2_params": 330.8002624511719, "l2_updates": 0.9792499542236328, "train/loss": 2.993114948272705, "uptime": 4740.997998109, "examples_seen": 25395200.0, "progress": 0.22024279992540163, "epoch": 19.82192797660258, "img/sec/core": 722.5096498131666, "core_hours_NVIDIA A100-SXM4-40GB": 9.936392700306678, "core_hours": 9.936392700306678} {"step": 24850, "global_schedule": 0.9492051601409912, "l2_grads": 1.366659164428711, "l2_params": 330.8100280761719, "l2_updates": 0.9968551397323608, "train/loss": 3.0206549167633057, "uptime": 4749.715768033, "examples_seen": 25446400.0, "progress": 0.22068683782847703, "epoch": 19.86189154107154, "img/sec/core": 734.1327031791405, "core_hours_NVIDIA A100-SXM4-40GB": 9.955765522360013, "core_hours": 9.955765522360013} {"step": 24900, "global_schedule": 0.948868453502655, "l2_grads": 1.291336178779602, "l2_params": 330.8519287109375, "l2_updates": 0.9971383213996887, "train/loss": 3.032876491546631, "uptime": 4758.897220436, "examples_seen": 25497600.0, "progress": 0.22113087573155243, "epoch": 19.901855105540495, "img/sec/core": 697.0574718558776, "core_hours_NVIDIA A100-SXM4-40GB": 9.976168749922234, "core_hours": 9.976168749922234} {"step": 24950, "global_schedule": 0.9485306739807129, "l2_grads": 1.2273375988006592, "l2_params": 330.8517150878906, "l2_updates": 1.001579761505127, "train/loss": 3.106313467025757, "uptime": 4768.142453644001, "examples_seen": 25548800.0, "progress": 0.22157491363462786, "epoch": 19.941818670009454, "img/sec/core": 692.2486275912718, "core_hours_NVIDIA A100-SXM4-40GB": 9.996713712606681, "core_hours": 9.996713712606681} {"step": 25000, "global_schedule": 0.9481918811798096, "l2_grads": 1.1475622653961182, "l2_params": 330.8747253417969, "l2_updates": 0.9951701760292053, "train/loss": 3.5777435302734375, "uptime": 4777.290141046, "examples_seen": 25600000.0, "progress": 0.22201895153770326, "epoch": 19.98178223447841, "img/sec/core": 699.630378559, "core_hours_NVIDIA A100-SXM4-40GB": 10.017041906833345, "core_hours": 10.017041906833345, "val/acc@1": 0.55704, "val/loss": 1.9058630908203125, "z/secs/eval/val": 3.585490748999291} {"step": 25050, "global_schedule": 0.9478520750999451, "l2_grads": 1.115141749382019, "l2_params": 330.89013671875, "l2_updates": 0.9789870381355286, "train/loss": 4.032315731048584, "uptime": 4791.517309891, "examples_seen": 25651200.0, "progress": 0.22246298944077866, "epoch": 20.021745798947364, "img/sec/core": 640.6722734334277, "core_hours_NVIDIA A100-SXM4-40GB": 10.039240810722228, "core_hours": 10.039240810722228} {"step": 25100, "global_schedule": 0.9475111961364746, "l2_grads": 1.1404657363891602, "l2_params": 330.9033508300781, "l2_updates": 0.9518877267837524, "train/loss": 5.343281269073486, "uptime": 4801.079724996, "examples_seen": 25702400.0, "progress": 0.22290702734385406, "epoch": 20.061709363416323, "img/sec/core": 669.286987620291, "core_hours_NVIDIA A100-SXM4-40GB": 10.060490622066673, "core_hours": 10.060490622066673} {"step": 25150, "global_schedule": 0.9471692442893982, "l2_grads": 1.0901892185211182, "l2_params": 330.94287109375, "l2_updates": 0.979508101940155, "train/loss": 4.293720245361328, "uptime": 4810.676866515001, "examples_seen": 25753600.0, "progress": 0.22335106524692946, "epoch": 20.10167292788528, "img/sec/core": 666.8652314158902, "core_hours_NVIDIA A100-SXM4-40GB": 10.08181760322001, "core_hours": 10.08181760322001} {"step": 25200, "global_schedule": 0.9468262195587158, "l2_grads": 1.4393458366394043, "l2_params": 330.9554138183594, "l2_updates": 0.974541962146759, "train/loss": 2.903226613998413, "uptime": 4819.419449457, "examples_seen": 25804800.0, "progress": 0.2237951031500049, "epoch": 20.141636492354237, "img/sec/core": 732.0491029321183, "core_hours_NVIDIA A100-SXM4-40GB": 10.101245565313342, "core_hours": 10.101245565313342} {"step": 25250, "global_schedule": 0.9464821815490723, "l2_grads": 1.092354416847229, "l2_params": 330.98553466796875, "l2_updates": 0.9889104962348938, "train/loss": 4.998215198516846, "uptime": 4828.370456014001, "examples_seen": 25856000.0, "progress": 0.2242391410530803, "epoch": 20.181600056823193, "img/sec/core": 715.0033864062074, "core_hours_NVIDIA A100-SXM4-40GB": 10.121136690995566, "core_hours": 10.121136690995566} {"step": 25300, "global_schedule": 0.9461371302604675, "l2_grads": 1.2623134851455688, "l2_params": 330.9933776855469, "l2_updates": 0.9730231165885925, "train/loss": 2.8470921516418457, "uptime": 4836.913822427001, "examples_seen": 25907200.0, "progress": 0.2246831789561557, "epoch": 20.22156362129215, "img/sec/core": 749.1192219336101, "core_hours_NVIDIA A100-SXM4-40GB": 10.140121949691121, "core_hours": 10.140121949691121} {"step": 25350, "global_schedule": 0.9457910060882568, "l2_grads": 1.325465440750122, "l2_params": 331.0166320800781, "l2_updates": 1.0119425058364868, "train/loss": 2.9058337211608887, "uptime": 4846.518357633, "examples_seen": 25958400.0, "progress": 0.2251272168592311, "epoch": 20.261527185761107, "img/sec/core": 666.3518705207588, "core_hours_NVIDIA A100-SXM4-40GB": 10.161465361260008, "core_hours": 10.161465361260008} {"step": 25400, "global_schedule": 0.9454438090324402, "l2_grads": 1.4052023887634277, "l2_params": 331.03216552734375, "l2_updates": 0.9726819396018982, "train/loss": 3.0331764221191406, "uptime": 4856.078421277001, "examples_seen": 26009600.0, "progress": 0.22557125476230652, "epoch": 20.301490750230062, "img/sec/core": 669.4516101904674, "core_hours_NVIDIA A100-SXM4-40GB": 10.182709947135567, "core_hours": 10.182709947135567} {"step": 25450, "global_schedule": 0.9450955986976624, "l2_grads": 1.3586491346359253, "l2_params": 331.1133117675781, "l2_updates": 0.9722967743873596, "train/loss": 2.92691969871521, "uptime": 4865.716405481, "examples_seen": 26060800.0, "progress": 0.22601529266538192, "epoch": 20.34145431469902, "img/sec/core": 664.0392705089408, "core_hours_NVIDIA A100-SXM4-40GB": 10.204127689811118, "core_hours": 10.204127689811118} {"step": 25500, "global_schedule": 0.9447463750839233, "l2_grads": 1.2268692255020142, "l2_params": 331.1229553222656, "l2_updates": 0.9679329991340637, "train/loss": 3.9797048568725586, "uptime": 4874.556427521, "examples_seen": 26112000.0, "progress": 0.22645933056845732, "epoch": 20.381417879167977, "img/sec/core": 723.9800954161509, "core_hours_NVIDIA A100-SXM4-40GB": 10.22377218323334, "core_hours": 10.22377218323334} {"step": 25550, "global_schedule": 0.9443960189819336, "l2_grads": 1.0704600811004639, "l2_params": 331.1087646484375, "l2_updates": 1.0035769939422607, "train/loss": 4.4042840003967285, "uptime": 4884.085485258, "examples_seen": 26163200.0, "progress": 0.22690336847153272, "epoch": 20.421381443636935, "img/sec/core": 671.6298900309852, "core_hours_NVIDIA A100-SXM4-40GB": 10.244947867093341, "core_hours": 10.244947867093341} {"step": 25600, "global_schedule": 0.9440447092056274, "l2_grads": 1.0986653566360474, "l2_params": 331.1722106933594, "l2_updates": 1.0066722631454468, "train/loss": 3.6700387001037598, "uptime": 4892.741249376, "examples_seen": 26214400.0, "progress": 0.22734740637460812, "epoch": 20.46134500810589, "img/sec/core": 739.3916831317597, "core_hours_NVIDIA A100-SXM4-40GB": 10.264182898466675, "core_hours": 10.264182898466675} {"step": 25650, "global_schedule": 0.9436923265457153, "l2_grads": 1.2445050477981567, "l2_params": 331.219970703125, "l2_updates": 0.9882486462593079, "train/loss": 2.734684705734253, "uptime": 4902.240877735001, "examples_seen": 26265600.0, "progress": 0.22779144427768355, "epoch": 20.501308572574846, "img/sec/core": 673.7105661545253, "core_hours_NVIDIA A100-SXM4-40GB": 10.285293183708898, "core_hours": 10.285293183708898} {"step": 25700, "global_schedule": 0.9433388710021973, "l2_grads": 1.2138025760650635, "l2_params": 331.23077392578125, "l2_updates": 0.9869807958602905, "train/loss": 2.8546478748321533, "uptime": 4911.8523826050005, "examples_seen": 26316800.0, "progress": 0.22823548218075895, "epoch": 20.541272137043805, "img/sec/core": 665.868673695048, "core_hours_NVIDIA A100-SXM4-40GB": 10.306652083420008, "core_hours": 10.306652083420008} {"step": 25750, "global_schedule": 0.9429844617843628, "l2_grads": 1.2346357107162476, "l2_params": 331.2574768066406, "l2_updates": 0.9838303327560425, "train/loss": 2.7891364097595215, "uptime": 4921.242646647001, "examples_seen": 26368000.0, "progress": 0.22867952008383435, "epoch": 20.58123570151276, "img/sec/core": 681.5569798010494, "core_hours_NVIDIA A100-SXM4-40GB": 10.327519336846676, "core_hours": 10.327519336846676} {"step": 25800, "global_schedule": 0.9426289200782776, "l2_grads": 1.1594648361206055, "l2_params": 331.2799987792969, "l2_updates": 0.9750956296920776, "train/loss": 3.4410476684570312, "uptime": 4930.785465699, "examples_seen": 26419200.0, "progress": 0.22912355798690975, "epoch": 20.62119926598172, "img/sec/core": 670.6613596177209, "core_hours_NVIDIA A100-SXM4-40GB": 10.348725601406676, "core_hours": 10.348725601406676} {"step": 25850, "global_schedule": 0.9422723650932312, "l2_grads": 1.192164659500122, "l2_params": 331.2626953125, "l2_updates": 1.017479419708252, "train/loss": 2.857544422149658, "uptime": 4939.624119296001, "examples_seen": 26470400.0, "progress": 0.22956759588998518, "epoch": 20.661162830450674, "img/sec/core": 724.0921855079894, "core_hours_NVIDIA A100-SXM4-40GB": 10.368367053844453, "core_hours": 10.368367053844453} {"step": 25900, "global_schedule": 0.9419147968292236, "l2_grads": 1.2703691720962524, "l2_params": 331.2579345703125, "l2_updates": 1.0007266998291016, "train/loss": 2.863734006881714, "uptime": 4948.258161461001, "examples_seen": 26521600.0, "progress": 0.23001163379306058, "epoch": 20.701126394919633, "img/sec/core": 741.2518815281746, "core_hours_NVIDIA A100-SXM4-40GB": 10.38755381421112, "core_hours": 10.38755381421112} {"step": 25950, "global_schedule": 0.9415562152862549, "l2_grads": 1.2510385513305664, "l2_params": 331.2676696777344, "l2_updates": 0.986708402633667, "train/loss": 2.808952808380127, "uptime": 4957.569814542001, "examples_seen": 26572800.0, "progress": 0.23045567169613598, "epoch": 20.74108995938859, "img/sec/core": 687.3108291650951, "core_hours_NVIDIA A100-SXM4-40GB": 10.408246376613343, "core_hours": 10.408246376613343} {"step": 26000, "global_schedule": 0.9411965608596802, "l2_grads": 1.1809606552124023, "l2_params": 331.27813720703125, "l2_updates": 1.0035916566848755, "train/loss": 3.113835573196411, "uptime": 4966.138716183001, "examples_seen": 26624000.0, "progress": 0.23089970959921138, "epoch": 20.781053523857544, "img/sec/core": 746.8868552975185, "core_hours_NVIDIA A100-SXM4-40GB": 10.427288380260011, "core_hours": 10.427288380260011} {"step": 26050, "global_schedule": 0.9408358335494995, "l2_grads": 1.1436525583267212, "l2_params": 331.33050537109375, "l2_updates": 0.9923545718193054, "train/loss": 3.2830910682678223, "uptime": 4975.998304478, "examples_seen": 26675200.0, "progress": 0.23134374750228678, "epoch": 20.821017088326503, "img/sec/core": 696.1690665052836, "core_hours_NVIDIA A100-SXM4-40GB": 10.447717645084452, "core_hours": 10.447717645084452} {"step": 26100, "global_schedule": 0.9404741525650024, "l2_grads": 1.2977797985076904, "l2_params": 331.3417663574219, "l2_updates": 0.9765986204147339, "train/loss": 2.790498733520508, "uptime": 4985.635290652001, "examples_seen": 26726400.0, "progress": 0.2317877854053622, "epoch": 20.860980652795458, "img/sec/core": 664.1080400495473, "core_hours_NVIDIA A100-SXM4-40GB": 10.469133169915564, "core_hours": 10.469133169915564} {"step": 26150, "global_schedule": 0.9401113986968994, "l2_grads": 1.316003680229187, "l2_params": 331.3786315917969, "l2_updates": 0.959964394569397, "train/loss": 2.842895746231079, "uptime": 4995.348161356, "examples_seen": 26777600.0, "progress": 0.2322318233084376, "epoch": 20.900944217264417, "img/sec/core": 658.9195094880486, "core_hours_NVIDIA A100-SXM4-40GB": 10.490717327035563, "core_hours": 10.490717327035563} {"step": 26200, "global_schedule": 0.9397475719451904, "l2_grads": 1.150922179222107, "l2_params": 331.3769226074219, "l2_updates": 0.9685910940170288, "train/loss": 5.287800312042236, "uptime": 5004.362729735001, "examples_seen": 26828800.0, "progress": 0.232675861211513, "epoch": 20.940907781733372, "img/sec/core": 709.9618895684604, "core_hours_NVIDIA A100-SXM4-40GB": 10.510749701211122, "core_hours": 10.510749701211122} {"step": 26250, "global_schedule": 0.939382791519165, "l2_grads": 1.2169480323791504, "l2_params": 331.3661193847656, "l2_updates": 0.9979656934738159, "train/loss": 3.3686320781707764, "uptime": 5012.975942203, "examples_seen": 26880000.0, "progress": 0.2331198991145884, "epoch": 20.98087134620233, "img/sec/core": 743.0444823900776, "core_hours_NVIDIA A100-SXM4-40GB": 10.52989017336223, "core_hours": 10.52989017336223} {"step": 26300, "global_schedule": 0.9390169382095337, "l2_grads": 1.2687932252883911, "l2_params": 331.3722839355469, "l2_updates": 0.9747973680496216, "train/loss": 2.875392436981201, "uptime": 5022.547116287, "examples_seen": 26931200.0, "progress": 0.23356393701766381, "epoch": 21.020834910671287, "img/sec/core": 668.6744952950943, "core_hours_NVIDIA A100-SXM4-40GB": 10.551159449104453, "core_hours": 10.551159449104453} {"step": 26350, "global_schedule": 0.9386501312255859, "l2_grads": 1.1014765501022339, "l2_params": 331.3968505859375, "l2_updates": 0.9603102207183838, "train/loss": 5.2449846267700195, "uptime": 5031.093859501001, "examples_seen": 26982400.0, "progress": 0.23400797492073924, "epoch": 21.060798475140242, "img/sec/core": 748.8232464402975, "core_hours_NVIDIA A100-SXM4-40GB": 10.570152211802233, "core_hours": 10.570152211802233} {"step": 26400, "global_schedule": 0.9382821917533875, "l2_grads": 1.4275091886520386, "l2_params": 331.4235534667969, "l2_updates": 0.9742172956466675, "train/loss": 2.711059331893921, "uptime": 5039.557365672001, "examples_seen": 27033600.0, "progress": 0.23445201282381464, "epoch": 21.1007620396092, "img/sec/core": 756.1877867980699, "core_hours_NVIDIA A100-SXM4-40GB": 10.588960003293344, "core_hours": 10.588960003293344} {"step": 26450, "global_schedule": 0.9379132986068726, "l2_grads": 1.4513227939605713, "l2_params": 331.4724426269531, "l2_updates": 0.9370592832565308, "train/loss": 2.877793788909912, "uptime": 5048.075037701001, "examples_seen": 27084800.0, "progress": 0.23489605072689004, "epoch": 21.140725604078156, "img/sec/core": 751.3790127407977, "core_hours_NVIDIA A100-SXM4-40GB": 10.607888163357789, "core_hours": 10.607888163357789} {"step": 26500, "global_schedule": 0.9375433325767517, "l2_grads": 1.1477917432785034, "l2_params": 331.4446105957031, "l2_updates": 0.9916449785232544, "train/loss": 3.8790853023529053, "uptime": 5057.298926047, "examples_seen": 27136000.0, "progress": 0.23534008862996544, "epoch": 21.180689168547115, "img/sec/core": 693.8505497820494, "core_hours_NVIDIA A100-SXM4-40GB": 10.628385693015565, "core_hours": 10.628385693015565} {"step": 26550, "global_schedule": 0.9371723532676697, "l2_grads": 1.389998197555542, "l2_params": 331.4941101074219, "l2_updates": 0.9720224142074585, "train/loss": 2.9086315631866455, "uptime": 5066.853382928, "examples_seen": 27187200.0, "progress": 0.23578412653304087, "epoch": 21.22065273301607, "img/sec/core": 669.8444589484717, "core_hours_NVIDIA A100-SXM4-40GB": 10.649617819417786, "core_hours": 10.649617819417786} {"step": 26600, "global_schedule": 0.9368003606796265, "l2_grads": 1.0337214469909668, "l2_params": 331.4857177734375, "l2_updates": 0.9971925020217896, "train/loss": 4.090999603271484, "uptime": 5076.580902748001, "examples_seen": 27238400.0, "progress": 0.23622816443611627, "epoch": 21.260616297485026, "img/sec/core": 657.9272125296685, "core_hours_NVIDIA A100-SXM4-40GB": 10.6712345301289, "core_hours": 10.6712345301289} {"step": 26650, "global_schedule": 0.9364273548126221, "l2_grads": 1.2017741203308105, "l2_params": 331.495361328125, "l2_updates": 0.9969128370285034, "train/loss": 2.8236136436462402, "uptime": 5085.666053273, "examples_seen": 27289600.0, "progress": 0.23667220233919167, "epoch": 21.300579861953985, "img/sec/core": 704.4462260024545, "core_hours_NVIDIA A100-SXM4-40GB": 10.691423753517787, "core_hours": 10.691423753517787} {"step": 26700, "global_schedule": 0.9360532760620117, "l2_grads": 1.1394944190979004, "l2_params": 331.514892578125, "l2_updates": 0.9787942171096802, "train/loss": 3.1653974056243896, "uptime": 5094.2295601490005, "examples_seen": 27340800.0, "progress": 0.23711624024226707, "epoch": 21.34054342642294, "img/sec/core": 747.3573727063141, "core_hours_NVIDIA A100-SXM4-40GB": 10.710453768797786, "core_hours": 10.710453768797786} {"step": 26750, "global_schedule": 0.935678243637085, "l2_grads": 1.1766493320465088, "l2_params": 331.50921630859375, "l2_updates": 1.0060105323791504, "train/loss": 2.9808177947998047, "uptime": 5103.567626648, "examples_seen": 27392000.0, "progress": 0.23756027814534247, "epoch": 21.3805069908919, "img/sec/core": 685.36671919025, "core_hours_NVIDIA A100-SXM4-40GB": 10.731205027684455, "core_hours": 10.731205027684455} {"step": 26800, "global_schedule": 0.9353021383285522, "l2_grads": 1.2492806911468506, "l2_params": 331.5271301269531, "l2_updates": 0.9802409410476685, "train/loss": 2.9623301029205322, "uptime": 5112.569943787001, "examples_seen": 27443200.0, "progress": 0.2380043160484179, "epoch": 21.420470555360854, "img/sec/core": 710.9280756477234, "core_hours_NVIDIA A100-SXM4-40GB": 10.751210176882232, "core_hours": 10.751210176882232} {"step": 26850, "global_schedule": 0.9349250197410583, "l2_grads": 1.3468176126480103, "l2_params": 331.5137939453125, "l2_updates": 0.9701384902000427, "train/loss": 2.9510250091552734, "uptime": 5121.111900958, "examples_seen": 27494400.0, "progress": 0.2384483539514933, "epoch": 21.460434119829813, "img/sec/core": 749.2428107376587, "core_hours_NVIDIA A100-SXM4-40GB": 10.770192303928896, "core_hours": 10.770192303928896} {"step": 26900, "global_schedule": 0.9345468878746033, "l2_grads": 1.2727148532867432, "l2_params": 331.5415954589844, "l2_updates": 0.9456491470336914, "train/loss": 2.709547996520996, "uptime": 5130.224451692, "examples_seen": 27545600.0, "progress": 0.2388923918545687, "epoch": 21.50039768429877, "img/sec/core": 702.3280513677328, "core_hours_NVIDIA A100-SXM4-40GB": 10.79044241667112, "core_hours": 10.79044241667112} {"step": 26950, "global_schedule": 0.934167742729187, "l2_grads": 1.324594497680664, "l2_params": 331.56097412109375, "l2_updates": 0.9929916262626648, "train/loss": 2.8355295658111572, "uptime": 5139.124610656001, "examples_seen": 27596800.0, "progress": 0.2393364297576441, "epoch": 21.540361248767724, "img/sec/core": 719.0882798707744, "core_hours_NVIDIA A100-SXM4-40GB": 10.810220547702233, "core_hours": 10.810220547702233} {"step": 27000, "global_schedule": 0.9337875843048096, "l2_grads": 0.9949339032173157, "l2_params": 331.5553894042969, "l2_updates": 0.9700091481208801, "train/loss": 3.935138702392578, "uptime": 5148.291974772001, "examples_seen": 27648000.0, "progress": 0.23978046766071953, "epoch": 21.580324813236683, "img/sec/core": 698.1287007930914, "core_hours_NVIDIA A100-SXM4-40GB": 10.83059246796001, "core_hours": 10.83059246796001} {"step": 27050, "global_schedule": 0.9334063529968262, "l2_grads": 1.3311781883239746, "l2_params": 331.5491943359375, "l2_updates": 0.9670119881629944, "train/loss": 2.8058018684387207, "uptime": 5158.253143691001, "examples_seen": 27699200.0, "progress": 0.24022450556379493, "epoch": 21.620288377705638, "img/sec/core": 721.313968805956, "core_hours_NVIDIA A100-SXM4-40GB": 10.85030957152001, "core_hours": 10.85030957152001} {"step": 27100, "global_schedule": 0.9330241680145264, "l2_grads": 1.184279203414917, "l2_params": 331.5746765136719, "l2_updates": 0.9358498454093933, "train/loss": 5.317964553833008, "uptime": 5166.805699052, "examples_seen": 27750400.0, "progress": 0.24066854346687033, "epoch": 21.660251942174597, "img/sec/core": 748.3143610136985, "core_hours_NVIDIA A100-SXM4-40GB": 10.869315250100009, "core_hours": 10.869315250100009} {"step": 27150, "global_schedule": 0.9326409697532654, "l2_grads": 0.9407297968864441, "l2_params": 331.549560546875, "l2_updates": 0.9428789615631104, "train/loss": 5.268965721130371, "uptime": 5175.451210305, "examples_seen": 27801600.0, "progress": 0.24111258136994573, "epoch": 21.700215506643552, "img/sec/core": 740.2685408314088, "core_hours_NVIDIA A100-SXM4-40GB": 10.888527497328898, "core_hours": 10.888527497328898} {"step": 27200, "global_schedule": 0.9322566986083984, "l2_grads": 1.2687971591949463, "l2_params": 331.5579528808594, "l2_updates": 0.9826711416244507, "train/loss": 2.8473029136657715, "uptime": 5184.236326699, "examples_seen": 27852800.0, "progress": 0.24155661927302113, "epoch": 21.74017907111251, "img/sec/core": 728.504861286915, "core_hours_NVIDIA A100-SXM4-40GB": 10.90804997820445, "core_hours": 10.90804997820445} {"step": 27250, "global_schedule": 0.9318715333938599, "l2_grads": 1.2404084205627441, "l2_params": 331.5447692871094, "l2_updates": 1.0000942945480347, "train/loss": 2.790231466293335, "uptime": 5193.422893053001, "examples_seen": 27904000.0, "progress": 0.24200065717609656, "epoch": 21.780142635581466, "img/sec/core": 696.6694359326698, "core_hours_NVIDIA A100-SXM4-40GB": 10.92846457010223, "core_hours": 10.92846457010223} {"step": 27300, "global_schedule": 0.9314852952957153, "l2_grads": 1.07126784324646, "l2_params": 331.5583190917969, "l2_updates": 1.0032786130905151, "train/loss": 3.7307629585266113, "uptime": 5201.8042246820005, "examples_seen": 27955200.0, "progress": 0.24244469507917196, "epoch": 21.82010620005042, "img/sec/core": 763.6018097477173, "core_hours_NVIDIA A100-SXM4-40GB": 10.947089751500009, "core_hours": 10.947089751500009} {"step": 27350, "global_schedule": 0.9310979843139648, "l2_grads": 1.291334867477417, "l2_params": 331.5582275390625, "l2_updates": 0.9384451508522034, "train/loss": 2.9309091567993164, "uptime": 5210.237114917001, "examples_seen": 28006400.0, "progress": 0.24288873298224736, "epoch": 21.86006976451938, "img/sec/core": 758.9331559702719, "core_hours_NVIDIA A100-SXM4-40GB": 10.965829507577787, "core_hours": 10.965829507577787} {"step": 27400, "global_schedule": 0.930709719657898, "l2_grads": 1.2260463237762451, "l2_params": 331.5462646484375, "l2_updates": 0.9842491745948792, "train/loss": 2.8033976554870605, "uptime": 5218.928896363001, "examples_seen": 28057600.0, "progress": 0.24333277088532276, "epoch": 21.900033328988336, "img/sec/core": 736.3277643095566, "core_hours_NVIDIA A100-SXM4-40GB": 10.985144577457786, "core_hours": 10.985144577457786} {"step": 27450, "global_schedule": 0.9303204417228699, "l2_grads": 0.9774523973464966, "l2_params": 331.5483093261719, "l2_updates": 0.9439536929130554, "train/loss": 4.888762950897217, "uptime": 5228.187243221, "examples_seen": 28108800.0, "progress": 0.24377680878839816, "epoch": 21.939996893457295, "img/sec/core": 691.2681171012839, "core_hours_NVIDIA A100-SXM4-40GB": 11.005718681586675, "core_hours": 11.005718681586675} {"step": 27500, "global_schedule": 0.9299300909042358, "l2_grads": 1.0474117994308472, "l2_params": 331.5408935546875, "l2_updates": 0.9728769659996033, "train/loss": 4.088371753692627, "uptime": 5237.348864942, "examples_seen": 28160000.0, "progress": 0.2442208466914736, "epoch": 21.97996045792625, "img/sec/core": 698.5662795191088, "core_hours_NVIDIA A100-SXM4-40GB": 11.026077840966675, "core_hours": 11.026077840966675, "val/acc@1": 0.57006, "val/loss": 1.8503551318359375, "z/secs/eval/val": 5.282613954999761} {"step": 27550, "global_schedule": 0.9295388460159302, "l2_grads": 1.1895582675933838, "l2_params": 331.5801696777344, "l2_updates": 0.983575701713562, "train/loss": 3.223783254623413, "uptime": 5252.176391471001, "examples_seen": 28211200.0, "progress": 0.244664884594549, "epoch": 22.019924022395205, "img/sec/core": 670.5946751860002, "core_hours_NVIDIA A100-SXM4-40GB": 11.047286214293344, "core_hours": 11.047286214293344} {"step": 27600, "global_schedule": 0.9291465282440186, "l2_grads": 1.3651340007781982, "l2_params": 331.59136962890625, "l2_updates": 0.9719067811965942, "train/loss": 2.77703595161438, "uptime": 5260.832306445, "examples_seen": 28262400.0, "progress": 0.2451089224976244, "epoch": 22.059887586864164, "img/sec/core": 739.3787969526948, "core_hours_NVIDIA A100-SXM4-40GB": 11.06652158090223, "core_hours": 11.06652158090223} {"step": 27650, "global_schedule": 0.9287532567977905, "l2_grads": 1.3183289766311646, "l2_params": 331.63739013671875, "l2_updates": 1.0052781105041504, "train/loss": 2.7735493183135986, "uptime": 5269.378946983001, "examples_seen": 28313600.0, "progress": 0.2455529604006998, "epoch": 22.09985115133312, "img/sec/core": 748.8322425102014, "core_hours_NVIDIA A100-SXM4-40GB": 11.085514115431122, "core_hours": 11.085514115431122} {"step": 27700, "global_schedule": 0.9283589124679565, "l2_grads": 1.0277128219604492, "l2_params": 331.65399169921875, "l2_updates": 0.9541473984718323, "train/loss": 5.30388879776001, "uptime": 5277.659135894, "examples_seen": 28364800.0, "progress": 0.24599699830377522, "epoch": 22.13981471580208, "img/sec/core": 772.9292252617638, "core_hours_NVIDIA A100-SXM4-40GB": 11.103914535233343, "core_hours": 11.103914535233343} {"step": 27750, "global_schedule": 0.9279636144638062, "l2_grads": 1.2796268463134766, "l2_params": 331.6263732910156, "l2_updates": 0.9905049800872803, "train/loss": 2.7145397663116455, "uptime": 5286.2885749960005, "examples_seen": 28416000.0, "progress": 0.24644103620685062, "epoch": 22.179778280271034, "img/sec/core": 741.6472756052739, "core_hours_NVIDIA A100-SXM4-40GB": 11.123091066571122, "core_hours": 11.123091066571122} {"step": 27800, "global_schedule": 0.9275672435760498, "l2_grads": 1.2017086744308472, "l2_params": 331.6524658203125, "l2_updates": 0.978775143623352, "train/loss": 3.2469069957733154, "uptime": 5294.915847881, "examples_seen": 28467200.0, "progress": 0.24688507410992602, "epoch": 22.219741844739993, "img/sec/core": 741.8334953943057, "core_hours_NVIDIA A100-SXM4-40GB": 11.142262784093344, "core_hours": 11.142262784093344} {"step": 27850, "global_schedule": 0.927169919013977, "l2_grads": 1.1781790256500244, "l2_params": 331.65570068359375, "l2_updates": 0.9656455516815186, "train/loss": 3.669886589050293, "uptime": 5303.438899083001, "examples_seen": 28518400.0, "progress": 0.24732911201300142, "epoch": 22.259705409208948, "img/sec/core": 750.9047931681617, "core_hours_NVIDIA A100-SXM4-40GB": 11.161202897875567, "core_hours": 11.161202897875567} {"step": 27900, "global_schedule": 0.9267716407775879, "l2_grads": 1.2015424966812134, "l2_params": 331.6761474609375, "l2_updates": 0.9752283692359924, "train/loss": 3.1801483631134033, "uptime": 5312.353393858, "examples_seen": 28569600.0, "progress": 0.24777314991607682, "epoch": 22.299668973677903, "img/sec/core": 717.9318807779082, "core_hours_NVIDIA A100-SXM4-40GB": 11.181012886264455, "core_hours": 11.181012886264455} {"step": 27950, "global_schedule": 0.9263722896575928, "l2_grads": 1.4132204055786133, "l2_params": 331.7071228027344, "l2_updates": 0.9425756931304932, "train/loss": 2.880929708480835, "uptime": 5321.259044569, "examples_seen": 28620800.0, "progress": 0.24821718781915225, "epoch": 22.339632538146862, "img/sec/core": 718.6448478262204, "core_hours_NVIDIA A100-SXM4-40GB": 11.200803221177788, "core_hours": 11.200803221177788} {"step": 28000, "global_schedule": 0.9259719848632812, "l2_grads": 1.2952818870544434, "l2_params": 331.6734924316406, "l2_updates": 0.9978919625282288, "train/loss": 2.7370827198028564, "uptime": 5330.222398861, "examples_seen": 28672000.0, "progress": 0.24866122572222765, "epoch": 22.379596102615817, "img/sec/core": 714.0184122490944, "core_hours_NVIDIA A100-SXM4-40GB": 11.220721786271122, "core_hours": 11.220721786271122} {"step": 28050, "global_schedule": 0.9255706071853638, "l2_grads": 1.3469526767730713, "l2_params": 331.67449951171875, "l2_updates": 0.9761357307434082, "train/loss": 2.678616523742676, "uptime": 5339.388170621001, "examples_seen": 28723200.0, "progress": 0.24910526362530305, "epoch": 22.419559667084776, "img/sec/core": 784.8673144333022, "core_hours_NVIDIA A100-SXM4-40GB": 11.238842329655567, "core_hours": 11.238842329655567} {"step": 28100, "global_schedule": 0.9251682758331299, "l2_grads": 1.1791375875473022, "l2_params": 331.66668701171875, "l2_updates": 0.9840726256370544, "train/loss": 2.8622918128967285, "uptime": 5348.257046378001, "examples_seen": 28774400.0, "progress": 0.24954930152837845, "epoch": 22.45952323155373, "img/sec/core": 721.6247217071162, "core_hours_NVIDIA A100-SXM4-40GB": 11.258550942448899, "core_hours": 11.258550942448899} {"step": 28150, "global_schedule": 0.9247649908065796, "l2_grads": 1.2678848505020142, "l2_params": 331.69671630859375, "l2_updates": 0.9880165457725525, "train/loss": 2.9301955699920654, "uptime": 5357.620008481001, "examples_seen": 28825600.0, "progress": 0.24999333943145388, "epoch": 22.499486796022687, "img/sec/core": 683.544366579215, "core_hours_NVIDIA A100-SXM4-40GB": 11.27935752490001, "core_hours": 11.27935752490001} {"step": 28200, "global_schedule": 0.9243606328964233, "l2_grads": 1.2951862812042236, "l2_params": 331.6994934082031, "l2_updates": 0.9809351563453674, "train/loss": 2.7728066444396973, "uptime": 5366.955650923001, "examples_seen": 28876800.0, "progress": 0.25043737733452925, "epoch": 22.539450360491646, "img/sec/core": 685.5446788757896, "core_hours_NVIDIA A100-SXM4-40GB": 11.300103396993343, "core_hours": 11.300103396993343} {"step": 28250, "global_schedule": 0.9239553213119507, "l2_grads": 1.2261875867843628, "l2_params": 331.6854248046875, "l2_updates": 0.9684610366821289, "train/loss": 3.031020164489746, "uptime": 5375.527350608001, "examples_seen": 28928000.0, "progress": 0.25088141523760465, "epoch": 22.5794139249606, "img/sec/core": 746.643050409153, "core_hours_NVIDIA A100-SXM4-40GB": 11.319151618515567, "core_hours": 11.319151618515567} {"step": 28300, "global_schedule": 0.9235490560531616, "l2_grads": 1.2830042839050293, "l2_params": 331.6732482910156, "l2_updates": 0.9452537894248962, "train/loss": 2.71745228767395, "uptime": 5384.395947458001, "examples_seen": 28979200.0, "progress": 0.2513254531406801, "epoch": 22.61937748942956, "img/sec/core": 721.6474159607783, "core_hours_NVIDIA A100-SXM4-40GB": 11.338859611515566, "core_hours": 11.338859611515566} {"step": 28350, "global_schedule": 0.9231417179107666, "l2_grads": 1.2959272861480713, "l2_params": 331.61529541015625, "l2_updates": 0.9880567789077759, "train/loss": 2.750375270843506, "uptime": 5392.804232755001, "examples_seen": 29030400.0, "progress": 0.2517694910437555, "epoch": 22.659341053898515, "img/sec/core": 761.154001551672, "core_hours_NVIDIA A100-SXM4-40GB": 11.357544689953345, "core_hours": 11.357544689953345} {"step": 28400, "global_schedule": 0.9227334260940552, "l2_grads": 1.1278657913208008, "l2_params": 331.58428955078125, "l2_updates": 0.9936946034431458, "train/loss": 3.1773571968078613, "uptime": 5402.138158803, "examples_seen": 29081600.0, "progress": 0.2522135289468309, "epoch": 22.699304618367474, "img/sec/core": 685.6707420959419, "core_hours_NVIDIA A100-SXM4-40GB": 11.378286747837786, "core_hours": 11.378286747837786} {"step": 28450, "global_schedule": 0.9223241806030273, "l2_grads": 1.2908380031585693, "l2_params": 331.5868225097656, "l2_updates": 0.9355329275131226, "train/loss": 2.7884254455566406, "uptime": 5411.438324196, "examples_seen": 29132800.0, "progress": 0.2526575668499063, "epoch": 22.73926818283643, "img/sec/core": 688.1598046435579, "core_hours_NVIDIA A100-SXM4-40GB": 11.398953782044455, "core_hours": 11.398953782044455} {"step": 28500, "global_schedule": 0.9219139218330383, "l2_grads": 1.3791972398757935, "l2_params": 331.54949951171875, "l2_updates": 0.9705172777175903, "train/loss": 2.8840341567993164, "uptime": 5419.953845223001, "examples_seen": 29184000.0, "progress": 0.2531016047529817, "epoch": 22.779231747305385, "img/sec/core": 751.5688094371816, "core_hours_NVIDIA A100-SXM4-40GB": 11.417877162104455, "core_hours": 11.417877162104455} {"step": 28550, "global_schedule": 0.9215026497840881, "l2_grads": 1.2801873683929443, "l2_params": 331.5528564453125, "l2_updates": 0.9656797647476196, "train/loss": 2.6915276050567627, "uptime": 5428.447951048001, "examples_seen": 29235200.0, "progress": 0.2535456426560571, "epoch": 22.819195311774344, "img/sec/core": 753.4636525439753, "core_hours_NVIDIA A100-SXM4-40GB": 11.436752952826678, "core_hours": 11.436752952826678} {"step": 28600, "global_schedule": 0.9210904240608215, "l2_grads": 1.409061074256897, "l2_params": 331.5465087890625, "l2_updates": 0.9271939992904663, "train/loss": 2.9772629737854004, "uptime": 5436.966469767001, "examples_seen": 29286400.0, "progress": 0.2539896805591325, "epoch": 22.8591588762433, "img/sec/core": 751.3043301443042, "core_hours_NVIDIA A100-SXM4-40GB": 11.455682994424455, "core_hours": 11.455682994424455} {"step": 28650, "global_schedule": 0.9206771850585938, "l2_grads": 1.3159602880477905, "l2_params": 331.5561828613281, "l2_updates": 0.968823254108429, "train/loss": 5.407463073730469, "uptime": 5445.427428137, "examples_seen": 29337600.0, "progress": 0.2544337184622079, "epoch": 22.899122440712258, "img/sec/core": 756.4154933906323, "core_hours_NVIDIA A100-SXM4-40GB": 11.474485124135564, "core_hours": 11.474485124135564} {"step": 28700, "global_schedule": 0.9202629327774048, "l2_grads": 1.256195306777954, "l2_params": 331.5488586425781, "l2_updates": 0.9529388546943665, "train/loss": 2.749631643295288, "uptime": 5454.305422372001, "examples_seen": 29388800.0, "progress": 0.2548777563652833, "epoch": 22.939086005181213, "img/sec/core": 720.8835498865594, "core_hours_NVIDIA A100-SXM4-40GB": 11.494214000213343, "core_hours": 11.494214000213343} {"step": 28750, "global_schedule": 0.9198477268218994, "l2_grads": 1.3078429698944092, "l2_params": 331.539306640625, "l2_updates": 0.9605544805526733, "train/loss": 2.750096082687378, "uptime": 5463.240737582, "examples_seen": 29440000.0, "progress": 0.25532179426835877, "epoch": 22.979049569650172, "img/sec/core": 716.2590070507977, "core_hours_NVIDIA A100-SXM4-40GB": 11.514070256235565, "core_hours": 11.514070256235565} {"step": 28800, "global_schedule": 0.9194315671920776, "l2_grads": 1.2666269540786743, "l2_params": 331.5519104003906, "l2_updates": 0.960898220539093, "train/loss": 2.6385974884033203, "uptime": 5472.806402257, "examples_seen": 29491200.0, "progress": 0.25576583217143417, "epoch": 23.019013134119128, "img/sec/core": 669.0596228746001, "core_hours_NVIDIA A100-SXM4-40GB": 11.535327288846675, "core_hours": 11.535327288846675} {"step": 28850, "global_schedule": 0.9190143942832947, "l2_grads": 1.3181469440460205, "l2_params": 331.54864501953125, "l2_updates": 0.9732121825218201, "train/loss": 2.8225412368774414, "uptime": 5482.102330215001, "examples_seen": 29542400.0, "progress": 0.25620987007450957, "epoch": 23.058976698588083, "img/sec/core": 688.4734938690646, "core_hours_NVIDIA A100-SXM4-40GB": 11.55598490653112, "core_hours": 11.55598490653112} {"step": 28900, "global_schedule": 0.9185962677001953, "l2_grads": 1.2108495235443115, "l2_params": 331.5397033691406, "l2_updates": 0.9571561217308044, "train/loss": 4.884877681732178, "uptime": 5491.413491942001, "examples_seen": 29593600.0, "progress": 0.25665390797758497, "epoch": 23.09894026305704, "img/sec/core": 687.3470988524696, "core_hours_NVIDIA A100-SXM4-40GB": 11.576676377035566, "core_hours": 11.576676377035566} {"step": 28950, "global_schedule": 0.9181771278381348, "l2_grads": 1.4487643241882324, "l2_params": 331.5438537597656, "l2_updates": 0.9563935399055481, "train/loss": 2.7321226596832275, "uptime": 5500.719804955001, "examples_seen": 29644800.0, "progress": 0.2570979458806604, "epoch": 23.138903827525997, "img/sec/core": 687.7052159174324, "core_hours_NVIDIA A100-SXM4-40GB": 11.59735707262001, "core_hours": 11.59735707262001} {"step": 29000, "global_schedule": 0.917756974697113, "l2_grads": 1.268523931503296, "l2_params": 331.5272216796875, "l2_updates": 0.9633695483207703, "train/loss": 3.1056630611419678, "uptime": 5509.99794902, "examples_seen": 29696000.0, "progress": 0.2575419837837358, "epoch": 23.178867391994956, "img/sec/core": 689.7931262075355, "core_hours_NVIDIA A100-SXM4-40GB": 11.61797517054223, "core_hours": 11.61797517054223} {"step": 29050, "global_schedule": 0.9173358678817749, "l2_grads": 0.9655831456184387, "l2_params": 331.5374755859375, "l2_updates": 0.9769328832626343, "train/loss": 3.9553918838500977, "uptime": 5518.846563103001, "examples_seen": 29747200.0, "progress": 0.2579860216868112, "epoch": 23.21883095646391, "img/sec/core": 781.444009119415, "core_hours_NVIDIA A100-SXM4-40GB": 11.636175095368896, "core_hours": 11.636175095368896} {"step": 29100, "global_schedule": 0.9169138073921204, "l2_grads": 1.305748462677002, "l2_params": 331.5854797363281, "l2_updates": 0.986219584941864, "train/loss": 2.7464089393615723, "uptime": 5527.123108475, "examples_seen": 29798400.0, "progress": 0.2584300595898866, "epoch": 23.258794520932867, "img/sec/core": 773.2694877324902, "core_hours_NVIDIA A100-SXM4-40GB": 11.654567418417782, "core_hours": 11.654567418417782} {"step": 29150, "global_schedule": 0.9164907932281494, "l2_grads": 1.108115315437317, "l2_params": 331.59722900390625, "l2_updates": 0.9315400719642639, "train/loss": 5.169492244720459, "uptime": 5535.639412994, "examples_seen": 29849600.0, "progress": 0.258874097492962, "epoch": 23.298758085401825, "img/sec/core": 751.4996658141293, "core_hours_NVIDIA A100-SXM4-40GB": 11.673492539571118, "core_hours": 11.673492539571118} {"step": 29200, "global_schedule": 0.9160667657852173, "l2_grads": 1.1581918001174927, "l2_params": 331.568603515625, "l2_updates": 0.9465153813362122, "train/loss": 3.4560461044311523, "uptime": 5544.026091343001, "examples_seen": 29900800.0, "progress": 0.25931813539603743, "epoch": 23.33872164987078, "img/sec/core": 763.1149942411027, "core_hours_NVIDIA A100-SXM4-40GB": 11.6921296025689, "core_hours": 11.6921296025689} {"step": 29250, "global_schedule": 0.9156417846679688, "l2_grads": 1.2041246891021729, "l2_params": 331.53204345703125, "l2_updates": 0.9480505585670471, "train/loss": 3.0534729957580566, "uptime": 5552.591849272001, "examples_seen": 29952000.0, "progress": 0.25976217329911283, "epoch": 23.37868521433974, "img/sec/core": 747.1609696478009, "core_hours_NVIDIA A100-SXM4-40GB": 11.711164620188898, "core_hours": 11.711164620188898} {"step": 29300, "global_schedule": 0.9152157306671143, "l2_grads": 1.1894469261169434, "l2_params": 331.5234680175781, "l2_updates": 0.9673287272453308, "train/loss": 3.4890804290771484, "uptime": 5561.132973233001, "examples_seen": 30003200.0, "progress": 0.26020621120218823, "epoch": 23.418648778808695, "img/sec/core": 749.3159014227074, "core_hours_NVIDIA A100-SXM4-40GB": 11.730144895657787, "core_hours": 11.730144895657787} {"step": 29350, "global_schedule": 0.9147888422012329, "l2_grads": 1.3858816623687744, "l2_params": 331.5024719238281, "l2_updates": 0.9427027106285095, "train/loss": 2.7448415756225586, "uptime": 5570.240715399001, "examples_seen": 30054400.0, "progress": 0.26065024910526363, "epoch": 23.458612343277654, "img/sec/core": 702.6988559131872, "core_hours_NVIDIA A100-SXM4-40GB": 11.75038432269334, "core_hours": 11.75038432269334} {"step": 29400, "global_schedule": 0.9143608808517456, "l2_grads": 1.2819530963897705, "l2_params": 331.4694519042969, "l2_updates": 0.9432705044746399, "train/loss": 2.9771430492401123, "uptime": 5578.83963654, "examples_seen": 30105600.0, "progress": 0.26109428700833903, "epoch": 23.49857590774661, "img/sec/core": 744.2794154123352, "core_hours_NVIDIA A100-SXM4-40GB": 11.769493036340007, "core_hours": 11.769493036340007} {"step": 29450, "global_schedule": 0.9139320254325867, "l2_grads": 0.9896727204322815, "l2_params": 331.4232177734375, "l2_updates": 0.9517384171485901, "train/loss": 4.375131607055664, "uptime": 5587.894609408, "examples_seen": 30156800.0, "progress": 0.26153832491141443, "epoch": 23.538539472215565, "img/sec/core": 706.7939455255058, "core_hours_NVIDIA A100-SXM4-40GB": 11.789615198268896, "core_hours": 11.789615198268896} {"step": 29500, "global_schedule": 0.9135022163391113, "l2_grads": 1.2745875120162964, "l2_params": 331.4161376953125, "l2_updates": 1.000480055809021, "train/loss": 2.774932384490967, "uptime": 5596.498549038, "examples_seen": 30208000.0, "progress": 0.26198236281448983, "epoch": 23.578503036684523, "img/sec/core": 743.8452935774284, "core_hours_NVIDIA A100-SXM4-40GB": 11.80873506411334, "core_hours": 11.80873506411334} {"step": 29550, "global_schedule": 0.91307133436203, "l2_grads": 1.3403072357177734, "l2_params": 331.4388122558594, "l2_updates": 0.9549969434738159, "train/loss": 2.5978455543518066, "uptime": 5605.595367806001, "examples_seen": 30259200.0, "progress": 0.26242640071756523, "epoch": 23.61846660115348, "img/sec/core": 703.5426519117531, "core_hours_NVIDIA A100-SXM4-40GB": 11.828950216931121, "core_hours": 11.828950216931121} {"step": 29600, "global_schedule": 0.9126394987106323, "l2_grads": 1.1440150737762451, "l2_params": 331.41546630859375, "l2_updates": 0.946311891078949, "train/loss": 3.657581090927124, "uptime": 5614.796240922, "examples_seen": 30310400.0, "progress": 0.26287043862064063, "epoch": 23.658430165622438, "img/sec/core": 695.5861600647042, "core_hours_NVIDIA A100-SXM4-40GB": 11.84939660163334, "core_hours": 11.84939660163334} {"step": 29650, "global_schedule": 0.912206768989563, "l2_grads": 1.243096113204956, "l2_params": 331.3771667480469, "l2_updates": 0.9927436709403992, "train/loss": 2.6729092597961426, "uptime": 5623.875579292, "examples_seen": 30361600.0, "progress": 0.2633144765237161, "epoch": 23.698393730091393, "img/sec/core": 704.8971785374564, "core_hours_NVIDIA A100-SXM4-40GB": 11.86957290912223, "core_hours": 11.86957290912223} {"step": 29700, "global_schedule": 0.9117730259895325, "l2_grads": 1.3028234243392944, "l2_params": 331.36859130859375, "l2_updates": 0.9316815137863159, "train/loss": 3.172865867614746, "uptime": 5632.9915511300005, "examples_seen": 30412800.0, "progress": 0.2637585144267915, "epoch": 23.738357294560352, "img/sec/core": 702.0644769130665, "core_hours_NVIDIA A100-SXM4-40GB": 11.889830624317785, "core_hours": 11.889830624317785} {"step": 29750, "global_schedule": 0.9113383293151855, "l2_grads": 1.2646621465682983, "l2_params": 331.3266296386719, "l2_updates": 0.9779416918754578, "train/loss": 2.8897335529327393, "uptime": 5642.169210758, "examples_seen": 30464000.0, "progress": 0.2642025523298669, "epoch": 23.778320859029307, "img/sec/core": 697.3455389949909, "core_hours_NVIDIA A100-SXM4-40GB": 11.910225423491118, "core_hours": 11.910225423491118} {"step": 29800, "global_schedule": 0.9109026789665222, "l2_grads": 1.2461885213851929, "l2_params": 331.2973327636719, "l2_updates": 0.9760584831237793, "train/loss": 2.700134515762329, "uptime": 5651.47123571, "examples_seen": 30515200.0, "progress": 0.2646465902329423, "epoch": 23.818284423498262, "img/sec/core": 688.0222352687047, "core_hours_NVIDIA A100-SXM4-40GB": 11.930896590051116, "core_hours": 11.930896590051116} {"step": 29850, "global_schedule": 0.9104660749435425, "l2_grads": 1.0687440633773804, "l2_params": 331.30377197265625, "l2_updates": 0.9518327713012695, "train/loss": 4.328219890594482, "uptime": 5660.402922125, "examples_seen": 30566400.0, "progress": 0.2650906281360177, "epoch": 23.85824798796722, "img/sec/core": 716.5500111212349, "core_hours_NVIDIA A100-SXM4-40GB": 11.95074478208445, "core_hours": 11.95074478208445} {"step": 29900, "global_schedule": 0.9100284576416016, "l2_grads": 1.282606601715088, "l2_params": 331.27960205078125, "l2_updates": 0.9804112315177917, "train/loss": 2.6604325771331787, "uptime": 5669.473420805001, "examples_seen": 30617600.0, "progress": 0.2655346660390931, "epoch": 23.898211552436177, "img/sec/core": 705.5841388424377, "core_hours_NVIDIA A100-SXM4-40GB": 11.970901445817788, "core_hours": 11.970901445817788} {"step": 29950, "global_schedule": 0.9095898866653442, "l2_grads": 1.3410300016403198, "l2_params": 331.2493896484375, "l2_updates": 0.9600368738174438, "train/loss": 2.6584079265594482, "uptime": 5678.505557265, "examples_seen": 30668800.0, "progress": 0.2659787039421685, "epoch": 23.938175116905136, "img/sec/core": 708.5809684501826, "core_hours_NVIDIA A100-SXM4-40GB": 11.99097286017334, "core_hours": 11.99097286017334} {"step": 30000, "global_schedule": 0.9091504216194153, "l2_grads": 1.2578949928283691, "l2_params": 331.2433166503906, "l2_updates": 0.9699970483779907, "train/loss": 2.906679153442383, "uptime": 5687.206953599001, "examples_seen": 30720000.0, "progress": 0.2664227418452439, "epoch": 23.97813868137409, "img/sec/core": 735.5141352418908, "core_hours_NVIDIA A100-SXM4-40GB": 12.01030929647112, "core_hours": 12.01030929647112, "val/acc@1": 0.58184, "val/loss": 1.77723853515625, "z/secs/eval/val": 2.5433849539986113} {"step": 30050, "global_schedule": 0.9087099432945251, "l2_grads": 1.2684485912322998, "l2_params": 331.2533264160156, "l2_updates": 0.9419035315513611, "train/loss": 2.6670727729797363, "uptime": 5699.320523145001, "examples_seen": 30771200.0, "progress": 0.2668667797483193, "epoch": 24.018102245843046, "img/sec/core": 719.7736598849307, "core_hours_NVIDIA A100-SXM4-40GB": 12.030068594448897, "core_hours": 12.030068594448897} {"step": 30100, "global_schedule": 0.9082685708999634, "l2_grads": 0.9510625600814819, "l2_params": 331.26593017578125, "l2_updates": 0.9366236329078674, "train/loss": 5.165399074554443, "uptime": 5708.1041905130005, "examples_seen": 30822400.0, "progress": 0.26731081765139475, "epoch": 24.058065810312005, "img/sec/core": 728.6250414395709, "core_hours_NVIDIA A100-SXM4-40GB": 12.049587855266674, "core_hours": 12.049587855266674} {"step": 30150, "global_schedule": 0.9078261852264404, "l2_grads": 1.029476523399353, "l2_params": 331.25836181640625, "l2_updates": 0.9638714790344238, "train/loss": 4.177816867828369, "uptime": 5716.642525222, "examples_seen": 30873600.0, "progress": 0.26775485555447015, "epoch": 24.09802937478096, "img/sec/core": 749.5606834497333, "core_hours_NVIDIA A100-SXM4-40GB": 12.068561932397785, "core_hours": 12.068561932397785} {"step": 30200, "global_schedule": 0.9073828458786011, "l2_grads": 1.2693393230438232, "l2_params": 331.249755859375, "l2_updates": 0.9585593938827515, "train/loss": 2.626664638519287, "uptime": 5725.528944891001, "examples_seen": 30924800.0, "progress": 0.26819889345754555, "epoch": 24.13799293924992, "img/sec/core": 720.200062385693, "core_hours_NVIDIA A100-SXM4-40GB": 12.08830953166223, "core_hours": 12.08830953166223} {"step": 30250, "global_schedule": 0.9069385528564453, "l2_grads": 1.173943042755127, "l2_params": 331.2236633300781, "l2_updates": 0.9379580616950989, "train/loss": 3.615175247192383, "uptime": 5734.359066058001, "examples_seen": 30976000.0, "progress": 0.26864293136062095, "epoch": 24.177956503718875, "img/sec/core": 724.7918662676783, "core_hours_NVIDIA A100-SXM4-40GB": 12.107932023144453, "core_hours": 12.107932023144453} {"step": 30300, "global_schedule": 0.9064933061599731, "l2_grads": 1.246029019355774, "l2_params": 331.2002868652344, "l2_updates": 0.9595797061920166, "train/loss": 3.029843330383301, "uptime": 5742.815716219, "examples_seen": 31027200.0, "progress": 0.26908696926369635, "epoch": 24.217920068187833, "img/sec/core": 756.8008464529036, "core_hours_NVIDIA A100-SXM4-40GB": 12.126724579057786, "core_hours": 12.126724579057786} {"step": 30350, "global_schedule": 0.9060471057891846, "l2_grads": 1.1119693517684937, "l2_params": 331.20654296875, "l2_updates": 0.9410160183906555, "train/loss": 4.4114885330200195, "uptime": 5751.118419566001, "examples_seen": 31078400.0, "progress": 0.26953100716677175, "epoch": 24.25788363265679, "img/sec/core": 770.8332735159023, "core_hours_NVIDIA A100-SXM4-40GB": 12.145175030940008, "core_hours": 12.145175030940008} {"step": 30400, "global_schedule": 0.9055999517440796, "l2_grads": 1.114874005317688, "l2_params": 331.21295166015625, "l2_updates": 0.946385383605957, "train/loss": 3.5175108909606934, "uptime": 5759.543442425, "examples_seen": 31129600.0, "progress": 0.26997504506984715, "epoch": 24.297847197125744, "img/sec/core": 759.6418558276056, "core_hours_NVIDIA A100-SXM4-40GB": 12.163897303960006, "core_hours": 12.163897303960006} {"step": 30450, "global_schedule": 0.9051518440246582, "l2_grads": 1.1806831359863281, "l2_params": 331.22003173828125, "l2_updates": 0.9530144929885864, "train/loss": 3.211442708969116, "uptime": 5767.955669049001, "examples_seen": 31180800.0, "progress": 0.27041908297292255, "epoch": 24.337810761594703, "img/sec/core": 760.7973829116852, "core_hours_NVIDIA A100-SXM4-40GB": 12.18259114090223, "core_hours": 12.18259114090223} {"step": 30500, "global_schedule": 0.9047027826309204, "l2_grads": 1.2433167695999146, "l2_params": 331.2152404785156, "l2_updates": 0.9548302292823792, "train/loss": 3.0872690677642822, "uptime": 5776.398987635001, "examples_seen": 31232000.0, "progress": 0.27086312087599795, "epoch": 24.37777432606366, "img/sec/core": 757.9957968910577, "core_hours_NVIDIA A100-SXM4-40GB": 12.201354071093341, "core_hours": 12.201354071093341} {"step": 30550, "global_schedule": 0.9042527675628662, "l2_grads": 1.0121499300003052, "l2_params": 331.2171325683594, "l2_updates": 0.9383712410926819, "train/loss": 4.680739402770996, "uptime": 5784.741110829, "examples_seen": 31283200.0, "progress": 0.27130715877907335, "epoch": 24.417737890532617, "img/sec/core": 767.1907799927658, "core_hours_NVIDIA A100-SXM4-40GB": 12.219892122635562, "core_hours": 12.219892122635562} {"step": 30600, "global_schedule": 0.9038017988204956, "l2_grads": 1.2329957485198975, "l2_params": 331.19415283203125, "l2_updates": 0.9679661989212036, "train/loss": 2.69707989692688, "uptime": 5793.09191334, "examples_seen": 31334400.0, "progress": 0.2717511966821488, "epoch": 24.457701455001573, "img/sec/core": 766.393408486111, "core_hours_NVIDIA A100-SXM4-40GB": 12.238449461548896, "core_hours": 12.238449461548896} {"step": 30650, "global_schedule": 0.9033499360084534, "l2_grads": 1.389711618423462, "l2_params": 331.1849670410156, "l2_updates": 0.9291092157363892, "train/loss": 2.674332618713379, "uptime": 5801.414672695, "examples_seen": 31385600.0, "progress": 0.2721952345852242, "epoch": 24.497665019470528, "img/sec/core": 768.9757359324716, "core_hours_NVIDIA A100-SXM4-40GB": 12.256944482337785, "core_hours": 12.256944482337785} {"step": 30700, "global_schedule": 0.9028971195220947, "l2_grads": 1.3043979406356812, "l2_params": 331.1828308105469, "l2_updates": 0.957569420337677, "train/loss": 2.8963685035705566, "uptime": 5809.664310807, "examples_seen": 31436800.0, "progress": 0.2726392724882996, "epoch": 24.537628583939487, "img/sec/core": 775.7916060209398, "core_hours_NVIDIA A100-SXM4-40GB": 12.275277011475563, "core_hours": 12.275277011475563} {"step": 30750, "global_schedule": 0.9024432897567749, "l2_grads": 1.3631181716918945, "l2_params": 331.16607666015625, "l2_updates": 0.9078194499015808, "train/loss": 3.102773666381836, "uptime": 5818.066830838001, "examples_seen": 31488000.0, "progress": 0.273083310391375, "epoch": 24.577592148408442, "img/sec/core": 761.6762562168874, "core_hours_NVIDIA A100-SXM4-40GB": 12.293949278211121, "core_hours": 12.293949278211121} {"step": 30800, "global_schedule": 0.9019886255264282, "l2_grads": 1.2955386638641357, "l2_params": 331.139404296875, "l2_updates": 0.9509032368659973, "train/loss": 2.6342077255249023, "uptime": 5827.011994548, "examples_seen": 31539200.0, "progress": 0.2735273482944504, "epoch": 24.6175557128774, "img/sec/core": 715.4704159126661, "core_hours_NVIDIA A100-SXM4-40GB": 12.313827419788897, "core_hours": 12.313827419788897} {"step": 30850, "global_schedule": 0.9015328884124756, "l2_grads": 1.1606327295303345, "l2_params": 331.1025695800781, "l2_updates": 0.9329034090042114, "train/loss": 3.5134289264678955, "uptime": 5835.891519697001, "examples_seen": 31590400.0, "progress": 0.2739713861975258, "epoch": 24.657519277346356, "img/sec/core": 720.7592627540506, "core_hours_NVIDIA A100-SXM4-40GB": 12.333559697897787, "core_hours": 12.333559697897787} {"step": 30900, "global_schedule": 0.9010763168334961, "l2_grads": 1.0121181011199951, "l2_params": 331.070556640625, "l2_updates": 0.9458595514297485, "train/loss": 5.256616592407227, "uptime": 5844.610016120001, "examples_seen": 31641600.0, "progress": 0.2744154241006012, "epoch": 24.697482841815315, "img/sec/core": 734.0715290214871, "core_hours_NVIDIA A100-SXM4-40GB": 12.352934134393342, "core_hours": 12.352934134393342} {"step": 30950, "global_schedule": 0.9006187915802002, "l2_grads": 1.2695122957229614, "l2_params": 331.03436279296875, "l2_updates": 0.9655933976173401, "train/loss": 2.718478202819824, "uptime": 5853.737676931001, "examples_seen": 31692800.0, "progress": 0.2748594620036766, "epoch": 24.73744640628427, "img/sec/core": 701.1654061780059, "core_hours_NVIDIA A100-SXM4-40GB": 12.373217825084454, "core_hours": 12.373217825084454} {"step": 31000, "global_schedule": 0.9001603126525879, "l2_grads": 1.322421669960022, "l2_params": 331.0113525390625, "l2_updates": 0.9321225881576538, "train/loss": 2.7542905807495117, "uptime": 5863.045130489001, "examples_seen": 31744000.0, "progress": 0.275303499906752, "epoch": 24.777409970753226, "img/sec/core": 687.6209438078901, "core_hours_NVIDIA A100-SXM4-40GB": 12.393901055213343, "core_hours": 12.393901055213343} {"step": 31050, "global_schedule": 0.8997008800506592, "l2_grads": 1.0912214517593384, "l2_params": 330.98583984375, "l2_updates": 0.9231020212173462, "train/loss": 4.562341213226318, "uptime": 5872.748375813, "examples_seen": 31795200.0, "progress": 0.27574753780982747, "epoch": 24.817373535222185, "img/sec/core": 730.8781869093987, "core_hours_NVIDIA A100-SXM4-40GB": 12.413360142208896, "core_hours": 12.413360142208896} {"step": 31100, "global_schedule": 0.8992404937744141, "l2_grads": 1.3476942777633667, "l2_params": 330.9546813964844, "l2_updates": 0.9530836343765259, "train/loss": 2.7011990547180176, "uptime": 5881.749411348001, "examples_seen": 31846400.0, "progress": 0.27619157571290287, "epoch": 24.85733709969114, "img/sec/core": 711.0293004747766, "core_hours_NVIDIA A100-SXM4-40GB": 12.433362443397787, "core_hours": 12.433362443397787} {"step": 31150, "global_schedule": 0.8987792134284973, "l2_grads": 1.3084754943847656, "l2_params": 330.9366760253906, "l2_updates": 0.9602074027061462, "train/loss": 2.709902048110962, "uptime": 5890.175488973, "examples_seen": 31897600.0, "progress": 0.27663561361597827, "epoch": 24.8973006641601, "img/sec/core": 759.5467647973954, "core_hours_NVIDIA A100-SXM4-40GB": 12.45208706034223, "core_hours": 12.45208706034223} {"step": 31200, "global_schedule": 0.8983169794082642, "l2_grads": 1.3578901290893555, "l2_params": 330.9425964355469, "l2_updates": 0.9387747645378113, "train/loss": 2.7079877853393555, "uptime": 5898.56834826, "examples_seen": 31948800.0, "progress": 0.27707965151905367, "epoch": 24.937264228629054, "img/sec/core": 762.5529966781868, "core_hours_NVIDIA A100-SXM4-40GB": 12.470737858757785, "core_hours": 12.470737858757785} {"step": 31250, "global_schedule": 0.8978537917137146, "l2_grads": 1.0959464311599731, "l2_params": 330.9012451171875, "l2_updates": 0.9033199548721313, "train/loss": 4.044647693634033, "uptime": 5906.899000342, "examples_seen": 32000000.0, "progress": 0.27752368942212907, "epoch": 24.977227793098013, "img/sec/core": 768.2471836542053, "core_hours_NVIDIA A100-SXM4-40GB": 12.489250418940008, "core_hours": 12.489250418940008} {"step": 31300, "global_schedule": 0.8973897099494934, "l2_grads": 1.326324701309204, "l2_params": 330.8712158203125, "l2_updates": 0.963725209236145, "train/loss": 2.5731201171875, "uptime": 5916.817760817001, "examples_seen": 32051200.0, "progress": 0.27796772732520447, "epoch": 25.01719135756697, "img/sec/core": 645.2419146657242, "core_hours_NVIDIA A100-SXM4-40GB": 12.511292108884453, "core_hours": 12.511292108884453} {"step": 31350, "global_schedule": 0.8969246745109558, "l2_grads": 1.216745376586914, "l2_params": 330.8455505371094, "l2_updates": 0.939562976360321, "train/loss": 3.0362303256988525, "uptime": 5925.905223495001, "examples_seen": 32102400.0, "progress": 0.2784117652282799, "epoch": 25.057154922035924, "img/sec/core": 704.2669914335393, "core_hours_NVIDIA A100-SXM4-40GB": 12.53148647039112, "core_hours": 12.53148647039112} {"step": 31400, "global_schedule": 0.8964587450027466, "l2_grads": 1.006169080734253, "l2_params": 330.8554992675781, "l2_updates": 0.9413229823112488, "train/loss": 4.901034832000732, "uptime": 5934.973373414001, "examples_seen": 32153600.0, "progress": 0.2788558031313553, "epoch": 25.097118486504883, "img/sec/core": 705.7668937068128, "core_hours_NVIDIA A100-SXM4-40GB": 12.551637914655565, "core_hours": 12.551637914655565} {"step": 31450, "global_schedule": 0.8959918022155762, "l2_grads": 1.3118950128555298, "l2_params": 330.79742431640625, "l2_updates": 0.9261803030967712, "train/loss": 2.6253836154937744, "uptime": 5943.475279725, "examples_seen": 32204800.0, "progress": 0.2792998410344307, "epoch": 25.137082050973838, "img/sec/core": 752.7723507985444, "core_hours_NVIDIA A100-SXM4-40GB": 12.570531039791119, "core_hours": 12.570531039791119} {"step": 31500, "global_schedule": 0.8955240249633789, "l2_grads": 1.4393234252929688, "l2_params": 330.80712890625, "l2_updates": 0.9363364577293396, "train/loss": 2.6476776599884033, "uptime": 5951.976734403001, "examples_seen": 32256000.0, "progress": 0.27974387893750613, "epoch": 25.177045615442797, "img/sec/core": 752.8123412292775, "core_hours_NVIDIA A100-SXM4-40GB": 12.589423161297786, "core_hours": 12.589423161297786} {"step": 31550, "global_schedule": 0.8950552940368652, "l2_grads": 1.174400806427002, "l2_params": 330.7937316894531, "l2_updates": 0.9343288540840149, "train/loss": 3.1766269207000732, "uptime": 5960.419978742, "examples_seen": 32307200.0, "progress": 0.28018791684058153, "epoch": 25.217009179911752, "img/sec/core": 758.0024624465942, "core_hours_NVIDIA A100-SXM4-40GB": 12.608185926495564, "core_hours": 12.608185926495564} {"step": 31600, "global_schedule": 0.8945856094360352, "l2_grads": 1.2598044872283936, "l2_params": 330.7993469238281, "l2_updates": 0.9646497368812561, "train/loss": 2.9169881343841553, "uptime": 5968.701326078, "examples_seen": 32358400.0, "progress": 0.28063195474365693, "epoch": 25.256972744380707, "img/sec/core": 772.8211051091047, "core_hours_NVIDIA A100-SXM4-40GB": 12.626588920575562, "core_hours": 12.626588920575562} {"step": 31650, "global_schedule": 0.8941149711608887, "l2_grads": 1.2673048973083496, "l2_params": 330.8053283691406, "l2_updates": 0.941179096698761, "train/loss": 2.919107437133789, "uptime": 5977.37812252, "examples_seen": 32409600.0, "progress": 0.28107599264673233, "epoch": 25.296936308849666, "img/sec/core": 737.5994173403803, "core_hours_NVIDIA A100-SXM4-40GB": 12.645870690446674, "core_hours": 12.645870690446674} {"step": 31700, "global_schedule": 0.8936434984207153, "l2_grads": 1.1668282747268677, "l2_params": 330.7878723144531, "l2_updates": 0.9343421459197998, "train/loss": 3.855564832687378, "uptime": 5985.953371629001, "examples_seen": 32460800.0, "progress": 0.28152003054980773, "epoch": 25.33689987331862, "img/sec/core": 746.3340036713928, "core_hours_NVIDIA A100-SXM4-40GB": 12.664926799577787, "core_hours": 12.664926799577787} {"step": 31750, "global_schedule": 0.8931710720062256, "l2_grads": 1.2632561922073364, "l2_params": 330.7646789550781, "l2_updates": 0.9257165193557739, "train/loss": 5.284734725952148, "uptime": 5994.459710834, "examples_seen": 32512000.0, "progress": 0.28196406845288313, "epoch": 25.37686343778758, "img/sec/core": 752.3800598309485, "core_hours_NVIDIA A100-SXM4-40GB": 12.683829775588896, "core_hours": 12.683829775588896} {"step": 31800, "global_schedule": 0.8926976919174194, "l2_grads": 1.520418643951416, "l2_params": 330.7279357910156, "l2_updates": 0.943343460559845, "train/loss": 2.7948968410491943, "uptime": 6002.829941454, "examples_seen": 32563200.0, "progress": 0.28240810635595853, "epoch": 25.416827002256536, "img/sec/core": 764.6145357940567, "core_hours_NVIDIA A100-SXM4-40GB": 12.702430288077784, "core_hours": 12.702430288077784} {"step": 31850, "global_schedule": 0.8922233581542969, "l2_grads": 1.0567197799682617, "l2_params": 330.67755126953125, "l2_updates": 0.9055452942848206, "train/loss": 4.2628607749938965, "uptime": 6011.141102703001, "examples_seen": 32614400.0, "progress": 0.28285214425903393, "epoch": 25.456790566725495, "img/sec/core": 770.0488305132103, "core_hours_NVIDIA A100-SXM4-40GB": 12.720899535297786, "core_hours": 12.720899535297786} {"step": 31900, "global_schedule": 0.8917481899261475, "l2_grads": 1.295037031173706, "l2_params": 330.6268310546875, "l2_updates": 0.9195305705070496, "train/loss": 2.977865695953369, "uptime": 6020.118630043, "examples_seen": 32665600.0, "progress": 0.28329618216210933, "epoch": 25.49675413119445, "img/sec/core": 712.891173439814, "core_hours_NVIDIA A100-SXM4-40GB": 12.74084959605334, "core_hours": 12.74084959605334} {"step": 31950, "global_schedule": 0.8912720680236816, "l2_grads": 1.3336496353149414, "l2_params": 330.607666015625, "l2_updates": 0.9734469056129456, "train/loss": 2.8693525791168213, "uptime": 6029.023179343001, "examples_seen": 32716800.0, "progress": 0.2837402200651848, "epoch": 25.536717695663405, "img/sec/core": 718.7337375962545, "core_hours_NVIDIA A100-SXM4-40GB": 12.760637483386677, "core_hours": 12.760637483386677} {"step": 32000, "global_schedule": 0.8907949924468994, "l2_grads": 0.9716811180114746, "l2_params": 330.5885925292969, "l2_updates": 0.9375808835029602, "train/loss": 5.220489978790283, "uptime": 6037.983227769, "examples_seen": 32768000.0, "progress": 0.2841842579682602, "epoch": 25.576681260132364, "img/sec/core": 714.2818538155834, "core_hours_NVIDIA A100-SXM4-40GB": 12.780548702111117, "core_hours": 12.780548702111117} {"step": 32050, "global_schedule": 0.8903170824050903, "l2_grads": 1.150171160697937, "l2_params": 330.54119873046875, "l2_updates": 0.9434139132499695, "train/loss": 3.5648179054260254, "uptime": 6047.157999619001, "examples_seen": 32819200.0, "progress": 0.2846282958713356, "epoch": 25.61664482460132, "img/sec/core": 783.2753919212242, "core_hours_NVIDIA A100-SXM4-40GB": 12.798706073540009, "core_hours": 12.798706073540009} {"step": 32100, "global_schedule": 0.8898382186889648, "l2_grads": 1.2645107507705688, "l2_params": 330.5304870605469, "l2_updates": 0.9312728047370911, "train/loss": 2.761930465698242, "uptime": 6055.694969049, "examples_seen": 32870400.0, "progress": 0.285072333774411, "epoch": 25.65660838907028, "img/sec/core": 749.6805573076596, "core_hours_NVIDIA A100-SXM4-40GB": 12.817677116717784, "core_hours": 12.817677116717784} {"step": 32150, "global_schedule": 0.889358401298523, "l2_grads": 1.300096035003662, "l2_params": 330.4957275390625, "l2_updates": 0.9507048726081848, "train/loss": 2.783764362335205, "uptime": 6064.5372612030005, "examples_seen": 32921600.0, "progress": 0.2855163716774864, "epoch": 25.696571953539234, "img/sec/core": 723.7942253586916, "core_hours_NVIDIA A100-SXM4-40GB": 12.837326654837785, "core_hours": 12.837326654837785} {"step": 32200, "global_schedule": 0.8888777494430542, "l2_grads": 1.3244056701660156, "l2_params": 330.4885559082031, "l2_updates": 0.9675166606903076, "train/loss": 2.8026340007781982, "uptime": 6073.419515213, "examples_seen": 32972800.0, "progress": 0.2859604095805618, "epoch": 25.736535518008193, "img/sec/core": 720.5378266367162, "core_hours_NVIDIA A100-SXM4-40GB": 12.857064997082226, "core_hours": 12.857064997082226} {"step": 32250, "global_schedule": 0.888396143913269, "l2_grads": 1.028518557548523, "l2_params": 330.5054931640625, "l2_updates": 0.9266319274902344, "train/loss": 5.134211540222168, "uptime": 6081.7615034400005, "examples_seen": 33024000.0, "progress": 0.2864044474836372, "epoch": 25.776499082477148, "img/sec/core": 767.2031925536427, "core_hours_NVIDIA A100-SXM4-40GB": 12.875602748697784, "core_hours": 12.875602748697784} {"step": 32300, "global_schedule": 0.8879135847091675, "l2_grads": 1.2999693155288696, "l2_params": 330.4534912109375, "l2_updates": 0.9294896721839905, "train/loss": 2.869201183319092, "uptime": 6090.0543228530005, "examples_seen": 33075200.0, "progress": 0.2868484853867126, "epoch": 25.816462646946103, "img/sec/core": 771.7520039043964, "core_hours_NVIDIA A100-SXM4-40GB": 12.894031236282228, "core_hours": 12.894031236282228} {"step": 32350, "global_schedule": 0.8874301910400391, "l2_grads": 1.1666511297225952, "l2_params": 330.443603515625, "l2_updates": 0.9320409893989563, "train/loss": 2.918037176132202, "uptime": 6098.5648062830005, "examples_seen": 33126400.0, "progress": 0.287292523289788, "epoch": 25.856426211415062, "img/sec/core": 752.0136843742123, "core_hours_NVIDIA A100-SXM4-40GB": 12.912943421682229, "core_hours": 12.912943421682229} {"step": 32400, "global_schedule": 0.8869458436965942, "l2_grads": 1.3010237216949463, "l2_params": 330.4074401855469, "l2_updates": 0.9006425142288208, "train/loss": 4.205506801605225, "uptime": 6107.087076638001, "examples_seen": 33177600.0, "progress": 0.28773656119286345, "epoch": 25.896389775884018, "img/sec/core": 750.9735942892946, "core_hours_NVIDIA A100-SXM4-40GB": 12.931881800248897, "core_hours": 12.931881800248897} {"step": 32450, "global_schedule": 0.8864606022834778, "l2_grads": 1.418347954750061, "l2_params": 330.3740539550781, "l2_updates": 0.9255721569061279, "train/loss": 2.826903820037842, "uptime": 6115.463895995001, "examples_seen": 33228800.0, "progress": 0.28818059909593885, "epoch": 25.936353340352976, "img/sec/core": 764.0131328189987, "core_hours_NVIDIA A100-SXM4-40GB": 12.950496954375561, "core_hours": 12.950496954375561} {"step": 32500, "global_schedule": 0.8859744668006897, "l2_grads": 1.298825740814209, "l2_params": 330.3592834472656, "l2_updates": 0.9320919513702393, "train/loss": 2.6712987422943115, "uptime": 6123.935651290001, "examples_seen": 33280000.0, "progress": 0.28862463699901425, "epoch": 25.976316904821932, "img/sec/core": 755.4514710519134, "core_hours_NVIDIA A100-SXM4-40GB": 12.96932307725334, "core_hours": 12.96932307725334, "val/acc@1": 0.5945, "val/loss": 1.7116277685546875, "z/secs/eval/val": 2.580461416999242} {"step": 32550, "global_schedule": 0.88548743724823, "l2_grads": 1.0685219764709473, "l2_params": 330.3229675292969, "l2_updates": 0.9346200227737427, "train/loss": 4.36828088760376, "uptime": 6135.615999081001, "examples_seen": 33331200.0, "progress": 0.28906867490208965, "epoch": 26.016280469290887, "img/sec/core": 703.4008645972336, "core_hours_NVIDIA A100-SXM4-40GB": 12.989542304920008, "core_hours": 12.989542304920008} {"step": 32600, "global_schedule": 0.8849994540214539, "l2_grads": 1.322339415550232, "l2_params": 330.3255615234375, "l2_updates": 0.9543071389198303, "train/loss": 2.5435357093811035, "uptime": 6144.264097207, "examples_seen": 33382400.0, "progress": 0.28951271280516505, "epoch": 26.056244033759846, "img/sec/core": 740.0471070927534, "core_hours_NVIDIA A100-SXM4-40GB": 13.008760300755563, "core_hours": 13.008760300755563} {"step": 32650, "global_schedule": 0.8845106363296509, "l2_grads": 1.0783839225769043, "l2_params": 330.31549072265625, "l2_updates": 0.8982784152030945, "train/loss": 4.539618492126465, "uptime": 6152.865217155, "examples_seen": 33433600.0, "progress": 0.28995675070824045, "epoch": 26.0962075982288, "img/sec/core": 744.0891463777632, "core_hours_NVIDIA A100-SXM4-40GB": 13.027873900640007, "core_hours": 13.027873900640007} {"step": 32700, "global_schedule": 0.8840208053588867, "l2_grads": 1.2988654375076294, "l2_params": 330.267578125, "l2_updates": 0.8992162942886353, "train/loss": 2.586474895477295, "uptime": 6161.958518527001, "examples_seen": 33484800.0, "progress": 0.29040078861131585, "epoch": 26.13617116269776, "img/sec/core": 703.8147904903344, "core_hours_NVIDIA A100-SXM4-40GB": 13.04808123702223, "core_hours": 13.04808123702223} {"step": 32750, "global_schedule": 0.8835301399230957, "l2_grads": 1.3484013080596924, "l2_params": 330.2240295410156, "l2_updates": 0.9393429756164551, "train/loss": 2.5509634017944336, "uptime": 6171.308379412001, "examples_seen": 33536000.0, "progress": 0.29084482651439125, "epoch": 26.176134727166716, "img/sec/core": 684.5021630500645, "core_hours_NVIDIA A100-SXM4-40GB": 13.068858705655565, "core_hours": 13.068858705655565} {"step": 32800, "global_schedule": 0.8830386400222778, "l2_grads": 1.4153157472610474, "l2_params": 330.1832275390625, "l2_updates": 0.9134005308151245, "train/loss": 2.7037885189056396, "uptime": 6180.533892391, "examples_seen": 33587200.0, "progress": 0.29128886441746665, "epoch": 26.216098291635674, "img/sec/core": 693.7283611836942, "core_hours_NVIDIA A100-SXM4-40GB": 13.089359845608895, "core_hours": 13.089359845608895} {"step": 32850, "global_schedule": 0.8825461864471436, "l2_grads": 1.3328170776367188, "l2_params": 330.1542053222656, "l2_updates": 0.908388614654541, "train/loss": 2.5790412425994873, "uptime": 6189.094842120001, "examples_seen": 33638400.0, "progress": 0.2917329023205421, "epoch": 26.25606185610463, "img/sec/core": 747.5806075954031, "core_hours_NVIDIA A100-SXM4-40GB": 13.108384178340009, "core_hours": 13.108384178340009} {"step": 32900, "global_schedule": 0.8820527791976929, "l2_grads": 1.4191974401474, "l2_params": 330.0967102050781, "l2_updates": 0.9356817007064819, "train/loss": 2.671783208847046, "uptime": 6197.388004815, "examples_seen": 33689600.0, "progress": 0.2921769402236175, "epoch": 26.296025420573585, "img/sec/core": 771.7200584837261, "core_hours_NVIDIA A100-SXM4-40GB": 13.12681342877334, "core_hours": 13.12681342877334} {"step": 32950, "global_schedule": 0.8815585374832153, "l2_grads": 1.1686931848526, "l2_params": 330.0544738769531, "l2_updates": 0.9061431884765625, "train/loss": 5.1182403564453125, "uptime": 6206.263312476001, "examples_seen": 33740800.0, "progress": 0.2926209781266929, "epoch": 26.335988985042544, "img/sec/core": 721.101762829277, "core_hours_NVIDIA A100-SXM4-40GB": 13.146536334686676, "core_hours": 13.146536334686676} {"step": 33000, "global_schedule": 0.8810634613037109, "l2_grads": 1.309906005859375, "l2_params": 330.0386657714844, "l2_updates": 0.9318941235542297, "train/loss": 2.6140458583831787, "uptime": 6215.183320636001, "examples_seen": 33792000.0, "progress": 0.2930650160297683, "epoch": 26.3759525495115, "img/sec/core": 717.4881328808699, "core_hours_NVIDIA A100-SXM4-40GB": 13.16635857504223, "core_hours": 13.16635857504223} {"step": 33050, "global_schedule": 0.8805674314498901, "l2_grads": 1.2267489433288574, "l2_params": 330.0144348144531, "l2_updates": 0.9077330231666565, "train/loss": 2.9326324462890625, "uptime": 6224.318521386, "examples_seen": 33843200.0, "progress": 0.2935090539328437, "epoch": 26.415916113980458, "img/sec/core": 758.1516158175832, "core_hours_NVIDIA A100-SXM4-40GB": 13.185117648986674, "core_hours": 13.185117648986674} {"step": 33100, "global_schedule": 0.8800704479217529, "l2_grads": 1.00348961353302, "l2_params": 329.9981689453125, "l2_updates": 0.9167025685310364, "train/loss": 4.806373119354248, "uptime": 6233.338401184001, "examples_seen": 33894400.0, "progress": 0.2939530918359191, "epoch": 26.455879678449413, "img/sec/core": 709.543823568285, "core_hours_NVIDIA A100-SXM4-40GB": 13.205161826315566, "core_hours": 13.205161826315566} {"step": 33150, "global_schedule": 0.8795726299285889, "l2_grads": 0.9673997163772583, "l2_params": 329.97906494140625, "l2_updates": 0.9226368069648743, "train/loss": 4.931368827819824, "uptime": 6243.061308575001, "examples_seen": 33945600.0, "progress": 0.2943971297389945, "epoch": 26.49584324291837, "img/sec/core": 658.2393251964922, "core_hours_NVIDIA A100-SXM4-40GB": 13.226768287184456, "core_hours": 13.226768287184456} {"step": 33200, "global_schedule": 0.879073977470398, "l2_grads": 1.3729513883590698, "l2_params": 329.9634704589844, "l2_updates": 0.9348542094230652, "train/loss": 2.6871604919433594, "uptime": 6252.190810671, "examples_seen": 33996800.0, "progress": 0.2948411676420699, "epoch": 26.535806807387328, "img/sec/core": 701.023991527968, "core_hours_NVIDIA A100-SXM4-40GB": 13.247056069620008, "core_hours": 13.247056069620008} {"step": 33250, "global_schedule": 0.8785743713378906, "l2_grads": 1.386203646659851, "l2_params": 329.9380187988281, "l2_updates": 0.9269636273384094, "train/loss": 2.6622772216796875, "uptime": 6261.0998840190005, "examples_seen": 34048000.0, "progress": 0.2952852055451453, "epoch": 26.575770371856283, "img/sec/core": 718.368762946177, "core_hours_NVIDIA A100-SXM4-40GB": 13.266854010393342, "core_hours": 13.266854010393342} {"step": 33300, "global_schedule": 0.8780738711357117, "l2_grads": 1.2723430395126343, "l2_params": 329.9171142578125, "l2_updates": 0.9406898021697998, "train/loss": 2.7068915367126465, "uptime": 6270.193798381, "examples_seen": 34099200.0, "progress": 0.2957292434482207, "epoch": 26.615733936325242, "img/sec/core": 703.7673487165509, "core_hours_NVIDIA A100-SXM4-40GB": 13.287062708975563, "core_hours": 13.287062708975563} {"step": 33350, "global_schedule": 0.8775725364685059, "l2_grads": 1.410891056060791, "l2_params": 329.8724060058594, "l2_updates": 0.8958142399787903, "train/loss": 3.061373472213745, "uptime": 6279.742081578001, "examples_seen": 34150400.0, "progress": 0.29617328135129617, "epoch": 26.655697500794197, "img/sec/core": 670.2775638253638, "core_hours_NVIDIA A100-SXM4-40GB": 13.308281116080009, "core_hours": 13.308281116080009} {"step": 33400, "global_schedule": 0.8770702481269836, "l2_grads": 1.3424068689346313, "l2_params": 329.81982421875, "l2_updates": 0.9162313342094421, "train/loss": 2.645172595977783, "uptime": 6288.861157613001, "examples_seen": 34201600.0, "progress": 0.29661731925437157, "epoch": 26.695661065263156, "img/sec/core": 701.8254892750191, "core_hours_NVIDIA A100-SXM4-40GB": 13.32854572949112, "core_hours": 13.32854572949112} {"step": 33450, "global_schedule": 0.8765671253204346, "l2_grads": 1.2494995594024658, "l2_params": 329.7916564941406, "l2_updates": 0.9408630728721619, "train/loss": 2.594249963760376, "uptime": 6297.285719532001, "examples_seen": 34252800.0, "progress": 0.29706135715744697, "epoch": 26.73562462973211, "img/sec/core": 759.6834187384385, "core_hours_NVIDIA A100-SXM4-40GB": 13.34726697820001, "core_hours": 13.34726697820001} {"step": 33500, "global_schedule": 0.8760631084442139, "l2_grads": 1.3206498622894287, "l2_params": 329.766845703125, "l2_updates": 0.9225560426712036, "train/loss": 2.7798333168029785, "uptime": 6305.773655555, "examples_seen": 34304000.0, "progress": 0.29750539506052237, "epoch": 26.775588194201067, "img/sec/core": 754.011338287496, "core_hours_NVIDIA A100-SXM4-40GB": 13.366129058251119, "core_hours": 13.366129058251119} {"step": 33550, "global_schedule": 0.8755581974983215, "l2_grads": 1.3331117630004883, "l2_params": 329.7218322753906, "l2_updates": 0.9056981205940247, "train/loss": 2.6399333477020264, "uptime": 6314.418434641, "examples_seen": 34355200.0, "progress": 0.29794943296359777, "epoch": 26.815551758670026, "img/sec/core": 740.3312376558575, "core_hours_NVIDIA A100-SXM4-40GB": 13.38533967844223, "core_hours": 13.38533967844223} {"step": 33600, "global_schedule": 0.8750523924827576, "l2_grads": 1.13382887840271, "l2_params": 329.6744079589844, "l2_updates": 0.9340558052062988, "train/loss": 3.9211225509643555, "uptime": 6323.543152097, "examples_seen": 34406400.0, "progress": 0.29839347086667317, "epoch": 26.85551532313898, "img/sec/core": 701.3915807104866, "core_hours_NVIDIA A100-SXM4-40GB": 13.405616828344451, "core_hours": 13.405616828344451} {"step": 33650, "global_schedule": 0.8745457530021667, "l2_grads": 1.29324471950531, "l2_params": 329.67388916015625, "l2_updates": 0.9244771003723145, "train/loss": 2.836935043334961, "uptime": 6332.492724799, "examples_seen": 34457600.0, "progress": 0.29883750876974857, "epoch": 26.89547888760794, "img/sec/core": 715.1179406106788, "core_hours_NVIDIA A100-SXM4-40GB": 13.42550476768223, "core_hours": 13.42550476768223} {"step": 33700, "global_schedule": 0.8740382194519043, "l2_grads": 1.3318525552749634, "l2_params": 329.6948547363281, "l2_updates": 0.9192933440208435, "train/loss": 2.702097177505493, "uptime": 6341.043362766, "examples_seen": 34508800.0, "progress": 0.299281546672824, "epoch": 26.935442452076895, "img/sec/core": 748.4821629332838, "core_hours_NVIDIA A100-SXM4-40GB": 13.444506185386675, "core_hours": 13.444506185386675} {"step": 33750, "global_schedule": 0.8735297918319702, "l2_grads": 1.0891599655151367, "l2_params": 329.6424560546875, "l2_updates": 0.916965901851654, "train/loss": 3.9417576789855957, "uptime": 6349.525739964001, "examples_seen": 34560000.0, "progress": 0.2997255845758994, "epoch": 26.975406016545854, "img/sec/core": 754.5054706489979, "core_hours_NVIDIA A100-SXM4-40GB": 13.463355912493345, "core_hours": 13.463355912493345} {"step": 33800, "global_schedule": 0.8730204701423645, "l2_grads": 1.3116075992584229, "l2_params": 329.6088562011719, "l2_updates": 0.9131090641021729, "train/loss": 2.653852939605713, "uptime": 6358.796824994, "examples_seen": 34611200.0, "progress": 0.30016962247897483, "epoch": 27.01536958101481, "img/sec/core": 690.3183369898002, "core_hours_NVIDIA A100-SXM4-40GB": 13.48395832367112, "core_hours": 13.48395832367112} {"step": 33850, "global_schedule": 0.8725103139877319, "l2_grads": 1.2566542625427246, "l2_params": 329.5899353027344, "l2_updates": 0.9371537566184998, "train/loss": 3.030184745788574, "uptime": 6367.263710428, "examples_seen": 34662400.0, "progress": 0.30061366038205023, "epoch": 27.055333145483765, "img/sec/core": 755.8859807291173, "core_hours_NVIDIA A100-SXM4-40GB": 13.502773624635564, "core_hours": 13.502773624635564} {"step": 33900, "global_schedule": 0.8719992637634277, "l2_grads": 1.1640076637268066, "l2_params": 329.5509948730469, "l2_updates": 0.8800769448280334, "train/loss": 4.783669471740723, "uptime": 6375.691407407001, "examples_seen": 34713600.0, "progress": 0.30105769828512563, "epoch": 27.095296709952724, "img/sec/core": 759.4008204076206, "core_hours_NVIDIA A100-SXM4-40GB": 13.521501840144454, "core_hours": 13.521501840144454} {"step": 33950, "global_schedule": 0.8714873790740967, "l2_grads": 1.293742299079895, "l2_params": 329.5135803222656, "l2_updates": 0.907363772392273, "train/loss": 5.15319299697876, "uptime": 6384.144278359001, "examples_seen": 34764800.0, "progress": 0.30150173618820103, "epoch": 27.13526027442168, "img/sec/core": 757.1392058795967, "core_hours_NVIDIA A100-SXM4-40GB": 13.540285997815566, "core_hours": 13.540285997815566} {"step": 34000, "global_schedule": 0.870974600315094, "l2_grads": 1.3198914527893066, "l2_params": 329.4865417480469, "l2_updates": 0.9124695658683777, "train/loss": 2.7207958698272705, "uptime": 6392.675184776001, "examples_seen": 34816000.0, "progress": 0.30194577409127643, "epoch": 27.175223838890638, "img/sec/core": 750.2133638749854, "core_hours_NVIDIA A100-SXM4-40GB": 13.559243567631121, "core_hours": 13.559243567631121} {"step": 34050, "global_schedule": 0.8704609274864197, "l2_grads": 1.333189606666565, "l2_params": 329.4450988769531, "l2_updates": 0.910347580909729, "train/loss": 2.706909418106079, "uptime": 6402.193915278, "examples_seen": 34867200.0, "progress": 0.30238981199435183, "epoch": 27.215187403359593, "img/sec/core": 724.6605384887969, "core_hours_NVIDIA A100-SXM4-40GB": 13.57886961523112, "core_hours": 13.57886961523112} {"step": 34100, "global_schedule": 0.8699464201927185, "l2_grads": 1.0459063053131104, "l2_params": 329.39337158203125, "l2_updates": 0.9126282334327698, "train/loss": 4.257388591766357, "uptime": 6411.312890248, "examples_seen": 34918400.0, "progress": 0.30283384989742723, "epoch": 27.25515096782855, "img/sec/core": 701.8332675607238, "core_hours_NVIDIA A100-SXM4-40GB": 13.599134004053344, "core_hours": 13.599134004053344} {"step": 34150, "global_schedule": 0.8694310188293457, "l2_grads": 1.0091187953948975, "l2_params": 329.37774658203125, "l2_updates": 0.9241225719451904, "train/loss": 4.797058582305908, "uptime": 6419.853841639, "examples_seen": 34969600.0, "progress": 0.30327788780050263, "epoch": 27.295114532297507, "img/sec/core": 749.3310413572952, "core_hours_NVIDIA A100-SXM4-40GB": 13.618113896033345, "core_hours": 13.618113896033345} {"step": 34200, "global_schedule": 0.868914783000946, "l2_grads": 1.1189939975738525, "l2_params": 329.350830078125, "l2_updates": 0.9385722875595093, "train/loss": 3.795355796813965, "uptime": 6428.177898274, "examples_seen": 35020800.0, "progress": 0.30372192570357803, "epoch": 27.335078096766463, "img/sec/core": 768.8558933021152, "core_hours_NVIDIA A100-SXM4-40GB": 13.636611799666674, "core_hours": 13.636611799666674} {"step": 34250, "global_schedule": 0.8683977127075195, "l2_grads": 1.289725422859192, "l2_params": 329.3387451171875, "l2_updates": 0.9177570343017578, "train/loss": 2.6664435863494873, "uptime": 6437.22883853, "examples_seen": 35072000.0, "progress": 0.3041659636066535, "epoch": 27.37504166123542, "img/sec/core": 707.1088548791683, "core_hours_NVIDIA A100-SXM4-40GB": 13.656725000235564, "core_hours": 13.656725000235564} {"step": 34300, "global_schedule": 0.8678796887397766, "l2_grads": 1.3464728593826294, "l2_params": 329.2718505859375, "l2_updates": 0.8926376104354858, "train/loss": 2.6871988773345947, "uptime": 6446.406013256001, "examples_seen": 35123200.0, "progress": 0.3046100015097289, "epoch": 27.415005225704377, "img/sec/core": 697.3823852200875, "core_hours_NVIDIA A100-SXM4-40GB": 13.6771187218489, "core_hours": 13.6771187218489} {"step": 34350, "global_schedule": 0.8673608303070068, "l2_grads": 1.2874255180358887, "l2_params": 329.2210998535156, "l2_updates": 0.9325447678565979, "train/loss": 2.6445562839508057, "uptime": 6455.506704401001, "examples_seen": 35174400.0, "progress": 0.3050540394128043, "epoch": 27.454968790173336, "img/sec/core": 703.2432919686487, "core_hours_NVIDIA A100-SXM4-40GB": 13.697342479948901, "core_hours": 13.697342479948901} {"step": 34400, "global_schedule": 0.8668411374092102, "l2_grads": 1.1743780374526978, "l2_params": 329.2160949707031, "l2_updates": 0.8989414572715759, "train/loss": 4.949682235717773, "uptime": 6464.379783433, "examples_seen": 35225600.0, "progress": 0.3054980773158797, "epoch": 27.49493235464229, "img/sec/core": 721.2828801501571, "core_hours_NVIDIA A100-SXM4-40GB": 13.717060433353343, "core_hours": 13.717060433353343} {"step": 34450, "global_schedule": 0.8663206100463867, "l2_grads": 1.114532709121704, "l2_params": 329.1761474609375, "l2_updates": 0.9055442214012146, "train/loss": 3.4222640991210938, "uptime": 6472.849350385, "examples_seen": 35276800.0, "progress": 0.3059421152189551, "epoch": 27.534895919111246, "img/sec/core": 755.6466624882456, "core_hours_NVIDIA A100-SXM4-40GB": 13.735881693246677, "core_hours": 13.735881693246677} {"step": 34500, "global_schedule": 0.8657991886138916, "l2_grads": 1.3352235555648804, "l2_params": 329.1468505859375, "l2_updates": 0.9234556555747986, "train/loss": 2.645737648010254, "uptime": 6481.306904962001, "examples_seen": 35328000.0, "progress": 0.3063861531220305, "epoch": 27.574859483580205, "img/sec/core": 756.7199172919679, "core_hours_NVIDIA A100-SXM4-40GB": 13.754676258973346, "core_hours": 13.754676258973346} {"step": 34550, "global_schedule": 0.8652769327163696, "l2_grads": 1.3914655447006226, "l2_params": 329.1185302734375, "l2_updates": 0.9050946831703186, "train/loss": 2.626962423324585, "uptime": 6489.823263582, "examples_seen": 35379200.0, "progress": 0.3068301910251059, "epoch": 27.61482304804916, "img/sec/core": 751.4948918391428, "core_hours_NVIDIA A100-SXM4-40GB": 13.773601500351123, "core_hours": 13.773601500351123} {"step": 34600, "global_schedule": 0.8647537231445312, "l2_grads": 1.059884786605835, "l2_params": 329.0451965332031, "l2_updates": 0.8990323543548584, "train/loss": 5.111181735992432, "uptime": 6498.958431243, "examples_seen": 35430400.0, "progress": 0.3072742289281813, "epoch": 27.65478661251812, "img/sec/core": 700.5892215118809, "core_hours_NVIDIA A100-SXM4-40GB": 13.79390187293112, "core_hours": 13.79390187293112} {"step": 34650, "global_schedule": 0.8642297387123108, "l2_grads": 1.3753567934036255, "l2_params": 328.9957275390625, "l2_updates": 0.891202449798584, "train/loss": 2.799531936645508, "uptime": 6508.288811722001, "examples_seen": 35481600.0, "progress": 0.3077182668312567, "epoch": 27.694750176987075, "img/sec/core": 685.9312987721936, "core_hours_NVIDIA A100-SXM4-40GB": 13.814636051773345, "core_hours": 13.814636051773345} {"step": 34700, "global_schedule": 0.8637049198150635, "l2_grads": 1.2661441564559937, "l2_params": 328.9250793457031, "l2_updates": 0.9083899259567261, "train/loss": 2.647636890411377, "uptime": 6517.223779811, "examples_seen": 35532800.0, "progress": 0.30816230473433215, "epoch": 27.734713741456034, "img/sec/core": 716.2868335120089, "core_hours_NVIDIA A100-SXM4-40GB": 13.834491536415564, "core_hours": 13.834491536415564} {"step": 34750, "global_schedule": 0.8631792068481445, "l2_grads": 1.113674283027649, "l2_params": 328.89947509765625, "l2_updates": 0.8825015425682068, "train/loss": 5.211585998535156, "uptime": 6526.324869948001, "examples_seen": 35584000.0, "progress": 0.30860634263740755, "epoch": 27.77467730592499, "img/sec/core": 703.2124617665833, "core_hours_NVIDIA A100-SXM4-40GB": 13.854716181164457, "core_hours": 13.854716181164457} {"step": 34800, "global_schedule": 0.8626526594161987, "l2_grads": 1.2703131437301636, "l2_params": 328.8225402832031, "l2_updates": 0.8646847605705261, "train/loss": 5.184108257293701, "uptime": 6535.314787485, "examples_seen": 35635200.0, "progress": 0.30905038054048295, "epoch": 27.814640870393944, "img/sec/core": 711.9086436176916, "core_hours_NVIDIA A100-SXM4-40GB": 13.87469377569112, "core_hours": 13.87469377569112} {"step": 34850, "global_schedule": 0.8621252775192261, "l2_grads": 1.0727835893630981, "l2_params": 328.7851257324219, "l2_updates": 0.9128261804580688, "train/loss": 4.140682220458984, "uptime": 6544.366014125, "examples_seen": 35686400.0, "progress": 0.30949441844355835, "epoch": 27.854604434862903, "img/sec/core": 707.0864817058578, "core_hours_NVIDIA A100-SXM4-40GB": 13.894807612668899, "core_hours": 13.894807612668899} {"step": 34900, "global_schedule": 0.8615970611572266, "l2_grads": 1.218772292137146, "l2_params": 328.78826904296875, "l2_updates": 0.8927362561225891, "train/loss": 5.200666904449463, "uptime": 6553.120134897001, "examples_seen": 35737600.0, "progress": 0.30993845634663375, "epoch": 27.89456799933186, "img/sec/core": 731.0842706751282, "core_hours_NVIDIA A100-SXM4-40GB": 13.914261214384455, "core_hours": 13.914261214384455} {"step": 34950, "global_schedule": 0.8610678911209106, "l2_grads": 1.0286451578140259, "l2_params": 328.7382507324219, "l2_updates": 0.8939595222473145, "train/loss": 4.4699296951293945, "uptime": 6561.441717373, "examples_seen": 35788800.0, "progress": 0.31038249424970915, "epoch": 27.934531563800817, "img/sec/core": 769.084488251931, "core_hours_NVIDIA A100-SXM4-40GB": 13.932753619886677, "core_hours": 13.932753619886677} {"step": 35000, "global_schedule": 0.8605380058288574, "l2_grads": 1.2606922388076782, "l2_params": 328.70458984375, "l2_updates": 0.8842840790748596, "train/loss": 4.518494129180908, "uptime": 6569.7994674950005, "examples_seen": 35840000.0, "progress": 0.31082653215278455, "epoch": 27.974495128269773, "img/sec/core": 765.7563227635702, "core_hours_NVIDIA A100-SXM4-40GB": 13.951326397935565, "core_hours": 13.951326397935565, "val/acc@1": 0.60492, "val/loss": 1.6615794287109376, "z/secs/eval/val": 3.8828099640013534} {"step": 35050, "global_schedule": 0.8600071668624878, "l2_grads": 1.5649646520614624, "l2_params": 328.6678466796875, "l2_updates": 0.8716328144073486, "train/loss": 2.4467344284057617, "uptime": 6583.651778267, "examples_seen": 35891200.0, "progress": 0.31127057005585995, "epoch": 28.014458692738728, "img/sec/core": 714.6692347509484, "core_hours_NVIDIA A100-SXM4-40GB": 13.971226823937782, "core_hours": 13.971226823937782} {"step": 35100, "global_schedule": 0.8594756126403809, "l2_grads": 1.3701660633087158, "l2_params": 328.6328125, "l2_updates": 0.8771377205848694, "train/loss": 2.5443880558013916, "uptime": 6592.063615524001, "examples_seen": 35942400.0, "progress": 0.31171460795893535, "epoch": 28.054422257207687, "img/sec/core": 760.8325986898275, "core_hours_NVIDIA A100-SXM4-40GB": 13.989919795620008, "core_hours": 13.989919795620008} {"step": 35150, "global_schedule": 0.8589431047439575, "l2_grads": 1.4392799139022827, "l2_params": 328.5922546386719, "l2_updates": 0.9050135016441345, "train/loss": 2.5767252445220947, "uptime": 6600.274860006, "examples_seen": 35993600.0, "progress": 0.3121586458620108, "epoch": 28.094385821676642, "img/sec/core": 779.4190045162958, "core_hours_NVIDIA A100-SXM4-40GB": 14.008167005580008, "core_hours": 14.008167005580008} {"step": 35200, "global_schedule": 0.8584098219871521, "l2_grads": 1.2949098348617554, "l2_params": 328.5458984375, "l2_updates": 0.8998724818229675, "train/loss": 3.698287010192871, "uptime": 6608.843565949001, "examples_seen": 36044800.0, "progress": 0.3126026837650862, "epoch": 28.1343493861456, "img/sec/core": 746.9039132131967, "core_hours_NVIDIA A100-SXM4-40GB": 14.02720857434223, "core_hours": 14.02720857434223} {"step": 35250, "global_schedule": 0.857875645160675, "l2_grads": 1.3359886407852173, "l2_params": 328.4903259277344, "l2_updates": 0.9062326550483704, "train/loss": 3.1485846042633057, "uptime": 6617.35053541, "examples_seen": 36096000.0, "progress": 0.3130467216681616, "epoch": 28.174312950614556, "img/sec/core": 752.3243182359143, "core_hours_NVIDIA A100-SXM4-40GB": 14.046112950922229, "core_hours": 14.046112950922229} {"step": 35300, "global_schedule": 0.8573406338691711, "l2_grads": 1.3967711925506592, "l2_params": 328.45257568359375, "l2_updates": 0.8806872367858887, "train/loss": 2.465719223022461, "uptime": 6625.820913498001, "examples_seen": 36147200.0, "progress": 0.313490759571237, "epoch": 28.214276515083515, "img/sec/core": 755.5743006402788, "core_hours_NVIDIA A100-SXM4-40GB": 14.064936013340008, "core_hours": 14.064936013340008} {"step": 35350, "global_schedule": 0.8568048477172852, "l2_grads": 1.2878657579421997, "l2_params": 328.4165344238281, "l2_updates": 0.896760106086731, "train/loss": 2.5429372787475586, "uptime": 6634.3282568800005, "examples_seen": 36198400.0, "progress": 0.3139347974743124, "epoch": 28.25424007955247, "img/sec/core": 752.2912515252858, "core_hours_NVIDIA A100-SXM4-40GB": 14.083841220855563, "core_hours": 14.083841220855563} {"step": 35400, "global_schedule": 0.8562681674957275, "l2_grads": 1.1455276012420654, "l2_params": 328.39044189453125, "l2_updates": 0.9188438057899475, "train/loss": 3.5789988040924072, "uptime": 6642.786021808, "examples_seen": 36249600.0, "progress": 0.3143788353773878, "epoch": 28.294203644021426, "img/sec/core": 756.7010970962789, "core_hours_NVIDIA A100-SXM4-40GB": 14.102636254028896, "core_hours": 14.102636254028896} {"step": 35450, "global_schedule": 0.8557306528091431, "l2_grads": 1.055121898651123, "l2_params": 328.36639404296875, "l2_updates": 0.8934666514396667, "train/loss": 4.681249618530273, "uptime": 6651.118670874001, "examples_seen": 36300800.0, "progress": 0.3148228732804632, "epoch": 28.334167208490385, "img/sec/core": 768.0630672560089, "core_hours_NVIDIA A100-SXM4-40GB": 14.12115325195334, "core_hours": 14.12115325195334} {"step": 35500, "global_schedule": 0.8551923036575317, "l2_grads": 1.3473331928253174, "l2_params": 328.3343811035156, "l2_updates": 0.9140232801437378, "train/loss": 2.6043310165405273, "uptime": 6659.476473426001, "examples_seen": 36352000.0, "progress": 0.3152669111835386, "epoch": 28.37413077295934, "img/sec/core": 765.751519036358, "core_hours_NVIDIA A100-SXM4-40GB": 14.139726146513341, "core_hours": 14.139726146513341} {"step": 35550, "global_schedule": 0.8546531200408936, "l2_grads": 1.088971734046936, "l2_params": 328.3106384277344, "l2_updates": 0.8867331147193909, "train/loss": 5.073491096496582, "uptime": 6667.906570721001, "examples_seen": 36403200.0, "progress": 0.315710949086614, "epoch": 28.4140943374283, "img/sec/core": 759.1845949151241, "core_hours_NVIDIA A100-SXM4-40GB": 14.158459696057786, "core_hours": 14.158459696057786} {"step": 35600, "global_schedule": 0.8541131615638733, "l2_grads": 1.2128429412841797, "l2_params": 328.2693176269531, "l2_updates": 0.8781655430793762, "train/loss": 3.194309711456299, "uptime": 6677.199688821, "examples_seen": 36454400.0, "progress": 0.3161549869896894, "epoch": 28.454057901897254, "img/sec/core": 688.6816600341072, "core_hours_NVIDIA A100-SXM4-40GB": 14.179111069613338, "core_hours": 14.179111069613338} {"step": 35650, "global_schedule": 0.8535723686218262, "l2_grads": 1.1709879636764526, "l2_params": 328.2481384277344, "l2_updates": 0.883901834487915, "train/loss": 5.036127090454102, "uptime": 6686.295410884, "examples_seen": 36505600.0, "progress": 0.31659902489276487, "epoch": 28.49402146636621, "img/sec/core": 703.6274806629931, "core_hours_NVIDIA A100-SXM4-40GB": 14.199323785308897, "core_hours": 14.199323785308897} {"step": 35700, "global_schedule": 0.8530306816101074, "l2_grads": 1.2619478702545166, "l2_params": 328.1827392578125, "l2_updates": 0.8907727003097534, "train/loss": 3.272355318069458, "uptime": 6694.952500295001, "examples_seen": 36556800.0, "progress": 0.31704306279584027, "epoch": 28.53398503083517, "img/sec/core": 739.2784914370011, "core_hours_NVIDIA A100-SXM4-40GB": 14.218561761777787, "core_hours": 14.218561761777787} {"step": 35750, "global_schedule": 0.8524881601333618, "l2_grads": 1.3799611330032349, "l2_params": 328.1618957519531, "l2_updates": 0.8650639653205872, "train/loss": 3.011143684387207, "uptime": 6703.445525785, "examples_seen": 36608000.0, "progress": 0.31748710069891567, "epoch": 28.573948595304124, "img/sec/core": 753.5594950864393, "core_hours_NVIDIA A100-SXM4-40GB": 14.237435151755562, "core_hours": 14.237435151755562} {"step": 35800, "global_schedule": 0.8519449234008789, "l2_grads": 1.3600423336029053, "l2_params": 328.12164306640625, "l2_updates": 0.901890754699707, "train/loss": 2.8656556606292725, "uptime": 6712.442328684001, "examples_seen": 36659200.0, "progress": 0.31793113860199107, "epoch": 28.613912159773083, "img/sec/core": 711.3638113280139, "core_hours_NVIDIA A100-SXM4-40GB": 14.257428047086675, "core_hours": 14.257428047086675} {"step": 35850, "global_schedule": 0.8514007329940796, "l2_grads": 1.3689939975738525, "l2_params": 328.0769958496094, "l2_updates": 0.9244539737701416, "train/loss": 2.6620850563049316, "uptime": 6721.088738981001, "examples_seen": 36710400.0, "progress": 0.31837517650506647, "epoch": 28.653875724242038, "img/sec/core": 740.1915685426507, "core_hours_NVIDIA A100-SXM4-40GB": 14.27664229219112, "core_hours": 14.27664229219112} {"step": 35900, "global_schedule": 0.850855827331543, "l2_grads": 1.4434939622879028, "l2_params": 328.066650390625, "l2_updates": 0.8964238166809082, "train/loss": 2.534421443939209, "uptime": 6729.928176065001, "examples_seen": 36761600.0, "progress": 0.31881921440814187, "epoch": 28.693839288710997, "img/sec/core": 724.0280053109601, "core_hours_NVIDIA A100-SXM4-40GB": 14.296285485711119, "core_hours": 14.296285485711119} {"step": 35950, "global_schedule": 0.8503099679946899, "l2_grads": 1.33855402469635, "l2_params": 328.02545166015625, "l2_updates": 0.8927344679832458, "train/loss": 2.529409408569336, "uptime": 6739.050906537001, "examples_seen": 36812800.0, "progress": 0.31926325231121727, "epoch": 28.733802853179952, "img/sec/core": 701.5443478949115, "core_hours_NVIDIA A100-SXM4-40GB": 14.31655822009334, "core_hours": 14.31655822009334} {"step": 36000, "global_schedule": 0.8497633934020996, "l2_grads": 1.3432674407958984, "l2_params": 327.95904541015625, "l2_updates": 0.9089587926864624, "train/loss": 2.6411962509155273, "uptime": 6748.346459628001, "examples_seen": 36864000.0, "progress": 0.31970729021429267, "epoch": 28.773766417648908, "img/sec/core": 688.5012583270902, "core_hours_NVIDIA A100-SXM4-40GB": 14.337215004740008, "core_hours": 14.337215004740008} {"step": 36050, "global_schedule": 0.8492159843444824, "l2_grads": 1.3251314163208008, "l2_params": 327.9216613769531, "l2_updates": 0.8787733912467957, "train/loss": 2.6076762676239014, "uptime": 6757.27522652, "examples_seen": 36915200.0, "progress": 0.3201513281173681, "epoch": 28.813729982117867, "img/sec/core": 796.6798716888286, "core_hours_NVIDIA A100-SXM4-40GB": 14.35506687062445, "core_hours": 14.35506687062445} {"step": 36100, "global_schedule": 0.8486677408218384, "l2_grads": 1.276159405708313, "l2_params": 327.8739318847656, "l2_updates": 0.8909960985183716, "train/loss": 2.909356117248535, "uptime": 6766.0531741760005, "examples_seen": 36966400.0, "progress": 0.32059536602044353, "epoch": 28.853693546586822, "img/sec/core": 729.0998136249757, "core_hours_NVIDIA A100-SXM4-40GB": 14.374573420971116, "core_hours": 14.374573420971116} {"step": 36150, "global_schedule": 0.8481186628341675, "l2_grads": 1.3890925645828247, "l2_params": 327.81195068359375, "l2_updates": 0.8926678895950317, "train/loss": 2.6353020668029785, "uptime": 6774.755131891001, "examples_seen": 37017600.0, "progress": 0.32103940392351893, "epoch": 28.89365711105578, "img/sec/core": 735.466685728398, "core_hours_NVIDIA A100-SXM4-40GB": 14.39391110478223, "core_hours": 14.39391110478223} {"step": 36200, "global_schedule": 0.8475688099861145, "l2_grads": 1.4087170362472534, "l2_params": 327.7669372558594, "l2_updates": 0.8887874484062195, "train/loss": 2.7725470066070557, "uptime": 6783.271988259001, "examples_seen": 37068800.0, "progress": 0.32148344182659433, "epoch": 28.933620675524736, "img/sec/core": 751.4509724558089, "core_hours_NVIDIA A100-SXM4-40GB": 14.412837452266674, "core_hours": 14.412837452266674} {"step": 36250, "global_schedule": 0.8470181226730347, "l2_grads": 1.4060136079788208, "l2_params": 327.6878967285156, "l2_updates": 0.8564776182174683, "train/loss": 2.58905291557312, "uptime": 6791.990880351001, "examples_seen": 37120000.0, "progress": 0.32192747972966973, "epoch": 28.973584239993695, "img/sec/core": 734.0382163775657, "core_hours_NVIDIA A100-SXM4-40GB": 14.432212768026671, "core_hours": 14.432212768026671} {"step": 36300, "global_schedule": 0.8464666604995728, "l2_grads": 1.1838493347167969, "l2_params": 327.6128234863281, "l2_updates": 0.8941940069198608, "train/loss": 3.4434916973114014, "uptime": 6801.958502934, "examples_seen": 37171200.0, "progress": 0.32237151763274513, "epoch": 29.01354780446265, "img/sec/core": 642.0788855826073, "core_hours_NVIDIA A100-SXM4-40GB": 14.454363040433337, "core_hours": 14.454363040433337} {"step": 36350, "global_schedule": 0.8459143042564392, "l2_grads": 1.085228443145752, "l2_params": 327.5760498046875, "l2_updates": 0.8766317367553711, "train/loss": 4.963344097137451, "uptime": 6811.077074563, "examples_seen": 37222400.0, "progress": 0.32281555553582053, "epoch": 29.053511368931606, "img/sec/core": 701.8643116917384, "core_hours_NVIDIA A100-SXM4-40GB": 14.474626532942228, "core_hours": 14.474626532942228} {"step": 36400, "global_schedule": 0.8453612327575684, "l2_grads": 1.297346830368042, "l2_params": 327.52508544921875, "l2_updates": 0.9018398523330688, "train/loss": 2.6404433250427246, "uptime": 6819.347054068001, "examples_seen": 37273600.0, "progress": 0.32325959343889593, "epoch": 29.093474933400564, "img/sec/core": 773.8834172599429, "core_hours_NVIDIA A100-SXM4-40GB": 14.493004265175562, "core_hours": 14.493004265175562} {"step": 36450, "global_schedule": 0.8448072671890259, "l2_grads": 1.3871221542358398, "l2_params": 327.50958251953125, "l2_updates": 0.8760406374931335, "train/loss": 5.123154163360596, "uptime": 6827.860520882001, "examples_seen": 37324800.0, "progress": 0.32370363134197133, "epoch": 29.13343849786952, "img/sec/core": 751.750155350998, "core_hours_NVIDIA A100-SXM4-40GB": 14.511923080317784, "core_hours": 14.511923080317784} {"step": 36500, "global_schedule": 0.8442525267601013, "l2_grads": 1.3420863151550293, "l2_params": 327.4625549316406, "l2_updates": 0.8980404734611511, "train/loss": 2.8114590644836426, "uptime": 6836.160199999, "examples_seen": 37376000.0, "progress": 0.32414766924504673, "epoch": 29.17340206233848, "img/sec/core": 771.1141490870245, "core_hours_NVIDIA A100-SXM4-40GB": 14.530366811688895, "core_hours": 14.530366811688895} {"step": 36550, "global_schedule": 0.8436969518661499, "l2_grads": 1.1967105865478516, "l2_params": 327.42742919921875, "l2_updates": 0.8934313654899597, "train/loss": 3.158010482788086, "uptime": 6845.145224405, "examples_seen": 37427200.0, "progress": 0.3245917071481222, "epoch": 29.213365626807434, "img/sec/core": 712.2963400885498, "core_hours_NVIDIA A100-SXM4-40GB": 14.550333532591115, "core_hours": 14.550333532591115} {"step": 36600, "global_schedule": 0.8431406021118164, "l2_grads": 1.3454400300979614, "l2_params": 327.4046936035156, "l2_updates": 0.8700463175773621, "train/loss": 2.547117233276367, "uptime": 6854.480106001001, "examples_seen": 37478400.0, "progress": 0.3250357450511976, "epoch": 29.25332919127639, "img/sec/core": 685.6005546702671, "core_hours_NVIDIA A100-SXM4-40GB": 14.571077713915564, "core_hours": 14.571077713915564} {"step": 36650, "global_schedule": 0.842583417892456, "l2_grads": 1.3355157375335693, "l2_params": 327.3583068847656, "l2_updates": 0.8710163831710815, "train/loss": 2.664541721343994, "uptime": 6864.012588781001, "examples_seen": 37529600.0, "progress": 0.325479782954273, "epoch": 29.293292755745348, "img/sec/core": 671.3885718658805, "core_hours_NVIDIA A100-SXM4-40GB": 14.592261008982229, "core_hours": 14.592261008982229} {"step": 36700, "global_schedule": 0.8420255184173584, "l2_grads": 1.2560510635375977, "l2_params": 327.3251647949219, "l2_updates": 0.8953158259391785, "train/loss": 2.7062244415283203, "uptime": 6872.798661831001, "examples_seen": 37580800.0, "progress": 0.3259238208573484, "epoch": 29.333256320214304, "img/sec/core": 728.4255393255839, "core_hours_NVIDIA A100-SXM4-40GB": 14.611785615760006, "core_hours": 14.611785615760006} {"step": 36750, "global_schedule": 0.8414667844772339, "l2_grads": 1.3090623617172241, "l2_params": 327.3046569824219, "l2_updates": 0.8756808042526245, "train/loss": 2.691427707672119, "uptime": 6881.230734668001, "examples_seen": 37632000.0, "progress": 0.3263678587604238, "epoch": 29.373219884683262, "img/sec/core": 759.0067263077377, "core_hours_NVIDIA A100-SXM4-40GB": 14.630523555397785, "core_hours": 14.630523555397785} {"step": 36800, "global_schedule": 0.8409071564674377, "l2_grads": 1.1668895483016968, "l2_params": 327.2667236328125, "l2_updates": 0.8699227571487427, "train/loss": 5.066171169281006, "uptime": 6889.588192943, "examples_seen": 37683200.0, "progress": 0.3268118966634992, "epoch": 29.413183449152218, "img/sec/core": 765.783063392066, "core_hours_NVIDIA A100-SXM4-40GB": 14.649095684897782, "core_hours": 14.649095684897782} {"step": 36850, "global_schedule": 0.8403468132019043, "l2_grads": 1.150059700012207, "l2_params": 327.25811767578125, "l2_updates": 0.8555191159248352, "train/loss": 5.086172103881836, "uptime": 6898.021690575, "examples_seen": 37734400.0, "progress": 0.3272559345665746, "epoch": 29.453147013621177, "img/sec/core": 758.8784961195041, "core_hours_NVIDIA A100-SXM4-40GB": 14.667836790746671, "core_hours": 14.667836790746671} {"step": 36900, "global_schedule": 0.839785635471344, "l2_grads": 1.394161581993103, "l2_params": 327.182861328125, "l2_updates": 0.8704785704612732, "train/loss": 2.720829486846924, "uptime": 6906.600347380001, "examples_seen": 37785600.0, "progress": 0.32769997246965, "epoch": 29.493110578090132, "img/sec/core": 746.037537749415, "core_hours_NVIDIA A100-SXM4-40GB": 14.686900472535562, "core_hours": 14.686900472535562} {"step": 36950, "global_schedule": 0.8392236828804016, "l2_grads": 1.4325755834579468, "l2_params": 327.1819152832031, "l2_updates": 0.8566735982894897, "train/loss": 2.620760679244995, "uptime": 6915.876711989, "examples_seen": 37836800.0, "progress": 0.3281440103727254, "epoch": 29.533074142559087, "img/sec/core": 689.9254470648411, "core_hours_NVIDIA A100-SXM4-40GB": 14.707514616111116, "core_hours": 14.707514616111116} {"step": 37000, "global_schedule": 0.8386609554290771, "l2_grads": 1.320042610168457, "l2_params": 327.10552978515625, "l2_updates": 0.8909515738487244, "train/loss": 2.5352258682250977, "uptime": 6924.439156584, "examples_seen": 37888000.0, "progress": 0.32858804827580085, "epoch": 29.573037707028046, "img/sec/core": 747.4500919675941, "core_hours_NVIDIA A100-SXM4-40GB": 14.72654227076667, "core_hours": 14.72654227076667} {"step": 37050, "global_schedule": 0.8380973935127258, "l2_grads": 1.4763041734695435, "l2_params": 327.0489196777344, "l2_updates": 0.8626757264137268, "train/loss": 2.6216976642608643, "uptime": 6934.273277460001, "examples_seen": 37939200.0, "progress": 0.32903208617887625, "epoch": 29.613001271497, "img/sec/core": 724.1507588929799, "core_hours_NVIDIA A100-SXM4-40GB": 14.74618213449334, "core_hours": 14.74618213449334} {"step": 37100, "global_schedule": 0.8375331163406372, "l2_grads": 1.3573116064071655, "l2_params": 327.0021057128906, "l2_updates": 0.8728866577148438, "train/loss": 2.5198564529418945, "uptime": 6942.983939125001, "examples_seen": 37990400.0, "progress": 0.32947612408195165, "epoch": 29.65296483596596, "img/sec/core": 734.7317857282546, "core_hours_NVIDIA A100-SXM4-40GB": 14.765539160415562, "core_hours": 14.765539160415562} {"step": 37150, "global_schedule": 0.836967945098877, "l2_grads": 1.2754322290420532, "l2_params": 326.9427795410156, "l2_updates": 0.8988636136054993, "train/loss": 3.1161224842071533, "uptime": 6951.5304170300005, "examples_seen": 38041600.0, "progress": 0.32992016198502705, "epoch": 29.692928400434916, "img/sec/core": 748.8464922206002, "core_hours_NVIDIA A100-SXM4-40GB": 14.784531333537783, "core_hours": 14.784531333537783} {"step": 37200, "global_schedule": 0.8364019989967346, "l2_grads": 1.3420039415359497, "l2_params": 326.9181213378906, "l2_updates": 0.869756281375885, "train/loss": 2.5239129066467285, "uptime": 6960.139536726001, "examples_seen": 38092800.0, "progress": 0.33036419988810245, "epoch": 29.732891964903875, "img/sec/core": 743.3977254344801, "core_hours_NVIDIA A100-SXM4-40GB": 14.803662710640006, "core_hours": 14.803662710640006} {"step": 37250, "global_schedule": 0.835835337638855, "l2_grads": 1.3030469417572021, "l2_params": 326.908203125, "l2_updates": 0.8991594314575195, "train/loss": 2.6212220191955566, "uptime": 6968.592832557, "examples_seen": 38144000.0, "progress": 0.33080823779117785, "epoch": 29.77285552937283, "img/sec/core": 757.101150598619, "core_hours_NVIDIA A100-SXM4-40GB": 14.822447812486672, "core_hours": 14.822447812486672} {"step": 37300, "global_schedule": 0.8352677822113037, "l2_grads": 1.1278555393218994, "l2_params": 326.8404541015625, "l2_updates": 0.8881484270095825, "train/loss": 3.8551812171936035, "uptime": 6977.343821243001, "examples_seen": 38195200.0, "progress": 0.33125227569425325, "epoch": 29.812819093841785, "img/sec/core": 731.3459346871656, "core_hours_NVIDIA A100-SXM4-40GB": 14.841894454011118, "core_hours": 14.841894454011118} {"step": 37350, "global_schedule": 0.8346995115280151, "l2_grads": 1.3863049745559692, "l2_params": 326.8127746582031, "l2_updates": 0.875544011592865, "train/loss": 2.6562414169311523, "uptime": 6986.256824289001, "examples_seen": 38246400.0, "progress": 0.33169631359732865, "epoch": 29.852782658310744, "img/sec/core": 718.0520377890084, "core_hours_NVIDIA A100-SXM4-40GB": 14.861701127446674, "core_hours": 14.861701127446674} {"step": 37400, "global_schedule": 0.8341304659843445, "l2_grads": 1.208843469619751, "l2_params": 326.7694396972656, "l2_updates": 0.8929852843284607, "train/loss": 3.2585105895996094, "uptime": 6995.5769534890005, "examples_seen": 38297600.0, "progress": 0.33214035150040405, "epoch": 29.8927462227797, "img/sec/core": 686.6857596781376, "core_hours_NVIDIA A100-SXM4-40GB": 14.882412525668894, "core_hours": 14.882412525668894} {"step": 37450, "global_schedule": 0.833560585975647, "l2_grads": 1.0703632831573486, "l2_params": 326.72650146484375, "l2_updates": 0.8860152959823608, "train/loss": 4.893272876739502, "uptime": 7004.335394251, "examples_seen": 38348800.0, "progress": 0.3325843894034795, "epoch": 29.93270978724866, "img/sec/core": 730.7236726162141, "core_hours_NVIDIA A100-SXM4-40GB": 14.901875727362228, "core_hours": 14.901875727362228} {"step": 37500, "global_schedule": 0.8329899907112122, "l2_grads": 1.4389208555221558, "l2_params": 326.6716613769531, "l2_updates": 0.8555928468704224, "train/loss": 2.647876024246216, "uptime": 7013.341536133001, "examples_seen": 38400000.0, "progress": 0.3330284273065549, "epoch": 29.972673351717614, "img/sec/core": 710.6261575548683, "core_hours_NVIDIA A100-SXM4-40GB": 14.921889375988895, "core_hours": 14.921889375988895, "val/acc@1": 0.6084, "val/loss": 1.686585673828125, "z/secs/eval/val": 4.596649794999394} {"step": 37550, "global_schedule": 0.8324185609817505, "l2_grads": 1.4806307554244995, "l2_params": 326.60308837890625, "l2_updates": 0.858586847782135, "train/loss": 2.5975213050842285, "uptime": 7027.119164395001, "examples_seen": 38451200.0, "progress": 0.3334724652096303, "epoch": 30.01263691618657, "img/sec/core": 697.1624833013349, "core_hours_NVIDIA A100-SXM4-40GB": 14.942289530275561, "core_hours": 14.942289530275561} {"step": 37600, "global_schedule": 0.8318463563919067, "l2_grads": 1.4273613691329956, "l2_params": 326.5457763671875, "l2_updates": 0.866479218006134, "train/loss": 2.570953607559204, "uptime": 7036.014417769, "examples_seen": 38502400.0, "progress": 0.3339165031127057, "epoch": 30.052600480655528, "img/sec/core": 719.4848455589878, "core_hours_NVIDIA A100-SXM4-40GB": 14.96205675999556, "core_hours": 14.96205675999556} {"step": 37650, "global_schedule": 0.8312734365463257, "l2_grads": 1.4293867349624634, "l2_params": 326.52825927734375, "l2_updates": 0.8784306049346924, "train/loss": 2.581801414489746, "uptime": 7044.897320004, "examples_seen": 38553600.0, "progress": 0.3343605410157811, "epoch": 30.092564045124483, "img/sec/core": 720.4852457773275, "core_hours_NVIDIA A100-SXM4-40GB": 14.981796542740003, "core_hours": 14.981796542740003} {"step": 37700, "global_schedule": 0.8306996822357178, "l2_grads": 1.235528588294983, "l2_params": 326.4696350097656, "l2_updates": 0.8518469929695129, "train/loss": 5.153144836425781, "uptime": 7053.545242225, "examples_seen": 38604800.0, "progress": 0.3348045789188565, "epoch": 30.132527609593442, "img/sec/core": 740.0621601867165, "core_hours_NVIDIA A100-SXM4-40GB": 15.00101414767556, "core_hours": 15.00101414767556} {"step": 37750, "global_schedule": 0.8301251530647278, "l2_grads": 1.3219815492630005, "l2_params": 326.41241455078125, "l2_updates": 0.8585284352302551, "train/loss": 4.182702541351318, "uptime": 7061.842615306001, "examples_seen": 38656000.0, "progress": 0.3352486168219319, "epoch": 30.172491174062397, "img/sec/core": 771.3284599260206, "core_hours_NVIDIA A100-SXM4-40GB": 15.019452754522229, "core_hours": 15.019452754522229} {"step": 37800, "global_schedule": 0.8295498490333557, "l2_grads": 1.425795555114746, "l2_params": 326.39825439453125, "l2_updates": 0.8633711338043213, "train/loss": 2.4899754524230957, "uptime": 7070.473867232, "examples_seen": 38707200.0, "progress": 0.3356926547250073, "epoch": 30.212454738531356, "img/sec/core": 741.491507242639, "core_hours_NVIDIA A100-SXM4-40GB": 15.038633314357782, "core_hours": 15.038633314357782} {"step": 37850, "global_schedule": 0.8289737701416016, "l2_grads": 1.2902967929840088, "l2_params": 326.3496398925781, "l2_updates": 0.8938091993331909, "train/loss": 2.800156831741333, "uptime": 7079.092886604001, "examples_seen": 38758400.0, "progress": 0.3361366926280827, "epoch": 30.25241830300031, "img/sec/core": 742.5438699894655, "core_hours_NVIDIA A100-SXM4-40GB": 15.057786690740008, "core_hours": 15.057786690740008} {"step": 37900, "global_schedule": 0.8283969759941101, "l2_grads": 1.4682047367095947, "l2_params": 326.3367919921875, "l2_updates": 0.8873838782310486, "train/loss": 2.561335802078247, "uptime": 7087.565452445, "examples_seen": 38809600.0, "progress": 0.3365807305311581, "epoch": 30.292381867469267, "img/sec/core": 755.3791991831221, "core_hours_NVIDIA A100-SXM4-40GB": 15.076614614831117, "core_hours": 15.076614614831117} {"step": 37950, "global_schedule": 0.8278193473815918, "l2_grads": 1.2228854894638062, "l2_params": 326.30267333984375, "l2_updates": 0.8715289235115051, "train/loss": 4.863642692565918, "uptime": 7096.505414544001, "examples_seen": 38860800.0, "progress": 0.33702476843423357, "epoch": 30.332345431938226, "img/sec/core": 715.8867038950186, "core_hours_NVIDIA A100-SXM4-40GB": 15.09648119727334, "core_hours": 15.09648119727334} {"step": 38000, "global_schedule": 0.8272410035133362, "l2_grads": 1.1615537405014038, "l2_params": 326.25347900390625, "l2_updates": 0.8692739009857178, "train/loss": 3.507316827774048, "uptime": 7105.932425071, "examples_seen": 38912000.0, "progress": 0.33746880633730897, "epoch": 30.37230899640718, "img/sec/core": 678.9002708409489, "core_hours_NVIDIA A100-SXM4-40GB": 15.117430109555558, "core_hours": 15.117430109555558} {"step": 38050, "global_schedule": 0.8266618251800537, "l2_grads": 1.2475225925445557, "l2_params": 326.2078552246094, "l2_updates": 0.8600162863731384, "train/loss": 3.6726019382476807, "uptime": 7115.007541177001, "examples_seen": 38963200.0, "progress": 0.33791284424038437, "epoch": 30.41227256087614, "img/sec/core": 766.2340060223944, "core_hours_NVIDIA A100-SXM4-40GB": 15.135991309020003, "core_hours": 15.135991309020003} {"step": 38100, "global_schedule": 0.8260819911956787, "l2_grads": 1.3933459520339966, "l2_params": 326.14984130859375, "l2_updates": 0.8722877502441406, "train/loss": 2.510427951812744, "uptime": 7123.800126561, "examples_seen": 39014400.0, "progress": 0.33835688214345977, "epoch": 30.452236125345095, "img/sec/core": 727.8860221985493, "core_hours_NVIDIA A100-SXM4-40GB": 15.155530387651112, "core_hours": 15.155530387651112} {"step": 38150, "global_schedule": 0.8255012631416321, "l2_grads": 1.4142794609069824, "l2_params": 326.1033935546875, "l2_updates": 0.8631837368011475, "train/loss": 2.704280138015747, "uptime": 7132.4552580790005, "examples_seen": 39065600.0, "progress": 0.33880092004653517, "epoch": 30.49219968981405, "img/sec/core": 739.4457249655501, "core_hours_NVIDIA A100-SXM4-40GB": 15.174764013246667, "core_hours": 15.174764013246667} {"step": 38200, "global_schedule": 0.8249198198318481, "l2_grads": 1.3842759132385254, "l2_params": 326.0809020996094, "l2_updates": 0.8448376655578613, "train/loss": 2.655351161956787, "uptime": 7141.100266555, "examples_seen": 39116800.0, "progress": 0.33924495794961057, "epoch": 30.53216325428301, "img/sec/core": 740.311593420357, "core_hours_NVIDIA A100-SXM4-40GB": 15.193975143193336, "core_hours": 15.193975143193336} {"step": 38250, "global_schedule": 0.8243376612663269, "l2_grads": 1.2151436805725098, "l2_params": 326.0459899902344, "l2_updates": 0.8559959530830383, "train/loss": 3.3896355628967285, "uptime": 7149.5573300880005, "examples_seen": 39168000.0, "progress": 0.33968899585268597, "epoch": 30.572126818751965, "img/sec/core": 756.7638548565599, "core_hours_NVIDIA A100-SXM4-40GB": 15.212768617711113, "core_hours": 15.212768617711113} {"step": 38300, "global_schedule": 0.8237547278404236, "l2_grads": 1.396891713142395, "l2_params": 325.9847412109375, "l2_updates": 0.883730947971344, "train/loss": 2.498088836669922, "uptime": 7158.934330916001, "examples_seen": 39219200.0, "progress": 0.34013303375576137, "epoch": 30.612090383220924, "img/sec/core": 682.5210019059508, "core_hours_NVIDIA A100-SXM4-40GB": 15.233606397328892, "core_hours": 15.233606397328892} {"step": 38350, "global_schedule": 0.8231710195541382, "l2_grads": 1.2699599266052246, "l2_params": 325.9396057128906, "l2_updates": 0.8768077492713928, "train/loss": 2.6926918029785156, "uptime": 7168.301534223001, "examples_seen": 39270400.0, "progress": 0.34057707165883677, "epoch": 30.65205394768988, "img/sec/core": 683.234877075588, "core_hours_NVIDIA A100-SXM4-40GB": 15.254422404677781, "core_hours": 15.254422404677781} {"step": 38400, "global_schedule": 0.8225865364074707, "l2_grads": 1.2241398096084595, "l2_params": 325.885498046875, "l2_updates": 0.8605402708053589, "train/loss": 3.487781047821045, "uptime": 7176.809314862001, "examples_seen": 39321600.0, "progress": 0.34102110956191223, "epoch": 30.692017512158838, "img/sec/core": 752.2525875505262, "core_hours_NVIDIA A100-SXM4-40GB": 15.273328583875559, "core_hours": 15.273328583875559} {"step": 38450, "global_schedule": 0.8220012784004211, "l2_grads": 1.0856200456619263, "l2_params": 325.8475036621094, "l2_updates": 0.8506113290786743, "train/loss": 4.343266487121582, "uptime": 7185.293161725, "examples_seen": 39372800.0, "progress": 0.34146514746498763, "epoch": 30.731981076627793, "img/sec/core": 754.374766936548, "core_hours_NVIDIA A100-SXM4-40GB": 15.292181576904445, "core_hours": 15.292181576904445} {"step": 38500, "global_schedule": 0.8214153051376343, "l2_grads": 1.3049418926239014, "l2_params": 325.78515625, "l2_updates": 0.8710947036743164, "train/loss": 2.6732735633850098, "uptime": 7193.746506344001, "examples_seen": 39424000.0, "progress": 0.34190918536806303, "epoch": 30.77194464109675, "img/sec/core": 757.0967810319609, "core_hours_NVIDIA A100-SXM4-40GB": 15.310966787168892, "core_hours": 15.310966787168892} {"step": 38550, "global_schedule": 0.8208285570144653, "l2_grads": 1.2776814699172974, "l2_params": 325.74957275390625, "l2_updates": 0.8702353835105896, "train/loss": 2.7906486988067627, "uptime": 7202.542871401001, "examples_seen": 39475200.0, "progress": 0.34235322327113843, "epoch": 30.811908205565707, "img/sec/core": 727.5732599236528, "core_hours_NVIDIA A100-SXM4-40GB": 15.330514265073337, "core_hours": 15.330514265073337} {"step": 38600, "global_schedule": 0.8202410936355591, "l2_grads": 1.2906996011734009, "l2_params": 325.6772766113281, "l2_updates": 0.8380577564239502, "train/loss": 4.562543869018555, "uptime": 7211.170626015, "examples_seen": 39526400.0, "progress": 0.34279726117421383, "epoch": 30.851871770034663, "img/sec/core": 741.7920752655168, "core_hours_NVIDIA A100-SXM4-40GB": 15.349687053104446, "core_hours": 15.349687053104446} {"step": 38650, "global_schedule": 0.819652795791626, "l2_grads": 1.4323898553848267, "l2_params": 325.614013671875, "l2_updates": 0.86251300573349, "train/loss": 2.4751760959625244, "uptime": 7219.784453159, "examples_seen": 39577600.0, "progress": 0.34324129907728923, "epoch": 30.89183533450362, "img/sec/core": 742.9914593141458, "core_hours_NVIDIA A100-SXM4-40GB": 15.368828891202222, "core_hours": 15.368828891202222} {"step": 38700, "global_schedule": 0.8190639019012451, "l2_grads": 1.1892915964126587, "l2_params": 325.5450439453125, "l2_updates": 0.8523900508880615, "train/loss": 3.946326732635498, "uptime": 7228.782284643001, "examples_seen": 39628800.0, "progress": 0.34368533698036463, "epoch": 30.931798898972577, "img/sec/core": 711.2824919404038, "core_hours_NVIDIA A100-SXM4-40GB": 15.38882407227778, "core_hours": 15.38882407227778} {"step": 38750, "global_schedule": 0.8184741139411926, "l2_grads": 1.2887768745422363, "l2_params": 325.4825134277344, "l2_updates": 0.8623754382133484, "train/loss": 5.0515336990356445, "uptime": 7237.400495589, "examples_seen": 39680000.0, "progress": 0.34412937488344003, "epoch": 30.971762463441536, "img/sec/core": 742.613523862676, "core_hours_NVIDIA A100-SXM4-40GB": 15.407975652157777, "core_hours": 15.407975652157777} {"step": 38800, "global_schedule": 0.8178836107254028, "l2_grads": 1.4610848426818848, "l2_params": 325.4625549316406, "l2_updates": 0.8505399227142334, "train/loss": 2.575002908706665, "uptime": 7246.7041075940015, "examples_seen": 39731200.0, "progress": 0.34457341278651543, "epoch": 31.01172602791049, "img/sec/core": 687.9048692657382, "core_hours_NVIDIA A100-SXM4-40GB": 15.428650345502227, "core_hours": 15.428650345502227} {"step": 38850, "global_schedule": 0.8172924518585205, "l2_grads": 1.2330846786499023, "l2_params": 325.3948669433594, "l2_updates": 0.8473721742630005, "train/loss": 4.960770606994629, "uptime": 7255.156248762001, "examples_seen": 39782400.0, "progress": 0.3450174506895909, "epoch": 31.051689592379446, "img/sec/core": 757.2045796195051, "core_hours_NVIDIA A100-SXM4-40GB": 15.447432881431116, "core_hours": 15.447432881431116} {"step": 38900, "global_schedule": 0.8167004585266113, "l2_grads": 1.235268235206604, "l2_params": 325.3760986328125, "l2_updates": 0.8546109199523926, "train/loss": 4.0238542556762695, "uptime": 7263.819739301, "examples_seen": 39833600.0, "progress": 0.3454614885926663, "epoch": 31.091653156848405, "img/sec/core": 738.7322663065995, "core_hours_NVIDIA A100-SXM4-40GB": 15.466685082628889, "core_hours": 15.466685082628889} {"step": 38950, "global_schedule": 0.8161077499389648, "l2_grads": 1.2699919939041138, "l2_params": 325.30743408203125, "l2_updates": 0.8492565155029297, "train/loss": 3.0660088062286377, "uptime": 7272.214332952002, "examples_seen": 39884800.0, "progress": 0.3459055264957417, "epoch": 31.13161672131736, "img/sec/core": 762.3954495088137, "core_hours_NVIDIA A100-SXM4-40GB": 15.485339735186672, "core_hours": 15.485339735186672} {"step": 39000, "global_schedule": 0.8155142664909363, "l2_grads": 1.4359596967697144, "l2_params": 325.2440490722656, "l2_updates": 0.8481090068817139, "train/loss": 2.4906489849090576, "uptime": 7281.092592941999, "examples_seen": 39936000.0, "progress": 0.3463495643988171, "epoch": 31.17158028578632, "img/sec/core": 720.8619715136605, "core_hours_NVIDIA A100-SXM4-40GB": 15.505069201831109, "core_hours": 15.505069201831109} {"step": 39050, "global_schedule": 0.8149200677871704, "l2_grads": 1.4296478033065796, "l2_params": 325.1850280761719, "l2_updates": 0.8527036905288696, "train/loss": 2.6561365127563477, "uptime": 7290.822879835001, "examples_seen": 39987200.0, "progress": 0.3467936023018925, "epoch": 31.211543850255275, "img/sec/core": 704.9692676741136, "core_hours_NVIDIA A100-SXM4-40GB": 15.525243446120008, "core_hours": 15.525243446120008} {"step": 39100, "global_schedule": 0.8143251538276672, "l2_grads": 1.1762627363204956, "l2_params": 325.10943603515625, "l2_updates": 0.8479765057563782, "train/loss": 3.1016533374786377, "uptime": 7300.421758733, "examples_seen": 40038400.0, "progress": 0.3472376402049679, "epoch": 31.25150741472423, "img/sec/core": 666.7445300652662, "core_hours_NVIDIA A100-SXM4-40GB": 15.54657428811556, "core_hours": 15.54657428811556} {"step": 39150, "global_schedule": 0.8137295246124268, "l2_grads": 1.2343865633010864, "l2_params": 325.063232421875, "l2_updates": 0.8749183416366577, "train/loss": 2.803969621658325, "uptime": 7309.048368549002, "examples_seen": 40089600.0, "progress": 0.3476816781080433, "epoch": 31.29147097919319, "img/sec/core": 741.8905151046467, "core_hours_NVIDIA A100-SXM4-40GB": 15.565744532151118, "core_hours": 15.565744532151118} {"step": 39200, "global_schedule": 0.8131331205368042, "l2_grads": 1.4275590181350708, "l2_params": 325.02679443359375, "l2_updates": 0.8487128019332886, "train/loss": 2.428227186203003, "uptime": 7318.115017154001, "examples_seen": 40140800.0, "progress": 0.3481257160111187, "epoch": 31.331434543662144, "img/sec/core": 705.8837591291377, "core_hours_NVIDIA A100-SXM4-40GB": 15.58589264016223, "core_hours": 15.58589264016223} {"step": 39250, "global_schedule": 0.8125359416007996, "l2_grads": 1.3905744552612305, "l2_params": 324.9814758300781, "l2_updates": 0.8424566984176636, "train/loss": 2.5367021560668945, "uptime": 7326.9559920910015, "examples_seen": 40192000.0, "progress": 0.3485697539141941, "epoch": 31.371398108131103, "img/sec/core": 723.9020634721426, "core_hours_NVIDIA A100-SXM4-40GB": 15.60553925113334, "core_hours": 15.60553925113334} {"step": 39300, "global_schedule": 0.8119380474090576, "l2_grads": 1.107528567314148, "l2_params": 324.9368591308594, "l2_updates": 0.8638125658035278, "train/loss": 4.248737335205078, "uptime": 7336.0036788550005, "examples_seen": 40243200.0, "progress": 0.34901379181726955, "epoch": 31.41136167260006, "img/sec/core": 707.3631268343332, "core_hours_NVIDIA A100-SXM4-40GB": 15.625645221720005, "core_hours": 15.625645221720005} {"step": 39350, "global_schedule": 0.8113394975662231, "l2_grads": 1.1343427896499634, "l2_params": 324.8993225097656, "l2_updates": 0.8574708700180054, "train/loss": 3.698676586151123, "uptime": 7345.204932622999, "examples_seen": 40294400.0, "progress": 0.34945782972034495, "epoch": 31.451325237069018, "img/sec/core": 695.5573839577095, "core_hours_NVIDIA A100-SXM4-40GB": 15.646092452315559, "core_hours": 15.646092452315559} {"step": 39400, "global_schedule": 0.8107401728630066, "l2_grads": 1.365656852722168, "l2_params": 324.8636779785156, "l2_updates": 0.863706648349762, "train/loss": 2.6354265213012695, "uptime": 7353.694507188002, "examples_seen": 40345600.0, "progress": 0.34990186762342035, "epoch": 31.491288801537973, "img/sec/core": 753.865809293102, "core_hours_NVIDIA A100-SXM4-40GB": 15.664958173571119, "core_hours": 15.664958173571119} {"step": 39450, "global_schedule": 0.810140073299408, "l2_grads": 1.4570081233978271, "l2_params": 324.80438232421875, "l2_updates": 0.8450856804847717, "train/loss": 2.5211644172668457, "uptime": 7362.234664251, "examples_seen": 40396800.0, "progress": 0.35034590552649575, "epoch": 31.531252366006928, "img/sec/core": 749.400737338787, "core_hours_NVIDIA A100-SXM4-40GB": 15.683936300377782, "core_hours": 15.683936300377782} {"step": 39500, "global_schedule": 0.8095393180847168, "l2_grads": 1.2904667854309082, "l2_params": 324.7550964355469, "l2_updates": 0.8320823311805725, "train/loss": 3.143354892730713, "uptime": 7370.818220952, "examples_seen": 40448000.0, "progress": 0.35078994342957115, "epoch": 31.571215930475887, "img/sec/core": 745.6116645975505, "core_hours_NVIDIA A100-SXM4-40GB": 15.703010870824448, "core_hours": 15.703010870824448} {"step": 39550, "global_schedule": 0.8089377880096436, "l2_grads": 1.3836140632629395, "l2_params": 324.6830749511719, "l2_updates": 0.8560789227485657, "train/loss": 2.7756152153015137, "uptime": 7379.4619959520005, "examples_seen": 40499200.0, "progress": 0.35123398133264655, "epoch": 31.611179494944842, "img/sec/core": 740.4172366818502, "core_hours_NVIDIA A100-SXM4-40GB": 15.72221925971334, "core_hours": 15.72221925971334} {"step": 39600, "global_schedule": 0.808335542678833, "l2_grads": 1.4341988563537598, "l2_params": 324.6632080078125, "l2_updates": 0.8314415216445923, "train/loss": 2.53658127784729, "uptime": 7387.856392452, "examples_seen": 40550400.0, "progress": 0.35167801923572195, "epoch": 31.6511430594138, "img/sec/core": 762.4133551471043, "core_hours_NVIDIA A100-SXM4-40GB": 15.740873474157784, "core_hours": 15.740873474157784} {"step": 39650, "global_schedule": 0.8077325820922852, "l2_grads": 1.3883981704711914, "l2_params": 324.57171630859375, "l2_updates": 0.8266205787658691, "train/loss": 2.7609925270080566, "uptime": 7396.4367406559995, "examples_seen": 40601600.0, "progress": 0.35212205713879735, "epoch": 31.691106623882757, "img/sec/core": 745.8904752859635, "core_hours_NVIDIA A100-SXM4-40GB": 15.759940914611114, "core_hours": 15.759940914611114} {"step": 39700, "global_schedule": 0.80712890625, "l2_grads": 1.249570608139038, "l2_params": 324.5077819824219, "l2_updates": 0.8570942878723145, "train/loss": 4.575560569763184, "uptime": 7405.4818949810015, "examples_seen": 40652800.0, "progress": 0.35256609504187275, "epoch": 31.731070188351715, "img/sec/core": 707.5611725396, "core_hours_NVIDIA A100-SXM4-40GB": 15.780041257555563, "core_hours": 15.780041257555563} {"step": 39750, "global_schedule": 0.8065245151519775, "l2_grads": 1.3297876119613647, "l2_params": 324.48773193359375, "l2_updates": 0.8486829996109009, "train/loss": 3.108248233795166, "uptime": 7414.155583971, "examples_seen": 40704000.0, "progress": 0.3530101329449482, "epoch": 31.77103375282067, "img/sec/core": 737.8636710838672, "core_hours_NVIDIA A100-SXM4-40GB": 15.799316121977784, "core_hours": 15.799316121977784} {"step": 39800, "global_schedule": 0.8059194087982178, "l2_grads": 1.3841512203216553, "l2_params": 324.429931640625, "l2_updates": 0.8363162875175476, "train/loss": 2.5006964206695557, "uptime": 7423.491652966999, "examples_seen": 40755200.0, "progress": 0.3534541708480236, "epoch": 31.810997317289626, "img/sec/core": 685.5133571466407, "core_hours_NVIDIA A100-SXM4-40GB": 15.820062941968892, "core_hours": 15.820062941968892} {"step": 39850, "global_schedule": 0.8053135871887207, "l2_grads": 1.1602047681808472, "l2_params": 324.35626220703125, "l2_updates": 0.8454803228378296, "train/loss": 4.78049898147583, "uptime": 7431.963728227, "examples_seen": 40806400.0, "progress": 0.353898208751099, "epoch": 31.850960881758585, "img/sec/core": 755.4229399042865, "core_hours_NVIDIA A100-SXM4-40GB": 15.838889775880004, "core_hours": 15.838889775880004} {"step": 39900, "global_schedule": 0.8047070503234863, "l2_grads": 1.3604869842529297, "l2_params": 324.32440185546875, "l2_updates": 0.8529761433601379, "train/loss": 2.415574312210083, "uptime": 7440.686424630001, "examples_seen": 40857600.0, "progress": 0.3543422466541744, "epoch": 31.89092444622754, "img/sec/core": 733.7180734385954, "core_hours_NVIDIA A100-SXM4-40GB": 15.858273545664451, "core_hours": 15.858273545664451} {"step": 39950, "global_schedule": 0.8040997385978699, "l2_grads": 1.330619215965271, "l2_params": 324.25518798828125, "l2_updates": 0.8500349521636963, "train/loss": 2.4510395526885986, "uptime": 7449.285055484999, "examples_seen": 40908800.0, "progress": 0.3547862845572498, "epoch": 31.9308880106965, "img/sec/core": 744.3045419585402, "core_hours_NVIDIA A100-SXM4-40GB": 15.877381614231115, "core_hours": 15.877381614231115} {"step": 40000, "global_schedule": 0.8034918308258057, "l2_grads": 1.20418119430542, "l2_params": 324.18084716796875, "l2_updates": 0.8279088139533997, "train/loss": 4.763584613800049, "uptime": 7458.482167223001, "examples_seen": 40960000.0, "progress": 0.3552303224603252, "epoch": 31.970851575165455, "img/sec/core": 695.8706365995029, "core_hours_NVIDIA A100-SXM4-40GB": 15.897819640315562, "core_hours": 15.897819640315562, "val/acc@1": 0.62214, "val/loss": 1.5846654760742187, "z/secs/eval/val": 2.7809223129988823} {"step": 40050, "global_schedule": 0.8028830885887146, "l2_grads": 1.380745768547058, "l2_params": 324.1014404296875, "l2_updates": 0.8625248074531555, "train/loss": 2.5827276706695557, "uptime": 7471.466959104002, "examples_seen": 41011200.0, "progress": 0.3556743603634006, "epoch": 32.01081513963441, "img/sec/core": 689.8439650892374, "core_hours_NVIDIA A100-SXM4-40GB": 15.91843621876223, "core_hours": 15.91843621876223} {"step": 40100, "global_schedule": 0.8022737503051758, "l2_grads": 1.4455914497375488, "l2_params": 324.080810546875, "l2_updates": 0.8286951184272766, "train/loss": 2.5230515003204346, "uptime": 7479.897168458001, "examples_seen": 41062400.0, "progress": 0.356118398266476, "epoch": 32.050778704103365, "img/sec/core": 759.1745034141998, "core_hours_NVIDIA A100-SXM4-40GB": 15.937170017326672, "core_hours": 15.937170017326672} {"step": 40150, "global_schedule": 0.8016636371612549, "l2_grads": 1.1988661289215088, "l2_params": 324.06207275390625, "l2_updates": 0.8511925935745239, "train/loss": 5.0041985511779785, "uptime": 7488.482177350999, "examples_seen": 41113600.0, "progress": 0.3565624361695514, "epoch": 32.09074226857233, "img/sec/core": 745.4855411063888, "core_hours_NVIDIA A100-SXM4-40GB": 15.956247814866668, "core_hours": 15.956247814866668} {"step": 40200, "global_schedule": 0.8010528087615967, "l2_grads": 1.2487080097198486, "l2_params": 324.0152893066406, "l2_updates": 0.8066772818565369, "train/loss": 5.046388149261475, "uptime": 7497.020252058001, "examples_seen": 41164800.0, "progress": 0.35700647407262687, "epoch": 32.13070583304128, "img/sec/core": 749.5835091196853, "core_hours_NVIDIA A100-SXM4-40GB": 15.97522131421556, "core_hours": 15.97522131421556} {"step": 40250, "global_schedule": 0.8004412651062012, "l2_grads": 1.3792130947113037, "l2_params": 323.9626159667969, "l2_updates": 0.8157327771186829, "train/loss": 2.6214635372161865, "uptime": 7505.935083101, "examples_seen": 41216000.0, "progress": 0.35745051197570227, "epoch": 32.17066939751024, "img/sec/core": 717.9048003412191, "core_hours_NVIDIA A100-SXM4-40GB": 15.99503204986667, "core_hours": 15.99503204986667} {"step": 40300, "global_schedule": 0.7998290061950684, "l2_grads": 1.377801537513733, "l2_params": 323.88201904296875, "l2_updates": 0.8256141543388367, "train/loss": 2.4193828105926514, "uptime": 7514.663112614, "examples_seen": 41267200.0, "progress": 0.35789454987877767, "epoch": 32.210632961979194, "img/sec/core": 733.2697478242054, "core_hours_NVIDIA A100-SXM4-40GB": 16.01442767100667, "core_hours": 16.01442767100667} {"step": 40350, "global_schedule": 0.7992161512374878, "l2_grads": 1.1857993602752686, "l2_params": 323.8083190917969, "l2_updates": 0.8346195816993713, "train/loss": 3.5500338077545166, "uptime": 7523.316734475002, "examples_seen": 41318400.0, "progress": 0.35833858778185307, "epoch": 32.25059652644815, "img/sec/core": 739.5747240634731, "core_hours_NVIDIA A100-SXM4-40GB": 16.033657941808897, "core_hours": 16.033657941808897} {"step": 40400, "global_schedule": 0.7986024618148804, "l2_grads": 1.2483856678009033, "l2_params": 323.7486572265625, "l2_updates": 0.8353484272956848, "train/loss": 2.945289373397827, "uptime": 7532.341480528999, "examples_seen": 41369600.0, "progress": 0.35878262568492847, "epoch": 32.29056009091711, "img/sec/core": 709.1612286602806, "core_hours_NVIDIA A100-SXM4-40GB": 16.05371293304, "core_hours": 16.05371293304} {"step": 40450, "global_schedule": 0.7979881763458252, "l2_grads": 1.1268234252929688, "l2_params": 323.6865234375, "l2_updates": 0.8409066200256348, "train/loss": 4.999255180358887, "uptime": 7540.813204627999, "examples_seen": 41420800.0, "progress": 0.35922666358800387, "epoch": 32.33052365538607, "img/sec/core": 755.4542529018273, "core_hours_NVIDIA A100-SXM4-40GB": 16.072538986593333, "core_hours": 16.072538986593333} {"step": 40500, "global_schedule": 0.7973731756210327, "l2_grads": 1.3692759275436401, "l2_params": 323.6495056152344, "l2_updates": 0.8153175711631775, "train/loss": 4.328248977661133, "uptime": 7549.317418106, "examples_seen": 41472000.0, "progress": 0.35967070149107927, "epoch": 32.37048721985502, "img/sec/core": 752.5681259713657, "core_hours_NVIDIA A100-SXM4-40GB": 16.09143723876667, "core_hours": 16.09143723876667} {"step": 40550, "global_schedule": 0.7967574000358582, "l2_grads": 1.157418966293335, "l2_params": 323.5910949707031, "l2_updates": 0.8219165205955505, "train/loss": 3.7009329795837402, "uptime": 7557.777990357999, "examples_seen": 41523200.0, "progress": 0.36011473939415467, "epoch": 32.41045078432398, "img/sec/core": 756.4500141805152, "core_hours_NVIDIA A100-SXM4-40GB": 16.110238510437778, "core_hours": 16.110238510437778} {"step": 40600, "global_schedule": 0.7961410284042358, "l2_grads": 1.3526045083999634, "l2_params": 323.5588073730469, "l2_updates": 0.8285894989967346, "train/loss": 2.4757025241851807, "uptime": 7566.242768793001, "examples_seen": 41574400.0, "progress": 0.36055877729723007, "epoch": 32.45041434879294, "img/sec/core": 756.0741310766094, "core_hours_NVIDIA A100-SXM4-40GB": 16.129049129182228, "core_hours": 16.129049129182228} {"step": 40650, "global_schedule": 0.7955238819122314, "l2_grads": 1.4024564027786255, "l2_params": 323.5009460449219, "l2_updates": 0.8104687929153442, "train/loss": 2.486813545227051, "uptime": 7575.436099195, "examples_seen": 41625600.0, "progress": 0.36100281520030547, "epoch": 32.490377913261895, "img/sec/core": 696.1568572156076, "core_hours_NVIDIA A100-SXM4-40GB": 16.14947875229778, "core_hours": 16.14947875229778} {"step": 40700, "global_schedule": 0.7949061393737793, "l2_grads": 1.1798728704452515, "l2_params": 323.4241638183594, "l2_updates": 0.8369675874710083, "train/loss": 3.7159435749053955, "uptime": 7584.580289521002, "examples_seen": 41676800.0, "progress": 0.3614468531033809, "epoch": 32.53034147773085, "img/sec/core": 699.8979430471018, "core_hours_NVIDIA A100-SXM4-40GB": 16.16979917524445, "core_hours": 16.16979917524445} {"step": 40750, "global_schedule": 0.7942875623703003, "l2_grads": 1.3218350410461426, "l2_params": 323.3775329589844, "l2_updates": 0.8412535190582275, "train/loss": 2.3729188442230225, "uptime": 7593.151720917, "examples_seen": 41728000.0, "progress": 0.36189089100645633, "epoch": 32.570305042199806, "img/sec/core": 746.6664206153722, "core_hours_NVIDIA A100-SXM4-40GB": 16.188846800568893, "core_hours": 16.188846800568893} {"step": 40800, "global_schedule": 0.7936683893203735, "l2_grads": 1.161807656288147, "l2_params": 323.3246765136719, "l2_updates": 0.8088282942771912, "train/loss": 4.712829113006592, "uptime": 7601.732765727002, "examples_seen": 41779200.0, "progress": 0.36233492890953173, "epoch": 32.61026860666876, "img/sec/core": 745.829924176631, "core_hours_NVIDIA A100-SXM4-40GB": 16.207915789035564, "core_hours": 16.207915789035564} {"step": 40850, "global_schedule": 0.7930485010147095, "l2_grads": 1.10051429271698, "l2_params": 323.2868347167969, "l2_updates": 0.8371709585189819, "train/loss": 5.069376468658447, "uptime": 7610.959010643002, "examples_seen": 41830400.0, "progress": 0.36277896681260713, "epoch": 32.65023217113772, "img/sec/core": 693.6733262847515, "core_hours_NVIDIA A100-SXM4-40GB": 16.228418555515564, "core_hours": 16.228418555515564} {"step": 40900, "global_schedule": 0.7924279570579529, "l2_grads": 1.3276135921478271, "l2_params": 323.21783447265625, "l2_updates": 0.8527124524116516, "train/loss": 2.9439516067504883, "uptime": 7619.543381573001, "examples_seen": 41881600.0, "progress": 0.36322300471568253, "epoch": 32.69019573560668, "img/sec/core": 745.5409432081548, "core_hours_NVIDIA A100-SXM4-40GB": 16.247494935360006, "core_hours": 16.247494935360006} {"step": 40950, "global_schedule": 0.791806697845459, "l2_grads": 1.343039870262146, "l2_params": 323.18243408203125, "l2_updates": 0.8342443108558655, "train/loss": 2.525822877883911, "uptime": 7629.112712267999, "examples_seen": 41932800.0, "progress": 0.36366704261875793, "epoch": 32.730159300075634, "img/sec/core": 668.8033054752105, "core_hours_NVIDIA A100-SXM4-40GB": 16.268760114682223, "core_hours": 16.268760114682223} {"step": 41000, "global_schedule": 0.7911847829818726, "l2_grads": 1.4787031412124634, "l2_params": 323.1229553222656, "l2_updates": 0.8076024055480957, "train/loss": 2.5725748538970947, "uptime": 7638.562371252001, "examples_seen": 41984000.0, "progress": 0.36411108052183333, "epoch": 32.77012286454459, "img/sec/core": 677.2731175627715, "core_hours_NVIDIA A100-SXM4-40GB": 16.289759356868892, "core_hours": 16.289759356868892} {"step": 41050, "global_schedule": 0.7905621528625488, "l2_grads": 1.2263118028640747, "l2_params": 323.0461730957031, "l2_updates": 0.8016369342803955, "train/loss": 4.100872993469238, "uptime": 7648.637597344999, "examples_seen": 42035200.0, "progress": 0.36455511842490873, "epoch": 32.810086429013545, "img/sec/core": 697.1383423730349, "core_hours_NVIDIA A100-SXM4-40GB": 16.310160217584446, "core_hours": 16.310160217584446} {"step": 41100, "global_schedule": 0.7899389266967773, "l2_grads": 1.1700685024261475, "l2_params": 322.9845275878906, "l2_updates": 0.830967903137207, "train/loss": 4.293666362762451, "uptime": 7658.219745971999, "examples_seen": 42086400.0, "progress": 0.36499915632798413, "epoch": 32.85004999348251, "img/sec/core": 667.9086548466456, "core_hours_NVIDIA A100-SXM4-40GB": 16.3314538812, "core_hours": 16.3314538812} {"step": 41150, "global_schedule": 0.789314866065979, "l2_grads": 1.2248022556304932, "l2_params": 322.9383544921875, "l2_updates": 0.8119516968727112, "train/loss": 4.981888294219971, "uptime": 7667.348192359999, "examples_seen": 42137600.0, "progress": 0.3654431942310596, "epoch": 32.89001355795146, "img/sec/core": 701.1050651963242, "core_hours_NVIDIA A100-SXM4-40GB": 16.351739317617778, "core_hours": 16.351739317617778} {"step": 41200, "global_schedule": 0.7886902689933777, "l2_grads": 1.4574636220932007, "l2_params": 322.8697509765625, "l2_updates": 0.832241952419281, "train/loss": 2.6683244705200195, "uptime": 7676.584785661, "examples_seen": 42188800.0, "progress": 0.365887232134135, "epoch": 32.92997712242042, "img/sec/core": 692.8961567796571, "core_hours_NVIDIA A100-SXM4-40GB": 16.37226508050889, "core_hours": 16.37226508050889} {"step": 41250, "global_schedule": 0.7880649566650391, "l2_grads": 1.3008918762207031, "l2_params": 322.8146057128906, "l2_updates": 0.7982873320579529, "train/loss": 4.028952121734619, "uptime": 7686.179842202002, "examples_seen": 42240000.0, "progress": 0.3663312700372104, "epoch": 32.96994068688937, "img/sec/core": 667.0101392994578, "core_hours_NVIDIA A100-SXM4-40GB": 16.393587428377785, "core_hours": 16.393587428377785} {"step": 41300, "global_schedule": 0.7874389886856079, "l2_grads": 1.266114592552185, "l2_params": 322.7481384277344, "l2_updates": 0.8130061626434326, "train/loss": 3.5428061485290527, "uptime": 7696.346390975001, "examples_seen": 42291200.0, "progress": 0.3667753079402858, "epoch": 33.00990425135833, "img/sec/core": 629.5154966450048, "core_hours_NVIDIA A100-SXM4-40GB": 16.41617975898445, "core_hours": 16.41617975898445} {"step": 41350, "global_schedule": 0.7868122458457947, "l2_grads": 1.4162836074829102, "l2_params": 322.6933288574219, "l2_updates": 0.8310606479644775, "train/loss": 2.619736671447754, "uptime": 7704.868435590999, "examples_seen": 42342400.0, "progress": 0.3672193458433612, "epoch": 33.04986781582729, "img/sec/core": 750.9934867021668, "core_hours_NVIDIA A100-SXM4-40GB": 16.435117635908888, "core_hours": 16.435117635908888} {"step": 41400, "global_schedule": 0.7861849069595337, "l2_grads": 1.4633547067642212, "l2_params": 322.6592712402344, "l2_updates": 0.83162522315979, "train/loss": 2.5105371475219727, "uptime": 7713.888485352001, "examples_seen": 42393600.0, "progress": 0.3676633837464366, "epoch": 33.089831380296246, "img/sec/core": 709.5304537753393, "core_hours_NVIDIA A100-SXM4-40GB": 16.455162190933336, "core_hours": 16.455162190933336} {"step": 41450, "global_schedule": 0.7855569124221802, "l2_grads": 1.3774243593215942, "l2_params": 322.6156921386719, "l2_updates": 0.8343522548675537, "train/loss": 2.4233925342559814, "uptime": 7723.439574255002, "examples_seen": 42444800.0, "progress": 0.368107421649512, "epoch": 33.1297949447652, "img/sec/core": 670.0806646233854, "core_hours_NVIDIA A100-SXM4-40GB": 16.47638683294001, "core_hours": 16.47638683294001} {"step": 41500, "global_schedule": 0.7849282026290894, "l2_grads": 1.452125072479248, "l2_params": 322.560791015625, "l2_updates": 0.8360460996627808, "train/loss": 2.4700818061828613, "uptime": 7732.866692497, "examples_seen": 42496000.0, "progress": 0.3685514595525874, "epoch": 33.16975850923416, "img/sec/core": 678.8925136727255, "core_hours_NVIDIA A100-SXM4-40GB": 16.49733598458889, "core_hours": 16.49733598458889} {"step": 41550, "global_schedule": 0.7842988967895508, "l2_grads": 1.3954323530197144, "l2_params": 322.5173645019531, "l2_updates": 0.8257007598876953, "train/loss": 2.507230758666992, "uptime": 7742.325808519001, "examples_seen": 42547200.0, "progress": 0.3689954974556628, "epoch": 33.20972207370312, "img/sec/core": 676.5959932317601, "core_hours_NVIDIA A100-SXM4-40GB": 16.518356242415557, "core_hours": 16.518356242415557} {"step": 41600, "global_schedule": 0.7836688160896301, "l2_grads": 1.4411721229553223, "l2_params": 322.4773864746094, "l2_updates": 0.8211653828620911, "train/loss": 2.528012275695801, "uptime": 7751.948205603001, "examples_seen": 42598400.0, "progress": 0.36943953535873825, "epoch": 33.249685638172075, "img/sec/core": 665.1149338496708, "core_hours_NVIDIA A100-SXM4-40GB": 16.53973934704667, "core_hours": 16.53973934704667} {"step": 41650, "global_schedule": 0.7830381393432617, "l2_grads": 1.1805903911590576, "l2_params": 322.41552734375, "l2_updates": 0.8006047606468201, "train/loss": 4.073899745941162, "uptime": 7761.271104707999, "examples_seen": 42649600.0, "progress": 0.36988357326181365, "epoch": 33.28964920264103, "img/sec/core": 686.4817400596792, "core_hours_NVIDIA A100-SXM4-40GB": 16.560456900613335, "core_hours": 16.560456900613335} {"step": 41700, "global_schedule": 0.7824068069458008, "l2_grads": 1.4466090202331543, "l2_params": 322.3461608886719, "l2_updates": 0.8316649198532104, "train/loss": 2.4263007640838623, "uptime": 7770.772803586, "examples_seen": 42700800.0, "progress": 0.37032761116488905, "epoch": 33.329612767109985, "img/sec/core": 673.5637576157982, "core_hours_NVIDIA A100-SXM4-40GB": 16.58157178700889, "core_hours": 16.58157178700889} {"step": 41750, "global_schedule": 0.7817747592926025, "l2_grads": 1.6444662809371948, "l2_params": 322.2822265625, "l2_updates": 0.8013887405395508, "train/loss": 2.6146345138549805, "uptime": 7779.500368201001, "examples_seen": 42752000.0, "progress": 0.37077164906796445, "epoch": 33.36957633157894, "img/sec/core": 733.3088074764423, "core_hours_NVIDIA A100-SXM4-40GB": 16.600966375042226, "core_hours": 16.600966375042226} {"step": 41800, "global_schedule": 0.7811421155929565, "l2_grads": 1.2900454998016357, "l2_params": 322.2210693359375, "l2_updates": 0.817553699016571, "train/loss": 3.2613418102264404, "uptime": 7788.959154216, "examples_seen": 42803200.0, "progress": 0.37121568697103985, "epoch": 33.4095398960479, "img/sec/core": 676.6195989476491, "core_hours_NVIDIA A100-SXM4-40GB": 16.621985899520002, "core_hours": 16.621985899520002} {"step": 41850, "global_schedule": 0.7805087566375732, "l2_grads": 1.3333475589752197, "l2_params": 322.1469421386719, "l2_updates": 0.81748366355896, "train/loss": 2.384843587875366, "uptime": 7798.603923954999, "examples_seen": 42854400.0, "progress": 0.37165972487411525, "epoch": 33.44950346051686, "img/sec/core": 663.5720886234379, "core_hours_NVIDIA A100-SXM4-40GB": 16.643418721162224, "core_hours": 16.643418721162224} {"step": 41900, "global_schedule": 0.7798748016357422, "l2_grads": 1.529276967048645, "l2_params": 322.0968933105469, "l2_updates": 0.8168540596961975, "train/loss": 2.594043016433716, "uptime": 7807.707317762002, "examples_seen": 42905600.0, "progress": 0.37210376277719065, "epoch": 33.489467024985814, "img/sec/core": 703.0345095118854, "core_hours_NVIDIA A100-SXM4-40GB": 16.663648485177784, "core_hours": 16.663648485177784} {"step": 41950, "global_schedule": 0.7792401313781738, "l2_grads": 1.2130298614501953, "l2_params": 322.00091552734375, "l2_updates": 0.8109654784202576, "train/loss": 3.681950330734253, "uptime": 7816.915216804, "examples_seen": 42956800.0, "progress": 0.37254780068026605, "epoch": 33.52943058945477, "img/sec/core": 695.0554052351408, "core_hours_NVIDIA A100-SXM4-40GB": 16.68411048304889, "core_hours": 16.68411048304889} {"step": 42000, "global_schedule": 0.7786048054695129, "l2_grads": 1.4174811840057373, "l2_params": 321.9633483886719, "l2_updates": 0.817421019077301, "train/loss": 2.666393518447876, "uptime": 7826.333142998001, "examples_seen": 43008000.0, "progress": 0.37299183858334145, "epoch": 33.569394153923724, "img/sec/core": 679.5551237253077, "core_hours_NVIDIA A100-SXM4-40GB": 16.705039207924447, "core_hours": 16.705039207924447} {"step": 42050, "global_schedule": 0.7779688835144043, "l2_grads": 1.273331880569458, "l2_params": 321.89813232421875, "l2_updates": 0.8058263063430786, "train/loss": 3.8848178386688232, "uptime": 7835.260973385002, "examples_seen": 43059200.0, "progress": 0.3734358764864169, "epoch": 33.60935771839269, "img/sec/core": 775.7188762240837, "core_hours_NVIDIA A100-SXM4-40GB": 16.72337345588223, "core_hours": 16.72337345588223} {"step": 42100, "global_schedule": 0.7773322463035583, "l2_grads": 1.1970081329345703, "l2_params": 321.8297119140625, "l2_updates": 0.8183761835098267, "train/loss": 4.640352725982666, "uptime": 7844.435701361001, "examples_seen": 43110400.0, "progress": 0.3738799143894923, "epoch": 33.64932128286164, "img/sec/core": 697.5683657044395, "core_hours_NVIDIA A100-SXM4-40GB": 16.743761740273335, "core_hours": 16.743761740273335} {"step": 42150, "global_schedule": 0.7766950130462646, "l2_grads": 1.3503994941711426, "l2_params": 321.7480163574219, "l2_updates": 0.8033633828163147, "train/loss": 2.7340378761291504, "uptime": 7853.846804867999, "examples_seen": 43161600.0, "progress": 0.3743239522925677, "epoch": 33.6892848473306, "img/sec/core": 680.0477749756867, "core_hours_NVIDIA A100-SXM4-40GB": 16.76467530362222, "core_hours": 16.76467530362222} {"step": 42200, "global_schedule": 0.7760571241378784, "l2_grads": 1.479624629020691, "l2_params": 321.7085876464844, "l2_updates": 0.8385938405990601, "train/loss": 2.527515411376953, "uptime": 7863.166615289001, "examples_seen": 43212800.0, "progress": 0.3747679901956431, "epoch": 33.72924841179955, "img/sec/core": 686.709247387426, "core_hours_NVIDIA A100-SXM4-40GB": 16.78538599344667, "core_hours": 16.78538599344667} {"step": 42250, "global_schedule": 0.7754185199737549, "l2_grads": 1.2496349811553955, "l2_params": 321.675537109375, "l2_updates": 0.8086211085319519, "train/loss": 4.15412712097168, "uptime": 7872.740822149002, "examples_seen": 43264000.0, "progress": 0.3752120280987185, "epoch": 33.76921197626851, "img/sec/core": 668.4626824533889, "core_hours_NVIDIA A100-SXM4-40GB": 16.806662008691116, "core_hours": 16.806662008691116} {"step": 42300, "global_schedule": 0.7747793197631836, "l2_grads": 1.3051762580871582, "l2_params": 321.62408447265625, "l2_updates": 0.8116633892059326, "train/loss": 3.999657154083252, "uptime": 7882.2912843409995, "examples_seen": 43315200.0, "progress": 0.3756560660017939, "epoch": 33.80917554073747, "img/sec/core": 670.124635995404, "core_hours_NVIDIA A100-SXM4-40GB": 16.827885258006667, "core_hours": 16.827885258006667} {"step": 42350, "global_schedule": 0.7741395235061646, "l2_grads": 1.4522684812545776, "l2_params": 321.55718994140625, "l2_updates": 0.805978536605835, "train/loss": 2.529651641845703, "uptime": 7891.740688275999, "examples_seen": 43366400.0, "progress": 0.3761001039048693, "epoch": 33.849139105206426, "img/sec/core": 677.2913978515923, "core_hours_NVIDIA A100-SXM4-40GB": 16.848883933417774, "core_hours": 16.848883933417774} {"step": 42400, "global_schedule": 0.7734990119934082, "l2_grads": 1.4140796661376953, "l2_params": 321.4949645996094, "l2_updates": 0.8146257996559143, "train/loss": 2.494899272918701, "uptime": 7900.351732688001, "examples_seen": 43417600.0, "progress": 0.3765441418079447, "epoch": 33.88910266967538, "img/sec/core": 743.2315633025379, "core_hours_NVIDIA A100-SXM4-40GB": 16.86801958766667, "core_hours": 16.86801958766667} {"step": 42450, "global_schedule": 0.7728579044342041, "l2_grads": 1.450837254524231, "l2_params": 321.4466857910156, "l2_updates": 0.7937039732933044, "train/loss": 2.454315185546875, "uptime": 7908.936748622002, "examples_seen": 43468800.0, "progress": 0.3769881797110201, "epoch": 33.92906623414434, "img/sec/core": 745.4849296962857, "core_hours_NVIDIA A100-SXM4-40GB": 16.887097400853335, "core_hours": 16.887097400853335} {"step": 42500, "global_schedule": 0.7722162008285522, "l2_grads": 1.3510037660598755, "l2_params": 321.38555908203125, "l2_updates": 0.8153182864189148, "train/loss": 2.6264350414276123, "uptime": 7917.557297347999, "examples_seen": 43520000.0, "progress": 0.37743221761409557, "epoch": 33.9690297986133, "img/sec/core": 742.4121367934536, "core_hours_NVIDIA A100-SXM4-40GB": 16.906254175799997, "core_hours": 16.906254175799997, "val/acc@1": 0.62866, "val/loss": 1.5580347778320311, "z/secs/eval/val": 2.5868717590019514} {"step": 42550, "global_schedule": 0.7715737819671631, "l2_grads": 1.1464186906814575, "l2_params": 321.34161376953125, "l2_updates": 0.7970001697540283, "train/loss": 4.161016464233398, "uptime": 7929.883716504, "examples_seen": 43571200.0, "progress": 0.37787625551717097, "epoch": 34.008993363082254, "img/sec/core": 657.1768285789235, "core_hours_NVIDIA A100-SXM4-40GB": 16.927895569111104, "core_hours": 16.927895569111104} {"step": 42600, "global_schedule": 0.7709307074546814, "l2_grads": 1.2394828796386719, "l2_params": 321.2666320800781, "l2_updates": 0.8075630068778992, "train/loss": 2.9242677688598633, "uptime": 7938.388215663001, "examples_seen": 43622400.0, "progress": 0.37832029342024637, "epoch": 34.04895692755121, "img/sec/core": 752.5428458919791, "core_hours_NVIDIA A100-SXM4-40GB": 16.946794456131105, "core_hours": 16.946794456131105} {"step": 42650, "global_schedule": 0.770287036895752, "l2_grads": 1.187852144241333, "l2_params": 321.22711181640625, "l2_updates": 0.8060871362686157, "train/loss": 4.854037284851074, "uptime": 7946.919980143002, "examples_seen": 43673600.0, "progress": 0.37876433132332177, "epoch": 34.088920492020165, "img/sec/core": 750.1379128551391, "core_hours_NVIDIA A100-SXM4-40GB": 16.965753932753334, "core_hours": 16.965753932753334} {"step": 42700, "global_schedule": 0.76964271068573, "l2_grads": 1.5081650018692017, "l2_params": 321.1941223144531, "l2_updates": 0.801971971988678, "train/loss": 2.4939653873443604, "uptime": 7955.968246781, "examples_seen": 43724800.0, "progress": 0.37920836922639717, "epoch": 34.12888405648912, "img/sec/core": 707.317794230735, "core_hours_NVIDIA A100-SXM4-40GB": 16.98586119194888, "core_hours": 16.98586119194888} {"step": 42750, "global_schedule": 0.7689977884292603, "l2_grads": 1.3977687358856201, "l2_params": 321.1159973144531, "l2_updates": 0.8397531509399414, "train/loss": 2.450639247894287, "uptime": 7964.740590754, "examples_seen": 43776000.0, "progress": 0.37965240712947257, "epoch": 34.16884762095808, "img/sec/core": 729.5655550783703, "core_hours_NVIDIA A100-SXM4-40GB": 17.00535528966666, "core_hours": 17.00535528966666} {"step": 42800, "global_schedule": 0.768352210521698, "l2_grads": 1.2069743871688843, "l2_params": 321.0841979980469, "l2_updates": 0.8114586472511292, "train/loss": 3.419318914413452, "uptime": 7973.809738072001, "examples_seen": 43827200.0, "progress": 0.38009644503254797, "epoch": 34.20881118542704, "img/sec/core": 705.689275473191, "core_hours_NVIDIA A100-SXM4-40GB": 17.02550895037333, "core_hours": 17.02550895037333} {"step": 42850, "global_schedule": 0.767706036567688, "l2_grads": 1.4082132577896118, "l2_params": 321.0059814453125, "l2_updates": 0.8165206909179688, "train/loss": 2.4381420612335205, "uptime": 7982.733363513, "examples_seen": 43878400.0, "progress": 0.38054048293562337, "epoch": 34.24877474989599, "img/sec/core": 717.1972918759809, "core_hours_NVIDIA A100-SXM4-40GB": 17.045339229131102, "core_hours": 17.045339229131102} {"step": 42900, "global_schedule": 0.7670592069625854, "l2_grads": 1.3781189918518066, "l2_params": 320.96014404296875, "l2_updates": 0.8030983805656433, "train/loss": 2.9063973426818848, "uptime": 7991.311167449001, "examples_seen": 43929600.0, "progress": 0.38098452083869877, "epoch": 34.28873831436495, "img/sec/core": 746.111714344405, "core_hours_NVIDIA A100-SXM4-40GB": 17.06440101565555, "core_hours": 17.06440101565555} {"step": 42950, "global_schedule": 0.7664117217063904, "l2_grads": 1.4247406721115112, "l2_params": 320.8940734863281, "l2_updates": 0.816819429397583, "train/loss": 2.470054864883423, "uptime": 7999.951267131999, "examples_seen": 43980800.0, "progress": 0.38142855874177417, "epoch": 34.328701878833904, "img/sec/core": 740.7321946289521, "core_hours_NVIDIA A100-SXM4-40GB": 17.083601237173323, "core_hours": 17.083601237173323} {"step": 43000, "global_schedule": 0.7657636404037476, "l2_grads": 1.1609188318252563, "l2_params": 320.8390808105469, "l2_updates": 0.7953509092330933, "train/loss": 4.426610946655273, "uptime": 8009.5479421280015, "examples_seen": 44032000.0, "progress": 0.3818725966448496, "epoch": 34.368665443302866, "img/sec/core": 666.8976497240858, "core_hours_NVIDIA A100-SXM4-40GB": 17.104927181608886, "core_hours": 17.104927181608886} {"step": 43050, "global_schedule": 0.765114963054657, "l2_grads": 1.4147461652755737, "l2_params": 320.78082275390625, "l2_updates": 0.8083110451698303, "train/loss": 2.480839252471924, "uptime": 8019.160396737001, "examples_seen": 44083200.0, "progress": 0.382316634547925, "epoch": 34.40862900777182, "img/sec/core": 715.7093823814483, "core_hours_NVIDIA A100-SXM4-40GB": 17.12479868612221, "core_hours": 17.12479868612221} {"step": 43100, "global_schedule": 0.7644656896591187, "l2_grads": 1.5032321214675903, "l2_params": 320.7002258300781, "l2_updates": 0.7846925854682922, "train/loss": 2.543267250061035, "uptime": 8028.274864469002, "examples_seen": 44134400.0, "progress": 0.3827606724510004, "epoch": 34.44859257224078, "img/sec/core": 702.1803344072067, "core_hours_NVIDIA A100-SXM4-40GB": 17.145053058859993, "core_hours": 17.145053058859993} {"step": 43150, "global_schedule": 0.7638157606124878, "l2_grads": 1.3915631771087646, "l2_params": 320.64251708984375, "l2_updates": 0.8162745237350464, "train/loss": 2.52447509765625, "uptime": 8037.805461640002, "examples_seen": 44185600.0, "progress": 0.38320471035407583, "epoch": 34.48855613670973, "img/sec/core": 671.5214047104882, "core_hours_NVIDIA A100-SXM4-40GB": 17.166232163684434, "core_hours": 17.166232163684434} {"step": 43200, "global_schedule": 0.7631651163101196, "l2_grads": 1.1309747695922852, "l2_params": 320.585693359375, "l2_updates": 0.7976899743080139, "train/loss": 4.817435264587402, "uptime": 8047.330726770002, "examples_seen": 44236800.0, "progress": 0.38364874825715123, "epoch": 34.52851970117869, "img/sec/core": 671.8973081225054, "core_hours_NVIDIA A100-SXM4-40GB": 17.18739941952888, "core_hours": 17.18739941952888} {"step": 43250, "global_schedule": 0.7625139951705933, "l2_grads": 1.472632884979248, "l2_params": 320.5273132324219, "l2_updates": 0.8011101484298706, "train/loss": 2.5224008560180664, "uptime": 8056.811930739999, "examples_seen": 44288000.0, "progress": 0.38409278616022663, "epoch": 34.56848326564765, "img/sec/core": 675.0197570110735, "core_hours_NVIDIA A100-SXM4-40GB": 17.208468761684426, "core_hours": 17.208468761684426} {"step": 43300, "global_schedule": 0.7618621587753296, "l2_grads": 1.2778801918029785, "l2_params": 320.4690246582031, "l2_updates": 0.7918902039527893, "train/loss": 4.969446182250977, "uptime": 8066.125313777002, "examples_seen": 44339200.0, "progress": 0.38453682406330203, "epoch": 34.608446830116605, "img/sec/core": 687.1831615399591, "core_hours_NVIDIA A100-SXM4-40GB": 17.229165168433322, "core_hours": 17.229165168433322} {"step": 43350, "global_schedule": 0.7612098455429077, "l2_grads": 1.4692199230194092, "l2_params": 320.4047546386719, "l2_updates": 0.798565149307251, "train/loss": 2.402844190597534, "uptime": 8075.577359975001, "examples_seen": 44390400.0, "progress": 0.38498086196637743, "epoch": 34.64841039458556, "img/sec/core": 677.1020650909195, "core_hours_NVIDIA A100-SXM4-40GB": 17.250169715539986, "core_hours": 17.250169715539986} {"step": 43400, "global_schedule": 0.7605568170547485, "l2_grads": 1.4793070554733276, "l2_params": 320.3309631347656, "l2_updates": 0.7935911417007446, "train/loss": 2.95222806930542, "uptime": 8085.056601773, "examples_seen": 44441600.0, "progress": 0.38542489986945283, "epoch": 34.688373959054516, "img/sec/core": 675.1594838894291, "core_hours_NVIDIA A100-SXM4-40GB": 17.271234697313318, "core_hours": 17.271234697313318} {"step": 43450, "global_schedule": 0.7599031329154968, "l2_grads": 1.2427059412002563, "l2_params": 320.2918701171875, "l2_updates": 0.8019967675209045, "train/loss": 3.6369986534118652, "uptime": 8094.446401553001, "examples_seen": 44492800.0, "progress": 0.3858689377725283, "epoch": 34.72833752352348, "img/sec/core": 681.5906781772813, "core_hours_NVIDIA A100-SXM4-40GB": 17.292100919046657, "core_hours": 17.292100919046657} {"step": 43500, "global_schedule": 0.7592489123344421, "l2_grads": 1.415937900543213, "l2_params": 320.2203674316406, "l2_updates": 0.8156405091285706, "train/loss": 2.5140180587768555, "uptime": 8103.914211161, "examples_seen": 44544000.0, "progress": 0.3863129756756037, "epoch": 34.768301087992434, "img/sec/core": 675.9747254098795, "core_hours_NVIDIA A100-SXM4-40GB": 17.313140495953316, "core_hours": 17.313140495953316} {"step": 43550, "global_schedule": 0.7585940361022949, "l2_grads": 1.1979271173477173, "l2_params": 320.1890563964844, "l2_updates": 0.7970647811889648, "train/loss": 4.231059551239014, "uptime": 8112.452738332, "examples_seen": 44595200.0, "progress": 0.3867570135786791, "epoch": 34.80826465246139, "img/sec/core": 749.5437880360261, "core_hours_NVIDIA A100-SXM4-40GB": 17.332115000777765, "core_hours": 17.332115000777765} {"step": 43600, "global_schedule": 0.7579386234283447, "l2_grads": 1.4465405941009521, "l2_params": 320.1128234863281, "l2_updates": 0.811107873916626, "train/loss": 2.4168734550476074, "uptime": 8121.360985998001, "examples_seen": 44646400.0, "progress": 0.3872010514817545, "epoch": 34.848228216930345, "img/sec/core": 718.4353466536879, "core_hours_NVIDIA A100-SXM4-40GB": 17.35191110670221, "core_hours": 17.35191110670221} {"step": 43650, "global_schedule": 0.757282555103302, "l2_grads": 1.4158871173858643, "l2_params": 320.0520935058594, "l2_updates": 0.8049402236938477, "train/loss": 2.4793405532836914, "uptime": 8130.806248383002, "examples_seen": 44697600.0, "progress": 0.3876450893848299, "epoch": 34.8881917813993, "img/sec/core": 677.588375963284, "core_hours_NVIDIA A100-SXM4-40GB": 17.372900578668876, "core_hours": 17.372900578668876} {"step": 43700, "global_schedule": 0.7566258907318115, "l2_grads": 1.463790774345398, "l2_params": 320.00787353515625, "l2_updates": 0.7865238189697266, "train/loss": 2.329645872116089, "uptime": 8140.231496454, "examples_seen": 44748800.0, "progress": 0.3880891272879053, "epoch": 34.92815534586826, "img/sec/core": 679.0272204816455, "core_hours_NVIDIA A100-SXM4-40GB": 17.39384557438221, "core_hours": 17.39384557438221} {"step": 43750, "global_schedule": 0.7559686899185181, "l2_grads": 1.3544485569000244, "l2_params": 319.9374694824219, "l2_updates": 0.8029760718345642, "train/loss": 2.6350417137145996, "uptime": 8149.699002734002, "examples_seen": 44800000.0, "progress": 0.3885331651909807, "epoch": 34.96811891033722, "img/sec/core": 675.9963828615445, "core_hours_NVIDIA A100-SXM4-40GB": 17.414884477226657, "core_hours": 17.414884477226657} {"step": 43800, "global_schedule": 0.7553107738494873, "l2_grads": 1.4195700883865356, "l2_params": 319.88629150390625, "l2_updates": 0.7882620692253113, "train/loss": 2.32210636138916, "uptime": 8160.010118496999, "examples_seen": 44851200.0, "progress": 0.3889772030940561, "epoch": 35.00808247480617, "img/sec/core": 620.6893751466883, "core_hours_NVIDIA A100-SXM4-40GB": 17.437798067811094, "core_hours": 17.437798067811094} {"step": 43850, "global_schedule": 0.7546523809432983, "l2_grads": 1.3341546058654785, "l2_params": 319.814697265625, "l2_updates": 0.8011406660079956, "train/loss": 2.82075834274292, "uptime": 8168.885368206002, "examples_seen": 44902400.0, "progress": 0.3894212409971315, "epoch": 35.04804603927513, "img/sec/core": 721.1064713489823, "core_hours_NVIDIA A100-SXM4-40GB": 17.457520844942213, "core_hours": 17.457520844942213} {"step": 43900, "global_schedule": 0.7539932727813721, "l2_grads": 1.2178047895431519, "l2_params": 319.7489929199219, "l2_updates": 0.7774056196212769, "train/loss": 3.9394750595092773, "uptime": 8177.597946419, "examples_seen": 44953600.0, "progress": 0.38986527890020695, "epoch": 35.088009603744084, "img/sec/core": 734.5701632212018, "core_hours_NVIDIA A100-SXM4-40GB": 17.476882129859987, "core_hours": 17.476882129859987} {"step": 43950, "global_schedule": 0.7533336877822876, "l2_grads": 1.3623486757278442, "l2_params": 319.69268798828125, "l2_updates": 0.7765448689460754, "train/loss": 3.1350131034851074, "uptime": 8186.892279161, "examples_seen": 45004800.0, "progress": 0.39030931680328235, "epoch": 35.127973168213046, "img/sec/core": 688.5916587727994, "core_hours_NVIDIA A100-SXM4-40GB": 17.497536202619987, "core_hours": 17.497536202619987} {"step": 44000, "global_schedule": 0.7526733875274658, "l2_grads": 1.5523957014083862, "l2_params": 319.649169921875, "l2_updates": 0.7813239097595215, "train/loss": 2.45247220993042, "uptime": 8195.640428952001, "examples_seen": 45056000.0, "progress": 0.39075335470635775, "epoch": 35.167936732682, "img/sec/core": 731.5832665077791, "core_hours_NVIDIA A100-SXM4-40GB": 17.51697653548888, "core_hours": 17.51697653548888} {"step": 44050, "global_schedule": 0.7520124912261963, "l2_grads": 1.3383989334106445, "l2_params": 319.5976867675781, "l2_updates": 0.8043392300605774, "train/loss": 2.4362986087799072, "uptime": 8205.132598726, "examples_seen": 45107200.0, "progress": 0.39119739260943315, "epoch": 35.20790029715096, "img/sec/core": 757.4954967676991, "core_hours_NVIDIA A100-SXM4-40GB": 17.535751857959983, "core_hours": 17.535751857959983} {"step": 44100, "global_schedule": 0.7513511180877686, "l2_grads": 1.2423903942108154, "l2_params": 319.5426025390625, "l2_updates": 0.7873994708061218, "train/loss": 4.240836143493652, "uptime": 8213.98198553, "examples_seen": 45158400.0, "progress": 0.39164143051250855, "epoch": 35.24786386161991, "img/sec/core": 723.2139516274876, "core_hours_NVIDIA A100-SXM4-40GB": 17.55541716196887, "core_hours": 17.55541716196887} {"step": 44150, "global_schedule": 0.7506890892982483, "l2_grads": 1.431003212928772, "l2_params": 319.48394775390625, "l2_updates": 0.7907448410987854, "train/loss": 2.5628161430358887, "uptime": 8223.417031146002, "examples_seen": 45209600.0, "progress": 0.39208546841558395, "epoch": 35.28782742608887, "img/sec/core": 678.3221046801277, "core_hours_NVIDIA A100-SXM4-40GB": 17.57638393000443, "core_hours": 17.57638393000443} {"step": 44200, "global_schedule": 0.750026524066925, "l2_grads": 1.3828908205032349, "l2_params": 319.4231872558594, "l2_updates": 0.78605717420578, "train/loss": 2.9388890266418457, "uptime": 8232.973541244, "examples_seen": 45260800.0, "progress": 0.39252950631865935, "epoch": 35.32779099055783, "img/sec/core": 669.7005428101284, "core_hours_NVIDIA A100-SXM4-40GB": 17.59762061911109, "core_hours": 17.59762061911109} {"step": 44250, "global_schedule": 0.7493633031845093, "l2_grads": 1.472476601600647, "l2_params": 319.353271484375, "l2_updates": 0.7889904975891113, "train/loss": 2.32893705368042, "uptime": 8242.493819723999, "examples_seen": 45312000.0, "progress": 0.39297354422173475, "epoch": 35.367754555026785, "img/sec/core": 672.2492428604875, "core_hours_NVIDIA A100-SXM4-40GB": 17.61877679351109, "core_hours": 17.61877679351109} {"step": 44300, "global_schedule": 0.7486995458602905, "l2_grads": 1.4020726680755615, "l2_params": 319.29150390625, "l2_updates": 0.8089859485626221, "train/loss": 2.370352268218994, "uptime": 8251.712945248002, "examples_seen": 45363200.0, "progress": 0.39341758212481015, "epoch": 35.40771811949574, "img/sec/core": 694.2090096654807, "core_hours_NVIDIA A100-SXM4-40GB": 17.639263739119986, "core_hours": 17.639263739119986} {"step": 44350, "global_schedule": 0.748035192489624, "l2_grads": 1.4993493556976318, "l2_params": 319.24310302734375, "l2_updates": 0.7973264455795288, "train/loss": 2.59978985786438, "uptime": 8260.133277708, "examples_seen": 45414400.0, "progress": 0.3938616200278856, "epoch": 35.447681683964696, "img/sec/core": 760.0650010440525, "core_hours_NVIDIA A100-SXM4-40GB": 17.657975589031093, "core_hours": 17.657975589031093} {"step": 44400, "global_schedule": 0.7473702430725098, "l2_grads": 1.3860175609588623, "l2_params": 319.1731262207031, "l2_updates": 0.7716149687767029, "train/loss": 4.784049034118652, "uptime": 8268.487549694999, "examples_seen": 45465600.0, "progress": 0.394305657930961, "epoch": 35.48764524843365, "img/sec/core": 766.0751301801325, "core_hours_NVIDIA A100-SXM4-40GB": 17.67654063789109, "core_hours": 17.67654063789109} {"step": 44450, "global_schedule": 0.7467047572135925, "l2_grads": 1.262424349784851, "l2_params": 319.0999755859375, "l2_updates": 0.7663848996162415, "train/loss": 4.911567687988281, "uptime": 8277.115935336, "examples_seen": 45516800.0, "progress": 0.3947496958340364, "epoch": 35.52760881290261, "img/sec/core": 741.7378251602545, "core_hours_NVIDIA A100-SXM4-40GB": 17.695714828204423, "core_hours": 17.695714828204423} {"step": 44500, "global_schedule": 0.7460386753082275, "l2_grads": 1.4369192123413086, "l2_params": 319.0356750488281, "l2_updates": 0.7983148694038391, "train/loss": 2.330413818359375, "uptime": 8285.757954695002, "examples_seen": 45568000.0, "progress": 0.3951937337371118, "epoch": 35.56757237737157, "img/sec/core": 740.5676537085519, "core_hours_NVIDIA A100-SXM4-40GB": 17.714919315668872, "core_hours": 17.714919315668872} {"step": 44550, "global_schedule": 0.7453719973564148, "l2_grads": 1.4944664239883423, "l2_params": 319.01165771484375, "l2_updates": 0.7999182939529419, "train/loss": 2.339207887649536, "uptime": 8294.711241874002, "examples_seen": 45619200.0, "progress": 0.3956377716401872, "epoch": 35.607535941840524, "img/sec/core": 714.8212574942786, "core_hours_NVIDIA A100-SXM4-40GB": 17.734815509399983, "core_hours": 17.734815509399983} {"step": 44600, "global_schedule": 0.7447047233581543, "l2_grads": 1.2531912326812744, "l2_params": 318.96099853515625, "l2_updates": 0.7765370607376099, "train/loss": 4.301729679107666, "uptime": 8303.876672428001, "examples_seen": 45670400.0, "progress": 0.3960818095432626, "epoch": 35.64749950630948, "img/sec/core": 698.2759797582195, "core_hours_NVIDIA A100-SXM4-40GB": 17.755183132853315, "core_hours": 17.755183132853315} {"step": 44650, "global_schedule": 0.7440369129180908, "l2_grads": 1.338020920753479, "l2_params": 318.900634765625, "l2_updates": 0.8019206523895264, "train/loss": 2.6112523078918457, "uptime": 8313.281082731, "examples_seen": 45721600.0, "progress": 0.396525847446338, "epoch": 35.68746307077844, "img/sec/core": 680.5317711370984, "core_hours_NVIDIA A100-SXM4-40GB": 17.776081822415538, "core_hours": 17.776081822415538} {"step": 44700, "global_schedule": 0.7433685064315796, "l2_grads": 1.2050859928131104, "l2_params": 318.8577880859375, "l2_updates": 0.7957329750061035, "train/loss": 3.274644374847412, "uptime": 8322.698282203999, "examples_seen": 45772800.0, "progress": 0.3969698853494134, "epoch": 35.7274266352474, "img/sec/core": 679.6075646852701, "core_hours_NVIDIA A100-SXM4-40GB": 17.797008932355535, "core_hours": 17.797008932355535} {"step": 44750, "global_schedule": 0.7426995038986206, "l2_grads": 1.3157819509506226, "l2_params": 318.77362060546875, "l2_updates": 0.7730906009674072, "train/loss": 4.876862049102783, "uptime": 8331.382354412, "examples_seen": 45824000.0, "progress": 0.3974139232524888, "epoch": 35.76739019971635, "img/sec/core": 736.981435288283, "core_hours_NVIDIA A100-SXM4-40GB": 17.816306870595536, "core_hours": 17.816306870595536} {"step": 44800, "global_schedule": 0.7420300245285034, "l2_grads": 1.3689950704574585, "l2_params": 318.70782470703125, "l2_updates": 0.7569191455841064, "train/loss": 2.9777657985687256, "uptime": 8339.976919171999, "examples_seen": 45875200.0, "progress": 0.39785796115556427, "epoch": 35.80735376418531, "img/sec/core": 744.6566729926241, "core_hours_NVIDIA A100-SXM4-40GB": 17.835405903395536, "core_hours": 17.835405903395536} {"step": 44850, "global_schedule": 0.7413598895072937, "l2_grads": 1.3737515211105347, "l2_params": 318.6135559082031, "l2_updates": 0.7822932600975037, "train/loss": 2.3087925910949707, "uptime": 8348.574997186, "examples_seen": 45926400.0, "progress": 0.39830199905863967, "epoch": 35.84731732865426, "img/sec/core": 744.3523994057547, "core_hours_NVIDIA A100-SXM4-40GB": 17.85451274342665, "core_hours": 17.85451274342665} {"step": 44900, "global_schedule": 0.740689218044281, "l2_grads": 1.475502848625183, "l2_params": 318.5365295410156, "l2_updates": 0.758460521697998, "train/loss": 2.5264475345611572, "uptime": 8357.305986256999, "examples_seen": 45977600.0, "progress": 0.39874603696171507, "epoch": 35.887280893123226, "img/sec/core": 733.0211901488609, "core_hours_NVIDIA A100-SXM4-40GB": 17.8739149413622, "core_hours": 17.8739149413622} {"step": 44950, "global_schedule": 0.7400180101394653, "l2_grads": 1.4512393474578857, "l2_params": 318.4662780761719, "l2_updates": 0.7575368285179138, "train/loss": 2.5801162719726562, "uptime": 8365.757856633, "examples_seen": 46028800.0, "progress": 0.39919007486479047, "epoch": 35.92724445759218, "img/sec/core": 757.2288399231911, "core_hours_NVIDIA A100-SXM4-40GB": 17.89269687553109, "core_hours": 17.89269687553109} {"step": 45000, "global_schedule": 0.7393462657928467, "l2_grads": 1.4423199892044067, "l2_params": 318.3805236816406, "l2_updates": 0.7889000177383423, "train/loss": 2.6271486282348633, "uptime": 8374.367086795, "examples_seen": 46080000.0, "progress": 0.39963411276786587, "epoch": 35.967208022061136, "img/sec/core": 743.3881868146559, "core_hours_NVIDIA A100-SXM4-40GB": 17.911828498113316, "core_hours": 17.911828498113316, "val/acc@1": 0.63884, "val/loss": 1.4873578198242188, "z/secs/eval/val": 2.522909344999789} {"step": 45050, "global_schedule": 0.7386739253997803, "l2_grads": 1.4079539775848389, "l2_params": 318.3105163574219, "l2_updates": 0.7591718435287476, "train/loss": 2.9930763244628906, "uptime": 8387.52313063, "examples_seen": 46131200.0, "progress": 0.40007815067094127, "epoch": 36.00717158653009, "img/sec/core": 658.5455725981224, "core_hours_NVIDIA A100-SXM4-40GB": 17.933424911199975, "core_hours": 17.933424911199975} {"step": 45100, "global_schedule": 0.7380009889602661, "l2_grads": 1.535129427909851, "l2_params": 318.2394714355469, "l2_updates": 0.7584422826766968, "train/loss": 2.462080955505371, "uptime": 8397.087374872002, "examples_seen": 46182400.0, "progress": 0.40052218857401667, "epoch": 36.04713515099905, "img/sec/core": 669.1589882129198, "core_hours_NVIDIA A100-SXM4-40GB": 17.954678787293314, "core_hours": 17.954678787293314} {"step": 45150, "global_schedule": 0.7373275756835938, "l2_grads": 1.5051393508911133, "l2_params": 318.1831359863281, "l2_updates": 0.7726972699165344, "train/loss": 2.427859306335449, "uptime": 8406.503280456001, "examples_seen": 46233600.0, "progress": 0.40096622647709207, "epoch": 36.08709871546801, "img/sec/core": 679.7009531272079, "core_hours_NVIDIA A100-SXM4-40GB": 17.975603021924428, "core_hours": 17.975603021924428} {"step": 45200, "global_schedule": 0.7366535067558289, "l2_grads": 1.5062333345413208, "l2_params": 318.1163635253906, "l2_updates": 0.7669471502304077, "train/loss": 2.4580893516540527, "uptime": 8415.680074818001, "examples_seen": 46284800.0, "progress": 0.40141026438016747, "epoch": 36.127062279936965, "img/sec/core": 697.4112906465226, "core_hours_NVIDIA A100-SXM4-40GB": 17.995995898284427, "core_hours": 17.995995898284427} {"step": 45250, "global_schedule": 0.735978901386261, "l2_grads": 1.5009753704071045, "l2_params": 318.05010986328125, "l2_updates": 0.7585861682891846, "train/loss": 2.362200975418091, "uptime": 8424.096083475002, "examples_seen": 46336000.0, "progress": 0.40185430228324287, "epoch": 36.16702584440592, "img/sec/core": 760.4554915323316, "core_hours_NVIDIA A100-SXM4-40GB": 18.01469813974443, "core_hours": 18.01469813974443} {"step": 45300, "global_schedule": 0.7353037595748901, "l2_grads": 1.2249442338943481, "l2_params": 317.97802734375, "l2_updates": 0.7798839211463928, "train/loss": 4.634238243103027, "uptime": 8432.678588597, "examples_seen": 46387200.0, "progress": 0.4022983401863183, "epoch": 36.206989408874875, "img/sec/core": 745.7030213236858, "core_hours_NVIDIA A100-SXM4-40GB": 18.03377037334887, "core_hours": 18.03377037334887} {"step": 45350, "global_schedule": 0.7346280813217163, "l2_grads": 1.3873958587646484, "l2_params": 317.9313049316406, "l2_updates": 0.7826877236366272, "train/loss": 2.512925863265991, "uptime": 8442.121117027002, "examples_seen": 46438400.0, "progress": 0.4027423780893937, "epoch": 36.24695297334383, "img/sec/core": 677.7845624129139, "core_hours_NVIDIA A100-SXM4-40GB": 18.054753769859982, "core_hours": 18.054753769859982} {"step": 45400, "global_schedule": 0.7339518666267395, "l2_grads": 1.434624195098877, "l2_params": 317.86297607421875, "l2_updates": 0.7754623293876648, "train/loss": 2.3511080741882324, "uptime": 8450.735607992001, "examples_seen": 46489600.0, "progress": 0.4031864159924691, "epoch": 36.28691653781279, "img/sec/core": 742.9342053991622, "core_hours_NVIDIA A100-SXM4-40GB": 18.073897083115536, "core_hours": 18.073897083115536} {"step": 45450, "global_schedule": 0.7332750558853149, "l2_grads": 1.1890249252319336, "l2_params": 317.7825622558594, "l2_updates": 0.7584934234619141, "train/loss": 4.435338973999023, "uptime": 8459.821961782001, "examples_seen": 46540800.0, "progress": 0.4036304538955445, "epoch": 36.32688010228175, "img/sec/core": 704.3529393543124, "core_hours_NVIDIA A100-SXM4-40GB": 18.094088980426648, "core_hours": 18.094088980426648} {"step": 45500, "global_schedule": 0.7325977087020874, "l2_grads": 1.4225869178771973, "l2_params": 317.7234802246094, "l2_updates": 0.774847686290741, "train/loss": 2.447657346725464, "uptime": 8468.456692054, "examples_seen": 46592000.0, "progress": 0.40407449179861993, "epoch": 36.366843666750704, "img/sec/core": 741.1928107070534, "core_hours_NVIDIA A100-SXM4-40GB": 18.11327726991998, "core_hours": 18.11327726991998} {"step": 45550, "global_schedule": 0.7319198250770569, "l2_grads": 1.5556954145431519, "l2_params": 317.6747741699219, "l2_updates": 0.7802951335906982, "train/loss": 2.456566095352173, "uptime": 8477.411089127001, "examples_seen": 46643200.0, "progress": 0.40451852970169533, "epoch": 36.40680723121966, "img/sec/core": 714.7326556800853, "core_hours_NVIDIA A100-SXM4-40GB": 18.133175930082203, "core_hours": 18.133175930082203} {"step": 45600, "global_schedule": 0.7312414646148682, "l2_grads": 1.3607597351074219, "l2_params": 317.60870361328125, "l2_updates": 0.7537147998809814, "train/loss": 4.9004435539245605, "uptime": 8485.937635258999, "examples_seen": 46694400.0, "progress": 0.40496256760477073, "epoch": 36.44677079568862, "img/sec/core": 750.5970062112942, "core_hours_NVIDIA A100-SXM4-40GB": 18.15212381037553, "core_hours": 18.15212381037553} {"step": 45650, "global_schedule": 0.7305624485015869, "l2_grads": 1.4240477085113525, "l2_params": 317.5389709472656, "l2_updates": 0.7781374454498291, "train/loss": 2.3397586345672607, "uptime": 8494.990930427002, "examples_seen": 46745600.0, "progress": 0.40540660550784613, "epoch": 36.48673436015758, "img/sec/core": 706.9249241557044, "core_hours_NVIDIA A100-SXM4-40GB": 18.172242244082206, "core_hours": 18.172242244082206} {"step": 45700, "global_schedule": 0.7298829555511475, "l2_grads": 1.442875862121582, "l2_params": 317.4887390136719, "l2_updates": 0.7866184711456299, "train/loss": 2.5536351203918457, "uptime": 8504.267180161, "examples_seen": 46796800.0, "progress": 0.40585064341092153, "epoch": 36.52669792462653, "img/sec/core": 689.9339909472407, "core_hours_NVIDIA A100-SXM4-40GB": 18.192856132379976, "core_hours": 18.192856132379976} {"step": 45750, "global_schedule": 0.7292029857635498, "l2_grads": 1.5258979797363281, "l2_params": 317.4234619140625, "l2_updates": 0.7611374855041504, "train/loss": 2.488070249557495, "uptime": 8513.129026516, "examples_seen": 46848000.0, "progress": 0.406294681313997, "epoch": 36.56666148909549, "img/sec/core": 722.1971295392937, "core_hours_NVIDIA A100-SXM4-40GB": 18.21254912427998, "core_hours": 18.21254912427998} {"step": 45800, "global_schedule": 0.7285223603248596, "l2_grads": 1.6195597648620605, "l2_params": 317.36761474609375, "l2_updates": 0.7497546672821045, "train/loss": 2.4874136447906494, "uptime": 8521.758262608002, "examples_seen": 46899200.0, "progress": 0.4067387192170724, "epoch": 36.60662505356444, "img/sec/core": 741.6647234779207, "core_hours_NVIDIA A100-SXM4-40GB": 18.231725204484427, "core_hours": 18.231725204484427} {"step": 45850, "global_schedule": 0.7278412580490112, "l2_grads": 1.4035574197769165, "l2_params": 317.3020935058594, "l2_updates": 0.767545223236084, "train/loss": 2.469003438949585, "uptime": 8530.351778682, "examples_seen": 46950400.0, "progress": 0.4071827571201478, "epoch": 36.646588618033405, "img/sec/core": 744.7475451131629, "core_hours_NVIDIA A100-SXM4-40GB": 18.25082190687109, "core_hours": 18.25082190687109} {"step": 45900, "global_schedule": 0.7271596193313599, "l2_grads": 1.5011849403381348, "l2_params": 317.2292175292969, "l2_updates": 0.7579058408737183, "train/loss": 2.4481096267700195, "uptime": 8538.908750314002, "examples_seen": 47001600.0, "progress": 0.4076267950232232, "epoch": 36.68655218250236, "img/sec/core": 747.9281544027227, "core_hours_NVIDIA A100-SXM4-40GB": 18.26983739938665, "core_hours": 18.26983739938665} {"step": 45950, "global_schedule": 0.7264773845672607, "l2_grads": 1.2169675827026367, "l2_params": 317.1590576171875, "l2_updates": 0.7701479196548462, "train/loss": 4.885762691497803, "uptime": 8547.545243175, "examples_seen": 47052800.0, "progress": 0.4080708329262986, "epoch": 36.726515746971316, "img/sec/core": 741.0415434836876, "core_hours_NVIDIA A100-SXM4-40GB": 18.289029605744425, "core_hours": 18.289029605744425} {"step": 46000, "global_schedule": 0.7257947325706482, "l2_grads": 1.4875415563583374, "l2_params": 317.1064453125, "l2_updates": 0.7880820631980896, "train/loss": 2.5862510204315186, "uptime": 8556.055873760999, "examples_seen": 47104000.0, "progress": 0.408514870829374, "epoch": 36.76647931144027, "img/sec/core": 752.0006814217437, "core_hours_NVIDIA A100-SXM4-40GB": 18.307942118157754, "core_hours": 18.307942118157754} {"step": 46050, "global_schedule": 0.7251114845275879, "l2_grads": 1.366889238357544, "l2_params": 317.0382385253906, "l2_updates": 0.7520630359649658, "train/loss": 2.3714582920074463, "uptime": 8565.550311694, "examples_seen": 47155200.0, "progress": 0.4089589087324494, "epoch": 36.80644287590923, "img/sec/core": 724.5682631390106, "core_hours_NVIDIA A100-SXM4-40GB": 18.327570665177753, "core_hours": 18.327570665177753} {"step": 46100, "global_schedule": 0.7244277000427246, "l2_grads": 1.2615123987197876, "l2_params": 316.9578552246094, "l2_updates": 0.7561568021774292, "train/loss": 3.421243190765381, "uptime": 8575.005539242002, "examples_seen": 47206400.0, "progress": 0.4094029466355248, "epoch": 36.84640644037819, "img/sec/core": 676.8742441690355, "core_hours_NVIDIA A100-SXM4-40GB": 18.348582281951092, "core_hours": 18.348582281951092} {"step": 46150, "global_schedule": 0.7237434387207031, "l2_grads": 1.5184895992279053, "l2_params": 316.9070129394531, "l2_updates": 0.758543848991394, "train/loss": 2.6052870750427246, "uptime": 8583.780290175999, "examples_seen": 47257600.0, "progress": 0.4098469845386002, "epoch": 36.886370004847144, "img/sec/core": 729.3654313541567, "core_hours_NVIDIA A100-SXM4-40GB": 18.368081728471086, "core_hours": 18.368081728471086} {"step": 46200, "global_schedule": 0.7230585813522339, "l2_grads": 1.4000892639160156, "l2_params": 316.8272705078125, "l2_updates": 0.7706669569015503, "train/loss": 2.4031295776367188, "uptime": 8592.315138627999, "examples_seen": 47308800.0, "progress": 0.41029102244167565, "epoch": 36.9263335693161, "img/sec/core": 749.8668589130323, "core_hours_NVIDIA A100-SXM4-40GB": 18.387048058364417, "core_hours": 18.387048058364417} {"step": 46250, "global_schedule": 0.7223732471466064, "l2_grads": 1.432586669921875, "l2_params": 316.75946044921875, "l2_updates": 0.7748526334762573, "train/loss": 2.386833667755127, "uptime": 8600.932374577, "examples_seen": 47360000.0, "progress": 0.41073506034475105, "epoch": 36.966297133785055, "img/sec/core": 742.6975468557205, "core_hours_NVIDIA A100-SXM4-40GB": 18.406197471584417, "core_hours": 18.406197471584417} {"step": 46300, "global_schedule": 0.7216874361038208, "l2_grads": 1.327368140220642, "l2_params": 316.6861877441406, "l2_updates": 0.7468507885932922, "train/loss": 3.683115005493164, "uptime": 8610.136223342999, "examples_seen": 47411200.0, "progress": 0.41117909824782645, "epoch": 37.00626069825401, "img/sec/core": 695.3612736057531, "core_hours_NVIDIA A100-SXM4-40GB": 18.426650468842194, "core_hours": 18.426650468842194} {"step": 46350, "global_schedule": 0.7210010290145874, "l2_grads": 1.5264887809753418, "l2_params": 316.64422607421875, "l2_updates": 0.7534725666046143, "train/loss": 2.4405767917633057, "uptime": 8618.777108063, "examples_seen": 47462400.0, "progress": 0.41162313615090185, "epoch": 37.04622426272297, "img/sec/core": 740.6648980267818, "core_hours_NVIDIA A100-SXM4-40GB": 18.445852434886643, "core_hours": 18.445852434886643} {"step": 46400, "global_schedule": 0.7203141450881958, "l2_grads": 1.4216210842132568, "l2_params": 316.5983581542969, "l2_updates": 0.7655442357063293, "train/loss": 2.2540314197540283, "uptime": 8627.319427757999, "examples_seen": 47513600.0, "progress": 0.41206717405397725, "epoch": 37.08618782719193, "img/sec/core": 749.2110139294308, "core_hours_NVIDIA A100-SXM4-40GB": 18.464835367542197, "core_hours": 18.464835367542197} {"step": 46450, "global_schedule": 0.7196266651153564, "l2_grads": 1.5019346475601196, "l2_params": 316.5266418457031, "l2_updates": 0.7536706924438477, "train/loss": 2.3682219982147217, "uptime": 8635.724106134001, "examples_seen": 47564800.0, "progress": 0.41251121195705265, "epoch": 37.12615139166088, "img/sec/core": 761.480655616021, "core_hours_NVIDIA A100-SXM4-40GB": 18.48351243059998, "core_hours": 18.48351243059998} {"step": 46500, "global_schedule": 0.7189387679100037, "l2_grads": 1.3359971046447754, "l2_params": 316.4671630859375, "l2_updates": 0.7496968507766724, "train/loss": 2.726691484451294, "uptime": 8644.276729006002, "examples_seen": 47616000.0, "progress": 0.41295524986012805, "epoch": 37.16611495612984, "img/sec/core": 748.3084541178513, "core_hours_NVIDIA A100-SXM4-40GB": 18.50251825920442, "core_hours": 18.50251825920442} {"step": 46550, "global_schedule": 0.7182503342628479, "l2_grads": 1.500301480293274, "l2_params": 316.4069519042969, "l2_updates": 0.7502010464668274, "train/loss": 2.619168519973755, "uptime": 8652.940043244, "examples_seen": 47667200.0, "progress": 0.41339928776320345, "epoch": 37.2060785205988, "img/sec/core": 738.7472997261486, "core_hours_NVIDIA A100-SXM4-40GB": 18.521770068622196, "core_hours": 18.521770068622196} {"step": 46600, "global_schedule": 0.7175613641738892, "l2_grads": 1.4744226932525635, "l2_params": 316.34271240234375, "l2_updates": 0.7584487199783325, "train/loss": 2.4127893447875977, "uptime": 8662.349198828002, "examples_seen": 47718400.0, "progress": 0.41384332566627885, "epoch": 37.24604208506776, "img/sec/core": 680.188561328655, "core_hours_NVIDIA A100-SXM4-40GB": 18.542679303253312, "core_hours": 18.542679303253312} {"step": 46650, "global_schedule": 0.7168719172477722, "l2_grads": 1.4679478406906128, "l2_params": 316.2882995605469, "l2_updates": 0.7628756761550903, "train/loss": 2.460144519805908, "uptime": 8671.764804213, "examples_seen": 47769600.0, "progress": 0.4142873635693543, "epoch": 37.28600564953671, "img/sec/core": 679.7226241232418, "core_hours_NVIDIA A100-SXM4-40GB": 18.56360287077553, "core_hours": 18.56360287077553} {"step": 46700, "global_schedule": 0.7161818742752075, "l2_grads": 1.3782814741134644, "l2_params": 316.2218322753906, "l2_updates": 0.7630613446235657, "train/loss": 2.59442138671875, "uptime": 8681.289683011002, "examples_seen": 47820800.0, "progress": 0.4147314014724297, "epoch": 37.32596921400567, "img/sec/core": 671.924560482878, "core_hours_NVIDIA A100-SXM4-40GB": 18.584769268104424, "core_hours": 18.584769268104424} {"step": 46750, "global_schedule": 0.7154914140701294, "l2_grads": 1.4312893152236938, "l2_params": 316.1727600097656, "l2_updates": 0.7651574015617371, "train/loss": 2.430715560913086, "uptime": 8690.687723229, "examples_seen": 47872000.0, "progress": 0.4151754393755051, "epoch": 37.36593277847462, "img/sec/core": 680.9930423305756, "core_hours_NVIDIA A100-SXM4-40GB": 18.605653801922198, "core_hours": 18.605653801922198} {"step": 46800, "global_schedule": 0.7148004174232483, "l2_grads": 1.5164577960968018, "l2_params": 316.11138916015625, "l2_updates": 0.7577604055404663, "train/loss": 2.370338201522827, "uptime": 8699.170067139, "examples_seen": 47923200.0, "progress": 0.4156194772785805, "epoch": 37.405896342943585, "img/sec/core": 754.5084316205188, "core_hours_NVIDIA A100-SXM4-40GB": 18.624503455055535, "core_hours": 18.624503455055535} {"step": 46850, "global_schedule": 0.714108943939209, "l2_grads": 1.471186637878418, "l2_params": 316.0390930175781, "l2_updates": 0.7454805970191956, "train/loss": 2.3939874172210693, "uptime": 8707.783819388, "examples_seen": 47974400.0, "progress": 0.4160635151816559, "epoch": 37.44585990741254, "img/sec/core": 742.9979194890112, "core_hours_NVIDIA A100-SXM4-40GB": 18.643645126719978, "core_hours": 18.643645126719978} {"step": 46900, "global_schedule": 0.7134169936180115, "l2_grads": 1.4921863079071045, "l2_params": 315.96826171875, "l2_updates": 0.7506707906723022, "train/loss": 2.3586111068725586, "uptime": 8716.812534643, "examples_seen": 48025600.0, "progress": 0.4165075530847313, "epoch": 37.485823471881496, "img/sec/core": 708.8494674206435, "core_hours_NVIDIA A100-SXM4-40GB": 18.663708938397754, "core_hours": 18.663708938397754} {"step": 46950, "global_schedule": 0.7127245664596558, "l2_grads": 1.4071052074432373, "l2_params": 315.89154052734375, "l2_updates": 0.7544742226600647, "train/loss": 2.493917942047119, "uptime": 8725.464819398001, "examples_seen": 48076800.0, "progress": 0.4169515909878067, "epoch": 37.52578703635045, "img/sec/core": 739.6890163954939, "core_hours_NVIDIA A100-SXM4-40GB": 18.682936237853312, "core_hours": 18.682936237853312} {"step": 47000, "global_schedule": 0.7120315432548523, "l2_grads": 1.625128149986267, "l2_params": 315.8292541503906, "l2_updates": 0.7379684448242188, "train/loss": 2.3704564571380615, "uptime": 8734.049567852, "examples_seen": 48128000.0, "progress": 0.4173956288908821, "epoch": 37.565750600819406, "img/sec/core": 745.5081572039157, "core_hours_NVIDIA A100-SXM4-40GB": 18.702013456639975, "core_hours": 18.702013456639975} {"step": 47050, "global_schedule": 0.7113380432128906, "l2_grads": 1.4012572765350342, "l2_params": 315.7508239746094, "l2_updates": 0.7764368653297424, "train/loss": 2.3454298973083496, "uptime": 8743.094944737999, "examples_seen": 48179200.0, "progress": 0.4178396667939575, "epoch": 37.60571416528837, "img/sec/core": 763.6385673626173, "core_hours_NVIDIA A100-SXM4-40GB": 18.720637741517756, "core_hours": 18.720637741517756} {"step": 47100, "global_schedule": 0.7106440663337708, "l2_grads": 1.4784539937973022, "l2_params": 315.69189453125, "l2_updates": 0.7427448630332947, "train/loss": 2.5869081020355225, "uptime": 8751.580992158002, "examples_seen": 48230400.0, "progress": 0.41828370469703297, "epoch": 37.645677729757324, "img/sec/core": 754.1791464556318, "core_hours_NVIDIA A100-SXM4-40GB": 18.73949562467332, "core_hours": 18.73949562467332} {"step": 47150, "global_schedule": 0.7099495530128479, "l2_grads": 1.4099215269088745, "l2_params": 315.61370849609375, "l2_updates": 0.7439642548561096, "train/loss": 2.467136859893799, "uptime": 8760.244069425002, "examples_seen": 48281600.0, "progress": 0.41872774260010837, "epoch": 37.68564129422628, "img/sec/core": 738.7675075206379, "core_hours_NVIDIA A100-SXM4-40GB": 18.758746907488874, "core_hours": 18.758746907488874} {"step": 47200, "global_schedule": 0.7092546224594116, "l2_grads": 1.238781452178955, "l2_params": 315.5469055175781, "l2_updates": 0.7442711591720581, "train/loss": 4.906822681427002, "uptime": 8768.797391978, "examples_seen": 48332800.0, "progress": 0.41917178050318377, "epoch": 37.725604858695235, "img/sec/core": 748.2472408054758, "core_hours_NVIDIA A100-SXM4-40GB": 18.77775429093998, "core_hours": 18.77775429093998} {"step": 47250, "global_schedule": 0.7085591554641724, "l2_grads": 1.4256739616394043, "l2_params": 315.4818420410156, "l2_updates": 0.7366296052932739, "train/loss": 2.6881165504455566, "uptime": 8777.949527170002, "examples_seen": 48384000.0, "progress": 0.41961581840625917, "epoch": 37.76556842316419, "img/sec/core": 699.2903694859107, "core_hours_NVIDIA A100-SXM4-40GB": 18.79809236914443, "core_hours": 18.79809236914443} {"step": 47300, "global_schedule": 0.7078632116317749, "l2_grads": 1.4672642946243286, "l2_params": 315.4319152832031, "l2_updates": 0.7368244528770447, "train/loss": 2.5575785636901855, "uptime": 8787.033674733002, "examples_seen": 48435200.0, "progress": 0.42005985630933457, "epoch": 37.80553198763315, "img/sec/core": 704.5240024575422, "core_hours_NVIDIA A100-SXM4-40GB": 18.818279363728877, "core_hours": 18.818279363728877} {"step": 47350, "global_schedule": 0.7071667909622192, "l2_grads": 1.373699426651001, "l2_params": 315.33843994140625, "l2_updates": 0.7583777904510498, "train/loss": 2.4391956329345703, "uptime": 8795.560314818, "examples_seen": 48486400.0, "progress": 0.42050389421240997, "epoch": 37.84549555210211, "img/sec/core": 750.588735563085, "core_hours_NVIDIA A100-SXM4-40GB": 18.837227452806648, "core_hours": 18.837227452806648} {"step": 47400, "global_schedule": 0.7064698338508606, "l2_grads": 1.495491862297058, "l2_params": 315.2838439941406, "l2_updates": 0.741678774356842, "train/loss": 2.448216438293457, "uptime": 8804.099968732002, "examples_seen": 48537600.0, "progress": 0.42094793211548537, "epoch": 37.88545911657106, "img/sec/core": 749.4448913797656, "core_hours_NVIDIA A100-SXM4-40GB": 18.85620446150443, "core_hours": 18.85620446150443} {"step": 47450, "global_schedule": 0.7057724595069885, "l2_grads": 1.522195816040039, "l2_params": 315.2149658203125, "l2_updates": 0.7309238910675049, "train/loss": 2.5609824657440186, "uptime": 8813.151453157001, "examples_seen": 48588800.0, "progress": 0.42139197001856077, "epoch": 37.92542268104002, "img/sec/core": 707.0663439826395, "core_hours_NVIDIA A100-SXM4-40GB": 18.876318871337762, "core_hours": 18.876318871337762} {"step": 47500, "global_schedule": 0.7050746083259583, "l2_grads": 1.2646774053573608, "l2_params": 315.15228271484375, "l2_updates": 0.7277287244796753, "train/loss": 3.9575929641723633, "uptime": 8822.563661443002, "examples_seen": 48640000.0, "progress": 0.42183600792163617, "epoch": 37.96538624550898, "img/sec/core": 679.9679528468038, "core_hours_NVIDIA A100-SXM4-40GB": 18.897234889751097, "core_hours": 18.897234889751097, "val/acc@1": 0.6401, "val/loss": 1.5235394311523438, "z/secs/eval/val": 3.0343030320000253} {"step": 47550, "global_schedule": 0.704376220703125, "l2_grads": 1.4542285203933716, "l2_params": 315.06463623046875, "l2_updates": 0.7434810996055603, "train/loss": 2.365849256515503, "uptime": 8835.597519065, "examples_seen": 48691200.0, "progress": 0.4222800458247116, "epoch": 38.005349809977936, "img/sec/core": 640.0834967799639, "core_hours_NVIDIA A100-SXM4-40GB": 18.91945421315776, "core_hours": 18.91945421315776} {"step": 47600, "global_schedule": 0.7036774158477783, "l2_grads": 1.2576748132705688, "l2_params": 314.9932861328125, "l2_updates": 0.7362275719642639, "train/loss": 4.658529758453369, "uptime": 8845.141581865, "examples_seen": 48742400.0, "progress": 0.422724083727787, "epoch": 38.04531337444689, "img/sec/core": 670.5739614370752, "core_hours_NVIDIA A100-SXM4-40GB": 18.940663241602202, "core_hours": 18.940663241602202} {"step": 47650, "global_schedule": 0.7029780149459839, "l2_grads": 1.218811273574829, "l2_params": 314.93328857421875, "l2_updates": 0.732617199420929, "train/loss": 4.760665416717529, "uptime": 8854.614745755001, "examples_seen": 48793600.0, "progress": 0.4231681216308624, "epoch": 38.08527693891585, "img/sec/core": 675.5926609435252, "core_hours_NVIDIA A100-SXM4-40GB": 18.961714716913317, "core_hours": 18.961714716913317} {"step": 47700, "global_schedule": 0.7022782564163208, "l2_grads": 1.4209418296813965, "l2_params": 314.8504333496094, "l2_updates": 0.7454735040664673, "train/loss": 2.4449310302734375, "uptime": 8864.168361255002, "examples_seen": 48844800.0, "progress": 0.4236121595339378, "epoch": 38.1252405033848, "img/sec/core": 669.9034517350426, "core_hours_NVIDIA A100-SXM4-40GB": 18.98294497357999, "core_hours": 18.98294497357999} {"step": 47750, "global_schedule": 0.7015779614448547, "l2_grads": 1.2318631410598755, "l2_params": 314.7602844238281, "l2_updates": 0.731328547000885, "train/loss": 3.8183038234710693, "uptime": 8872.845887813999, "examples_seen": 48896000.0, "progress": 0.4240561974370132, "epoch": 38.165204067853765, "img/sec/core": 737.5373565828563, "core_hours_NVIDIA A100-SXM4-40GB": 19.002228365933313, "core_hours": 19.002228365933313} {"step": 47800, "global_schedule": 0.7008772492408752, "l2_grads": 1.6393119096755981, "l2_params": 314.6954345703125, "l2_updates": 0.7377458810806274, "train/loss": 2.3813083171844482, "uptime": 8881.316851886999, "examples_seen": 48947200.0, "progress": 0.4245002353400886, "epoch": 38.20516763232272, "img/sec/core": 755.5220332475808, "core_hours_NVIDIA A100-SXM4-40GB": 19.021052730539978, "core_hours": 19.021052730539978} {"step": 47850, "global_schedule": 0.7001760005950928, "l2_grads": 1.484222412109375, "l2_params": 314.6253662109375, "l2_updates": 0.7308290004730225, "train/loss": 2.5880534648895264, "uptime": 8889.809467981, "examples_seen": 48998400.0, "progress": 0.42494427324316403, "epoch": 38.245131196791675, "img/sec/core": 753.5958212594364, "core_hours_NVIDIA A100-SXM4-40GB": 19.039925210748873, "core_hours": 19.039925210748873} {"step": 47900, "global_schedule": 0.6994742751121521, "l2_grads": 1.4898823499679565, "l2_params": 314.5418395996094, "l2_updates": 0.7378878593444824, "train/loss": 2.577000379562378, "uptime": 8898.515163561, "examples_seen": 49049600.0, "progress": 0.42538831114623943, "epoch": 38.28509476126063, "img/sec/core": 735.1509068044033, "core_hours_NVIDIA A100-SXM4-40GB": 19.05927120092665, "core_hours": 19.05927120092665} {"step": 47950, "global_schedule": 0.6987721920013428, "l2_grads": 1.2824045419692993, "l2_params": 314.4718933105469, "l2_updates": 0.7237610220909119, "train/loss": 3.8462867736816406, "uptime": 8907.768050523, "examples_seen": 49100800.0, "progress": 0.42583234904931483, "epoch": 38.325058325729586, "img/sec/core": 691.676017040266, "core_hours_NVIDIA A100-SXM4-40GB": 19.079833171953318, "core_hours": 19.079833171953318} {"step": 48000, "global_schedule": 0.6980695128440857, "l2_grads": 1.37616765499115, "l2_params": 314.3901062011719, "l2_updates": 0.7206715941429138, "train/loss": 4.316784381866455, "uptime": 8916.624998271001, "examples_seen": 49152000.0, "progress": 0.42627638695239023, "epoch": 38.36502189019855, "img/sec/core": 722.5965628445962, "core_hours_NVIDIA A100-SXM4-40GB": 19.099515278059986, "core_hours": 19.099515278059986} {"step": 48050, "global_schedule": 0.69736647605896, "l2_grads": 1.29964280128479, "l2_params": 314.3315734863281, "l2_updates": 0.7487120628356934, "train/loss": 3.1656129360198975, "uptime": 8925.579604101002, "examples_seen": 49203200.0, "progress": 0.4267204248554657, "epoch": 38.404985454667504, "img/sec/core": 773.7277926154135, "core_hours_NVIDIA A100-SXM4-40GB": 19.11789670671999, "core_hours": 19.11789670671999} {"step": 48100, "global_schedule": 0.6966629028320312, "l2_grads": 1.4164142608642578, "l2_params": 314.25140380859375, "l2_updates": 0.7342819571495056, "train/loss": 2.4501867294311523, "uptime": 8934.702213040002, "examples_seen": 49254400.0, "progress": 0.4271644627585411, "epoch": 38.44494901913646, "img/sec/core": 701.5536939919966, "core_hours_NVIDIA A100-SXM4-40GB": 19.138169171028878, "core_hours": 19.138169171028878} {"step": 48150, "global_schedule": 0.6959589123725891, "l2_grads": 1.413401484489441, "l2_params": 314.1884460449219, "l2_updates": 0.7493487596511841, "train/loss": 2.4096839427948, "uptime": 8943.674327193, "examples_seen": 49305600.0, "progress": 0.4276085006616165, "epoch": 38.484912583605414, "img/sec/core": 713.3212853584527, "core_hours_NVIDIA A100-SXM4-40GB": 19.158107202479986, "core_hours": 19.158107202479986} {"step": 48200, "global_schedule": 0.6952545046806335, "l2_grads": 1.2813512086868286, "l2_params": 314.1323547363281, "l2_updates": 0.7437199354171753, "train/loss": 3.016023635864258, "uptime": 8952.713555782999, "examples_seen": 49356800.0, "progress": 0.4280525385646919, "epoch": 38.52487614807437, "img/sec/core": 708.0250196440107, "core_hours_NVIDIA A100-SXM4-40GB": 19.178194377124427, "core_hours": 19.178194377124427} {"step": 48250, "global_schedule": 0.694549560546875, "l2_grads": 1.3903864622116089, "l2_params": 314.0679626464844, "l2_updates": 0.7205503582954407, "train/loss": 4.916031837463379, "uptime": 8962.181243134999, "examples_seen": 49408000.0, "progress": 0.4284965764677673, "epoch": 38.56483971254333, "img/sec/core": 675.9834542537877, "core_hours_NVIDIA A100-SXM4-40GB": 19.199233682351096, "core_hours": 19.199233682351096} {"step": 48300, "global_schedule": 0.693844199180603, "l2_grads": 1.4241691827774048, "l2_params": 313.975341796875, "l2_updates": 0.7389296889305115, "train/loss": 2.624884605407715, "uptime": 8971.300445318999, "examples_seen": 49459200.0, "progress": 0.4289406143708427, "epoch": 38.60480327701229, "img/sec/core": 701.8157806863018, "core_hours_NVIDIA A100-SXM4-40GB": 19.219498576093315, "core_hours": 19.219498576093315} {"step": 48350, "global_schedule": 0.6931383609771729, "l2_grads": 1.4455047845840454, "l2_params": 313.90185546875, "l2_updates": 0.7382633090019226, "train/loss": 2.3669161796569824, "uptime": 8980.800692304, "examples_seen": 49510400.0, "progress": 0.4293846522739181, "epoch": 38.64476684148124, "img/sec/core": 673.6666962558578, "core_hours_NVIDIA A100-SXM4-40GB": 19.240610236059982, "core_hours": 19.240610236059982} {"step": 48400, "global_schedule": 0.6924320459365845, "l2_grads": 1.5076243877410889, "l2_params": 313.8444519042969, "l2_updates": 0.728541910648346, "train/loss": 2.447925567626953, "uptime": 8989.339326279, "examples_seen": 49561600.0, "progress": 0.4298286901769935, "epoch": 38.6847304059502, "img/sec/core": 749.5344124994889, "core_hours_NVIDIA A100-SXM4-40GB": 19.259584978226652, "core_hours": 19.259584978226652} {"step": 48450, "global_schedule": 0.6917253136634827, "l2_grads": 1.6300674676895142, "l2_params": 313.7762145996094, "l2_updates": 0.7054114937782288, "train/loss": 2.4810264110565186, "uptime": 8998.057334815001, "examples_seen": 49612800.0, "progress": 0.4302727280800689, "epoch": 38.72469397041916, "img/sec/core": 734.1126099579844, "core_hours_NVIDIA A100-SXM4-40GB": 19.278958330528877, "core_hours": 19.278958330528877} {"step": 48500, "global_schedule": 0.6910181045532227, "l2_grads": 1.4738223552703857, "l2_params": 313.6833801269531, "l2_updates": 0.7430166602134705, "train/loss": 2.3327431678771973, "uptime": 9006.591055261002, "examples_seen": 49664000.0, "progress": 0.43071676598314435, "epoch": 38.764657534888116, "img/sec/core": 749.9659779690862, "core_hours_NVIDIA A100-SXM4-40GB": 19.29792215374221, "core_hours": 19.29792215374221} {"step": 48550, "global_schedule": 0.6903104782104492, "l2_grads": 1.491071105003357, "l2_params": 313.6219787597656, "l2_updates": 0.7256323099136353, "train/loss": 2.357130527496338, "uptime": 9015.496776544, "examples_seen": 49715200.0, "progress": 0.43116080388621975, "epoch": 38.80462109935707, "img/sec/core": 718.6391530373434, "core_hours_NVIDIA A100-SXM4-40GB": 19.317712645482207, "core_hours": 19.317712645482207} {"step": 48600, "global_schedule": 0.6896023750305176, "l2_grads": 1.353054404258728, "l2_params": 313.5656433105469, "l2_updates": 0.7077382802963257, "train/loss": 4.360354423522949, "uptime": 9024.100670755002, "examples_seen": 49766400.0, "progress": 0.43160484178929515, "epoch": 38.844584663826026, "img/sec/core": 743.8492202537434, "core_hours_NVIDIA A100-SXM4-40GB": 19.336832410395548, "core_hours": 19.336832410395548} {"step": 48650, "global_schedule": 0.6888939142227173, "l2_grads": 1.5278748273849487, "l2_params": 313.4833984375, "l2_updates": 0.724799633026123, "train/loss": 2.5569052696228027, "uptime": 9032.661104323002, "examples_seen": 49817600.0, "progress": 0.43204887969237055, "epoch": 38.88454822829498, "img/sec/core": 747.6256838116257, "core_hours_NVIDIA A100-SXM4-40GB": 19.355855596102213, "core_hours": 19.355855596102213} {"step": 48700, "global_schedule": 0.6881848573684692, "l2_grads": 1.4901145696640015, "l2_params": 313.40472412109375, "l2_updates": 0.7195476293563843, "train/loss": 2.3037612438201904, "uptime": 9041.677764058002, "examples_seen": 49868800.0, "progress": 0.43249291759544595, "epoch": 38.924511792763944, "img/sec/core": 709.7972184929198, "core_hours_NVIDIA A100-SXM4-40GB": 19.375892617735545, "core_hours": 19.375892617735545} {"step": 48750, "global_schedule": 0.6874755024909973, "l2_grads": 1.4342752695083618, "l2_params": 313.3401184082031, "l2_updates": 0.7319406867027283, "train/loss": 2.40989089012146, "uptime": 9050.274822089, "examples_seen": 49920000.0, "progress": 0.43293695549852135, "epoch": 38.9644753572329, "img/sec/core": 744.4407118020354, "core_hours_NVIDIA A100-SXM4-40GB": 19.39499719113776, "core_hours": 19.39499719113776} {"step": 48800, "global_schedule": 0.6867656707763672, "l2_grads": 1.407716155052185, "l2_params": 313.27545166015625, "l2_updates": 0.7269788980484009, "train/loss": 2.7704129219055176, "uptime": 9059.762125099, "examples_seen": 49971200.0, "progress": 0.43338099340159675, "epoch": 39.004438921701855, "img/sec/core": 674.5858115056413, "core_hours_NVIDIA A100-SXM4-40GB": 19.416080086715542, "core_hours": 19.416080086715542} {"step": 48850, "global_schedule": 0.6860553622245789, "l2_grads": 1.5006940364837646, "l2_params": 313.1826477050781, "l2_updates": 0.72194904088974, "train/loss": 2.3585410118103027, "uptime": 9068.332333844, "examples_seen": 50022400.0, "progress": 0.43382503130467215, "epoch": 39.04440248617081, "img/sec/core": 746.7729422265504, "core_hours_NVIDIA A100-SXM4-40GB": 19.435124995037764, "core_hours": 19.435124995037764} {"step": 48900, "global_schedule": 0.6853446960449219, "l2_grads": 1.237464189529419, "l2_params": 313.0931701660156, "l2_updates": 0.7282782196998596, "train/loss": 3.4826226234436035, "uptime": 9076.749749959, "examples_seen": 50073600.0, "progress": 0.43426906920774755, "epoch": 39.084366050639765, "img/sec/core": 760.3283374092422, "core_hours_NVIDIA A100-SXM4-40GB": 19.453830364182206, "core_hours": 19.453830364182206} {"step": 48950, "global_schedule": 0.6846334934234619, "l2_grads": 1.4809879064559937, "l2_params": 313.0121154785156, "l2_updates": 0.7261528372764587, "train/loss": 2.4390838146209717, "uptime": 9085.260974505001, "examples_seen": 50124800.0, "progress": 0.434713107110823, "epoch": 39.12432961510873, "img/sec/core": 751.9482026834147, "core_hours_NVIDIA A100-SXM4-40GB": 19.472744196506653, "core_hours": 19.472744196506653} {"step": 49000, "global_schedule": 0.6839219331741333, "l2_grads": 1.2816778421401978, "l2_params": 312.9706115722656, "l2_updates": 0.7153688669204712, "train/loss": 4.723204135894775, "uptime": 9094.732437498, "examples_seen": 50176000.0, "progress": 0.4351571450138984, "epoch": 39.16429317957768, "img/sec/core": 675.7139847065829, "core_hours_NVIDIA A100-SXM4-40GB": 19.49379189204665, "core_hours": 19.49379189204665} {"step": 49050, "global_schedule": 0.6832098960876465, "l2_grads": 1.2740553617477417, "l2_params": 312.8968200683594, "l2_updates": 0.7107272744178772, "train/loss": 4.418487071990967, "uptime": 9104.800715592, "examples_seen": 50227200.0, "progress": 0.4356011829169738, "epoch": 39.20425674404664, "img/sec/core": 700.14190664337, "core_hours_NVIDIA A100-SXM4-40GB": 19.51410523436665, "core_hours": 19.51410523436665} {"step": 49100, "global_schedule": 0.6824974417686462, "l2_grads": 1.484922170639038, "l2_params": 312.8253479003906, "l2_updates": 0.7188537120819092, "train/loss": 2.3786168098449707, "uptime": 9113.438604265002, "examples_seen": 50278400.0, "progress": 0.4360452208200492, "epoch": 39.244220308515594, "img/sec/core": 740.9217972446913, "core_hours_NVIDIA A100-SXM4-40GB": 19.533300542528874, "core_hours": 19.533300542528874} {"step": 49150, "global_schedule": 0.6817845702171326, "l2_grads": 1.254643201828003, "l2_params": 312.7560119628906, "l2_updates": 0.7223966121673584, "train/loss": 4.175282955169678, "uptime": 9122.516855478001, "examples_seen": 50329600.0, "progress": 0.4364892587231246, "epoch": 39.28418387298455, "img/sec/core": 704.9815928023593, "core_hours_NVIDIA A100-SXM4-40GB": 19.553474434113316, "core_hours": 19.553474434113316} {"step": 49200, "global_schedule": 0.6810712218284607, "l2_grads": 1.3758045434951782, "l2_params": 312.6809997558594, "l2_updates": 0.7168247699737549, "train/loss": 2.714931011199951, "uptime": 9131.982607332002, "examples_seen": 50380800.0, "progress": 0.4369332966262, "epoch": 39.32414743745351, "img/sec/core": 676.1216751414247, "core_hours_NVIDIA A100-SXM4-40GB": 19.574509438233317, "core_hours": 19.574509438233317} {"step": 49250, "global_schedule": 0.6803575754165649, "l2_grads": 1.4474174976348877, "l2_params": 312.5964660644531, "l2_updates": 0.7229138612747192, "train/loss": 2.3377413749694824, "uptime": 9141.49439243, "examples_seen": 50432000.0, "progress": 0.4373773345292754, "epoch": 39.36411100192247, "img/sec/core": 672.8495160542057, "core_hours_NVIDIA A100-SXM4-40GB": 19.59564673845109, "core_hours": 19.59564673845109} {"step": 49300, "global_schedule": 0.6796433925628662, "l2_grads": 1.4220993518829346, "l2_params": 312.5002746582031, "l2_updates": 0.7287890315055847, "train/loss": 2.668111801147461, "uptime": 9150.753493055001, "examples_seen": 50483200.0, "progress": 0.4378213724323508, "epoch": 39.40407456639142, "img/sec/core": 691.2118421868543, "core_hours_NVIDIA A100-SXM4-40GB": 19.61622251761776, "core_hours": 19.61622251761776} {"step": 49350, "global_schedule": 0.6789288520812988, "l2_grads": 1.5691661834716797, "l2_params": 312.4329833984375, "l2_updates": 0.7203434109687805, "train/loss": 2.2433061599731445, "uptime": 9160.415309940001, "examples_seen": 50534400.0, "progress": 0.4382654103354262, "epoch": 39.44403813086038, "img/sec/core": 662.4012932739405, "core_hours_NVIDIA A100-SXM4-40GB": 19.63769322180665, "core_hours": 19.63769322180665} {"step": 49400, "global_schedule": 0.6782138347625732, "l2_grads": 1.4744974374771118, "l2_params": 312.35675048828125, "l2_updates": 0.7231329679489136, "train/loss": 2.353437662124634, "uptime": 9169.825621312999, "examples_seen": 50585600.0, "progress": 0.43870944823850166, "epoch": 39.48400169532933, "img/sec/core": 680.1050195176557, "core_hours_NVIDIA A100-SXM4-40GB": 19.658605024857756, "core_hours": 19.658605024857756} {"step": 49450, "global_schedule": 0.677498459815979, "l2_grads": 1.4587666988372803, "l2_params": 312.2714538574219, "l2_updates": 0.6994084715843201, "train/loss": 2.588195562362671, "uptime": 9179.295164417, "examples_seen": 50636800.0, "progress": 0.43915348614157707, "epoch": 39.523965259798295, "img/sec/core": 675.850981373683, "core_hours_NVIDIA A100-SXM4-40GB": 19.67964845397776, "core_hours": 19.67964845397776} {"step": 49500, "global_schedule": 0.6767826080322266, "l2_grads": 1.5428383350372314, "l2_params": 312.1896667480469, "l2_updates": 0.7365725636482239, "train/loss": 2.487206220626831, "uptime": 9188.181685713002, "examples_seen": 50688000.0, "progress": 0.43959752404465247, "epoch": 39.56392882426725, "img/sec/core": 720.191826117622, "core_hours_NVIDIA A100-SXM4-40GB": 19.699396279079984, "core_hours": 19.699396279079984} {"step": 49550, "global_schedule": 0.6760663986206055, "l2_grads": 1.5346099138259888, "l2_params": 312.1398010253906, "l2_updates": 0.7116280198097229, "train/loss": 2.3334178924560547, "uptime": 9197.628692115, "examples_seen": 50739200.0, "progress": 0.44004156194772787, "epoch": 39.603892388736206, "img/sec/core": 677.4632860041127, "core_hours_NVIDIA A100-SXM4-40GB": 19.72038962663998, "core_hours": 19.72038962663998} {"step": 49600, "global_schedule": 0.6753497123718262, "l2_grads": 1.645927906036377, "l2_params": 312.0738525390625, "l2_updates": 0.7153205275535583, "train/loss": 2.274017333984375, "uptime": 9206.669906647001, "examples_seen": 50790400.0, "progress": 0.44048559985080327, "epoch": 39.64385595320516, "img/sec/core": 707.8694988762577, "core_hours_NVIDIA A100-SXM4-40GB": 19.74048121448887, "core_hours": 19.74048121448887} {"step": 49650, "global_schedule": 0.6746326684951782, "l2_grads": 1.6804542541503906, "l2_params": 311.9885559082031, "l2_updates": 0.7052160501480103, "train/loss": 2.3757989406585693, "uptime": 9215.260903626002, "examples_seen": 50841600.0, "progress": 0.44092963775387867, "epoch": 39.683819517674124, "img/sec/core": 744.9659237040356, "core_hours_NVIDIA A100-SXM4-40GB": 19.75957231888665, "core_hours": 19.75957231888665} {"step": 49700, "global_schedule": 0.6739151477813721, "l2_grads": 1.450444221496582, "l2_params": 311.9180908203125, "l2_updates": 0.7026258707046509, "train/loss": 4.365716934204102, "uptime": 9223.945935421, "examples_seen": 50892800.0, "progress": 0.44137367565695407, "epoch": 39.72378308214308, "img/sec/core": 736.900008090512, "core_hours_NVIDIA A100-SXM4-40GB": 19.7788723895422, "core_hours": 19.7788723895422} {"step": 49750, "global_schedule": 0.673197329044342, "l2_grads": 1.5616487264633179, "l2_params": 311.85601806640625, "l2_updates": 0.6994342803955078, "train/loss": 2.376511812210083, "uptime": 9232.91029102, "examples_seen": 50944000.0, "progress": 0.44181771356002947, "epoch": 39.763746646612034, "img/sec/core": 713.9386573100181, "core_hours_NVIDIA A100-SXM4-40GB": 19.798793179762203, "core_hours": 19.798793179762203} {"step": 49800, "global_schedule": 0.672478973865509, "l2_grads": 1.4065301418304443, "l2_params": 311.806396484375, "l2_updates": 0.7078844308853149, "train/loss": 3.084308624267578, "uptime": 9242.387561161, "examples_seen": 50995200.0, "progress": 0.44226175146310487, "epoch": 39.80371021108099, "img/sec/core": 675.2999444758437, "core_hours_NVIDIA A100-SXM4-40GB": 19.819853780075537, "core_hours": 19.819853780075537} {"step": 49850, "global_schedule": 0.6717603206634521, "l2_grads": 1.2852511405944824, "l2_params": 311.7103271484375, "l2_updates": 0.708105206489563, "train/loss": 3.170785427093506, "uptime": 9251.436299881001, "examples_seen": 51046400.0, "progress": 0.4427057893661803, "epoch": 39.843673775549945, "img/sec/core": 707.2808927341097, "core_hours_NVIDIA A100-SXM4-40GB": 19.839962088342205, "core_hours": 19.839962088342205} {"step": 49900, "global_schedule": 0.6710412502288818, "l2_grads": 1.4563747644424438, "l2_params": 311.6585998535156, "l2_updates": 0.7147619128227234, "train/loss": 2.6815428733825684, "uptime": 9260.656511563999, "examples_seen": 51097600.0, "progress": 0.4431498272692557, "epoch": 39.88363734001891, "img/sec/core": 694.1272304845038, "core_hours_NVIDIA A100-SXM4-40GB": 19.860451447637754, "core_hours": 19.860451447637754} {"step": 49950, "global_schedule": 0.6703217625617981, "l2_grads": 1.4227957725524902, "l2_params": 311.5770568847656, "l2_updates": 0.7122108936309814, "train/loss": 2.4499258995056152, "uptime": 9269.246222071002, "examples_seen": 51148800.0, "progress": 0.4435938651723311, "epoch": 39.92360090448786, "img/sec/core": 745.0774964746331, "core_hours_NVIDIA A100-SXM4-40GB": 19.879539693208873, "core_hours": 19.879539693208873} {"step": 50000, "global_schedule": 0.6696017980575562, "l2_grads": 1.2794365882873535, "l2_params": 311.51690673828125, "l2_updates": 0.7172866463661194, "train/loss": 2.956483840942383, "uptime": 9278.807698347, "examples_seen": 51200000.0, "progress": 0.4440379030754065, "epoch": 39.96356446895682, "img/sec/core": 669.3527040448665, "core_hours_NVIDIA A100-SXM4-40GB": 19.90078741826665, "core_hours": 19.90078741826665, "val/acc@1": 0.64688, "val/loss": 1.4731106518554689, "z/secs/eval/val": 4.518826633000572} {"step": 50050, "global_schedule": 0.6688815355300903, "l2_grads": 1.3743776082992554, "l2_params": 311.451904296875, "l2_updates": 0.702544093132019, "train/loss": 2.672353744506836, "uptime": 9293.556167183999, "examples_seen": 51251200.0, "progress": 0.4444819409784819, "epoch": 40.00352803342577, "img/sec/core": 693.3011995681829, "core_hours_NVIDIA A100-SXM4-40GB": 19.92130118952664, "core_hours": 19.92130118952664} {"step": 50100, "global_schedule": 0.6681609153747559, "l2_grads": 1.5145381689071655, "l2_params": 311.36578369140625, "l2_updates": 0.7136157155036926, "train/loss": 2.3577685356140137, "uptime": 9302.182354992, "examples_seen": 51302400.0, "progress": 0.4449259788815573, "epoch": 40.04349159789473, "img/sec/core": 741.9268096695382, "core_hours_NVIDIA A100-SXM4-40GB": 19.940470495766643, "core_hours": 19.940470495766643} {"step": 50150, "global_schedule": 0.6674398183822632, "l2_grads": 1.4789433479309082, "l2_params": 311.2806701660156, "l2_updates": 0.715661883354187, "train/loss": 2.3635401725769043, "uptime": 9311.413191686, "examples_seen": 51353600.0, "progress": 0.4453700167846327, "epoch": 40.08345516236369, "img/sec/core": 693.3282661320335, "core_hours_NVIDIA A100-SXM4-40GB": 19.96098346619776, "core_hours": 19.96098346619776} {"step": 50200, "global_schedule": 0.6667183637619019, "l2_grads": 1.4294875860214233, "l2_params": 311.2147521972656, "l2_updates": 0.6822181940078735, "train/loss": 4.733086585998535, "uptime": 9320.181545703, "examples_seen": 51404800.0, "progress": 0.44581405468770813, "epoch": 40.12341872683265, "img/sec/core": 729.897536936998, "core_hours_NVIDIA A100-SXM4-40GB": 19.980468697346645, "core_hours": 19.980468697346645} {"step": 50250, "global_schedule": 0.6659964919090271, "l2_grads": 1.4790129661560059, "l2_params": 311.1252136230469, "l2_updates": 0.7070373892784119, "train/loss": 2.334184408187866, "uptime": 9328.91317976, "examples_seen": 51456000.0, "progress": 0.44625809259078353, "epoch": 40.1633822913016, "img/sec/core": 732.9670435363146, "core_hours_NVIDIA A100-SXM4-40GB": 19.999872328584427, "core_hours": 19.999872328584427} {"step": 50300, "global_schedule": 0.6652742028236389, "l2_grads": 1.4926388263702393, "l2_params": 311.083251953125, "l2_updates": 0.7074370980262756, "train/loss": 2.2107536792755127, "uptime": 9338.687858445, "examples_seen": 51507200.0, "progress": 0.44670213049385893, "epoch": 40.20334585577056, "img/sec/core": 654.7529802510162, "core_hours_NVIDIA A100-SXM4-40GB": 20.021593836773313, "core_hours": 20.021593836773313} {"step": 50350, "global_schedule": 0.6645516157150269, "l2_grads": 1.2771673202514648, "l2_params": 311.01409912109375, "l2_updates": 0.6870745420455933, "train/loss": 3.844709634780884, "uptime": 9348.53685947, "examples_seen": 51558400.0, "progress": 0.4471461683969344, "epoch": 40.24330942023951, "img/sec/core": 649.8120960446072, "core_hours_NVIDIA A100-SXM4-40GB": 20.043480505717756, "core_hours": 20.043480505717756} {"step": 50400, "global_schedule": 0.6638285517692566, "l2_grads": 1.647254467010498, "l2_params": 310.9320068359375, "l2_updates": 0.7052188515663147, "train/loss": 2.3663718700408936, "uptime": 9357.709912582, "examples_seen": 51609600.0, "progress": 0.4475902063000098, "epoch": 40.283272984708475, "img/sec/core": 697.6957313837968, "core_hours_NVIDIA A100-SXM4-40GB": 20.06386506818887, "core_hours": 20.06386506818887} {"step": 50450, "global_schedule": 0.6631051301956177, "l2_grads": 1.3436228036880493, "l2_params": 310.8522033691406, "l2_updates": 0.7017800807952881, "train/loss": 3.746232032775879, "uptime": 9366.361780867, "examples_seen": 51660800.0, "progress": 0.4480342442030852, "epoch": 40.32323654917743, "img/sec/core": 739.7246223796312, "core_hours_NVIDIA A100-SXM4-40GB": 20.083091442155535, "core_hours": 20.083091442155535} {"step": 50500, "global_schedule": 0.6623813509941101, "l2_grads": 1.565311074256897, "l2_params": 310.7795104980469, "l2_updates": 0.6957878470420837, "train/loss": 2.3335511684417725, "uptime": 9375.745230339, "examples_seen": 51712000.0, "progress": 0.4484782821061606, "epoch": 40.363200113646386, "img/sec/core": 682.0519489232405, "core_hours_NVIDIA A100-SXM4-40GB": 20.103943552093313, "core_hours": 20.103943552093313} {"step": 50550, "global_schedule": 0.6616572141647339, "l2_grads": 1.4070998430252075, "l2_params": 310.7049255371094, "l2_updates": 0.6802411675453186, "train/loss": 3.7151942253112793, "uptime": 9385.330883376, "examples_seen": 51763200.0, "progress": 0.448922320009236, "epoch": 40.40316367811534, "img/sec/core": 667.6644747411898, "core_hours_NVIDIA A100-SXM4-40GB": 20.125245003286647, "core_hours": 20.125245003286647} {"step": 50600, "global_schedule": 0.6609326004981995, "l2_grads": 1.5273514986038208, "l2_params": 310.61322021484375, "l2_updates": 0.6966013312339783, "train/loss": 2.5309391021728516, "uptime": 9394.700478232002, "examples_seen": 51814400.0, "progress": 0.4493663579123114, "epoch": 40.4431272425843, "img/sec/core": 683.0604842962358, "core_hours_NVIDIA A100-SXM4-40GB": 20.146066325188873, "core_hours": 20.146066325188873} {"step": 50650, "global_schedule": 0.6602077484130859, "l2_grads": 1.309847116470337, "l2_params": 310.54681396484375, "l2_updates": 0.7014920115470886, "train/loss": 4.173873424530029, "uptime": 9403.547288329, "examples_seen": 51865600.0, "progress": 0.4498103958153868, "epoch": 40.48309080705326, "img/sec/core": 723.424593704271, "core_hours_NVIDIA A100-SXM4-40GB": 20.165725903182203, "core_hours": 20.165725903182203} {"step": 50700, "global_schedule": 0.659482479095459, "l2_grads": 1.2726013660430908, "l2_params": 310.464111328125, "l2_updates": 0.6876250505447388, "train/loss": 4.0940117835998535, "uptime": 9412.755762597002, "examples_seen": 51916800.0, "progress": 0.4502544337184622, "epoch": 40.523054371522214, "img/sec/core": 695.0119871908831, "core_hours_NVIDIA A100-SXM4-40GB": 20.18618917933332, "core_hours": 20.18618917933332} {"step": 50750, "global_schedule": 0.6587567329406738, "l2_grads": 1.448661208152771, "l2_params": 310.3868408203125, "l2_updates": 0.7054049968719482, "train/loss": 2.8074817657470703, "uptime": 9422.527589095002, "examples_seen": 51968000.0, "progress": 0.4506984716215376, "epoch": 40.56301793599117, "img/sec/core": 654.9440886317684, "core_hours_NVIDIA A100-SXM4-40GB": 20.20790434932887, "core_hours": 20.20790434932887} {"step": 50800, "global_schedule": 0.6580307483673096, "l2_grads": 1.4590696096420288, "l2_params": 310.31768798828125, "l2_updates": 0.6908320188522339, "train/loss": 4.4490461349487305, "uptime": 9431.147595676002, "examples_seen": 52019200.0, "progress": 0.45114250952461304, "epoch": 40.602981500460125, "img/sec/core": 742.4588299162252, "core_hours_NVIDIA A100-SXM4-40GB": 20.22705991950887, "core_hours": 20.22705991950887} {"step": 50850, "global_schedule": 0.6573042869567871, "l2_grads": 1.4140784740447998, "l2_params": 310.2294921875, "l2_updates": 0.6932961940765381, "train/loss": 4.836941719055176, "uptime": 9440.411080919, "examples_seen": 52070400.0, "progress": 0.45158654742768845, "epoch": 40.64294506492909, "img/sec/core": 690.884675920154, "core_hours_NVIDIA A100-SXM4-40GB": 20.247645442271093, "core_hours": 20.247645442271093} {"step": 50900, "global_schedule": 0.656577467918396, "l2_grads": 1.4169089794158936, "l2_params": 310.1591491699219, "l2_updates": 0.6922234296798706, "train/loss": 3.4993655681610107, "uptime": 9449.190840104, "examples_seen": 52121600.0, "progress": 0.45203058533076385, "epoch": 40.68290862939804, "img/sec/core": 728.9493783536414, "core_hours_NVIDIA A100-SXM4-40GB": 20.267156018237756, "core_hours": 20.267156018237756} {"step": 50950, "global_schedule": 0.655850350856781, "l2_grads": 1.4951591491699219, "l2_params": 310.09002685546875, "l2_updates": 0.6885425448417664, "train/loss": 4.964856147766113, "uptime": 9458.289229313, "examples_seen": 52172800.0, "progress": 0.45247462323383925, "epoch": 40.722872193867, "img/sec/core": 703.4212158860698, "core_hours_NVIDIA A100-SXM4-40GB": 20.287374660924424, "core_hours": 20.287374660924424} {"step": 51000, "global_schedule": 0.6551227569580078, "l2_grads": 1.3604679107666016, "l2_params": 310.0234069824219, "l2_updates": 0.680009126663208, "train/loss": 4.617013454437256, "uptime": 9467.430152857001, "examples_seen": 52224000.0, "progress": 0.45291866113691465, "epoch": 40.76283575833595, "img/sec/core": 700.148072477918, "core_hours_NVIDIA A100-SXM4-40GB": 20.307687824355536, "core_hours": 20.307687824355536} {"step": 51050, "global_schedule": 0.6543949246406555, "l2_grads": 1.2687875032424927, "l2_params": 309.9460144042969, "l2_updates": 0.6943193674087524, "train/loss": 4.679922580718994, "uptime": 9476.534281306, "examples_seen": 52275200.0, "progress": 0.45336269903999005, "epoch": 40.80279932280491, "img/sec/core": 763.3133569291846, "core_hours_NVIDIA A100-SXM4-40GB": 20.326320044128867, "core_hours": 20.326320044128867} {"step": 51100, "global_schedule": 0.6536666750907898, "l2_grads": 1.5247126817703247, "l2_params": 309.85992431640625, "l2_updates": 0.6927635669708252, "train/loss": 2.28033185005188, "uptime": 9485.866054332002, "examples_seen": 52326400.0, "progress": 0.45380673694306545, "epoch": 40.84276288727387, "img/sec/core": 685.8289397059748, "core_hours_NVIDIA A100-SXM4-40GB": 20.347057317519987, "core_hours": 20.347057317519987} {"step": 51150, "global_schedule": 0.6529380679130554, "l2_grads": 1.3815619945526123, "l2_params": 309.7787170410156, "l2_updates": 0.6907303929328918, "train/loss": 4.648556232452393, "uptime": 9495.273296021, "examples_seen": 52377600.0, "progress": 0.45425077484614085, "epoch": 40.882726451742826, "img/sec/core": 680.3269450901031, "core_hours_NVIDIA A100-SXM4-40GB": 20.36796229905109, "core_hours": 20.36796229905109} {"step": 51200, "global_schedule": 0.6522091031074524, "l2_grads": 1.4652879238128662, "l2_params": 309.7068786621094, "l2_updates": 0.6987223625183105, "train/loss": 2.336747169494629, "uptime": 9503.9706445, "examples_seen": 52428800.0, "progress": 0.45469481274921625, "epoch": 40.92269001621178, "img/sec/core": 735.8564527399653, "core_hours_NVIDIA A100-SXM4-40GB": 20.387289740115534, "core_hours": 20.387289740115534} {"step": 51250, "global_schedule": 0.6514797806739807, "l2_grads": 1.693884015083313, "l2_params": 309.6208801269531, "l2_updates": 0.6638837456703186, "train/loss": 2.371304988861084, "uptime": 9513.340886157, "examples_seen": 52480000.0, "progress": 0.4551388506522917, "epoch": 40.96265358068074, "img/sec/core": 683.0133345833198, "core_hours_NVIDIA A100-SXM4-40GB": 20.40811249935331, "core_hours": 20.40811249935331} {"step": 51300, "global_schedule": 0.6507501006126404, "l2_grads": 1.5178054571151733, "l2_params": 309.5271911621094, "l2_updates": 0.6922597885131836, "train/loss": 2.4181087017059326, "uptime": 9523.778640237999, "examples_seen": 52531200.0, "progress": 0.4555828885553671, "epoch": 41.00261714514969, "img/sec/core": 613.1587265167584, "core_hours_NVIDIA A100-SXM4-40GB": 20.4313075084222, "core_hours": 20.4313075084222} {"step": 51350, "global_schedule": 0.6500201225280762, "l2_grads": 1.6130424737930298, "l2_params": 309.4588623046875, "l2_updates": 0.6963689923286438, "train/loss": 2.355130672454834, "uptime": 9532.384861861, "examples_seen": 52582400.0, "progress": 0.4560269264584425, "epoch": 41.042580709618655, "img/sec/core": 743.6480583877326, "core_hours_NVIDIA A100-SXM4-40GB": 20.450432445362203, "core_hours": 20.450432445362203} {"step": 51400, "global_schedule": 0.6492897272109985, "l2_grads": 1.4666346311569214, "l2_params": 309.37420654296875, "l2_updates": 0.6856540441513062, "train/loss": 2.685155153274536, "uptime": 9540.85176295, "examples_seen": 52633600.0, "progress": 0.4564709643615179, "epoch": 41.08254427408761, "img/sec/core": 755.884583122775, "core_hours_NVIDIA A100-SXM4-40GB": 20.469247781115534, "core_hours": 20.469247781115534} {"step": 51450, "global_schedule": 0.6485589742660522, "l2_grads": 1.5370895862579346, "l2_params": 309.2958679199219, "l2_updates": 0.6808220744132996, "train/loss": 2.364229440689087, "uptime": 9550.114991525, "examples_seen": 52684800.0, "progress": 0.4569150022645933, "epoch": 41.122507838556565, "img/sec/core": 690.9038191362591, "core_hours_NVIDIA A100-SXM4-40GB": 20.489832733504425, "core_hours": 20.489832733504425} {"step": 51500, "global_schedule": 0.6478278636932373, "l2_grads": 1.5646138191223145, "l2_params": 309.2246398925781, "l2_updates": 0.6731495261192322, "train/loss": 2.281834125518799, "uptime": 9559.304054544, "examples_seen": 52736000.0, "progress": 0.4573590401676687, "epoch": 41.16247140302552, "img/sec/core": 696.4801511065349, "core_hours_NVIDIA A100-SXM4-40GB": 20.510252873546644, "core_hours": 20.510252873546644} {"step": 51550, "global_schedule": 0.6470965147018433, "l2_grads": 1.4909553527832031, "l2_params": 309.14239501953125, "l2_updates": 0.6774449944496155, "train/loss": 3.5477957725524902, "uptime": 9569.196234731002, "examples_seen": 52787200.0, "progress": 0.4578030780707441, "epoch": 41.20243496749448, "img/sec/core": 646.9756796797361, "core_hours_NVIDIA A100-SXM4-40GB": 20.53223549618443, "core_hours": 20.53223549618443} {"step": 51600, "global_schedule": 0.646364688873291, "l2_grads": 1.5600820779800415, "l2_params": 309.04888916015625, "l2_updates": 0.6865316033363342, "train/loss": 2.2914090156555176, "uptime": 9578.783055458001, "examples_seen": 52838400.0, "progress": 0.4582471159738195, "epoch": 41.24239853196344, "img/sec/core": 667.583152147149, "core_hours_NVIDIA A100-SXM4-40GB": 20.553539542244426, "core_hours": 20.553539542244426} {"step": 51650, "global_schedule": 0.6456326246261597, "l2_grads": 1.3113189935684204, "l2_params": 308.9656066894531, "l2_updates": 0.6807501316070557, "train/loss": 3.6828463077545166, "uptime": 9588.302911186, "examples_seen": 52889600.0, "progress": 0.4586911538768949, "epoch": 41.282362096432394, "img/sec/core": 672.2790956986231, "core_hours_NVIDIA A100-SXM4-40GB": 20.574694777195532, "core_hours": 20.574694777195532} {"step": 51700, "global_schedule": 0.6449000835418701, "l2_grads": 1.225186824798584, "l2_params": 308.87255859375, "l2_updates": 0.6784974336624146, "train/loss": 3.783341884613037, "uptime": 9598.061276522001, "examples_seen": 52940800.0, "progress": 0.45913519177997036, "epoch": 41.32232566090135, "img/sec/core": 655.8475502437326, "core_hours_NVIDIA A100-SXM4-40GB": 20.59638003349776, "core_hours": 20.59638003349776} {"step": 51750, "global_schedule": 0.6441673636436462, "l2_grads": 1.261705756187439, "l2_params": 308.7956237792969, "l2_updates": 0.6836134195327759, "train/loss": 3.5213119983673096, "uptime": 9607.665169746999, "examples_seen": 52992000.0, "progress": 0.45957922968304576, "epoch": 41.362289225370304, "img/sec/core": 666.3964134192678, "core_hours_NVIDIA A100-SXM4-40GB": 20.617722018442198, "core_hours": 20.617722018442198} {"step": 51800, "global_schedule": 0.6434341669082642, "l2_grads": 1.2970666885375977, "l2_params": 308.7203674316406, "l2_updates": 0.6867634057998657, "train/loss": 4.4224853515625, "uptime": 9617.353169488999, "examples_seen": 53043200.0, "progress": 0.46002326758612117, "epoch": 41.40225278983927, "img/sec/core": 660.6110828279926, "core_hours_NVIDIA A100-SXM4-40GB": 20.639250906757756, "core_hours": 20.639250906757756} {"step": 51850, "global_schedule": 0.6427006721496582, "l2_grads": 1.3405380249023438, "l2_params": 308.65167236328125, "l2_updates": 0.6763172745704651, "train/loss": 3.885841131210327, "uptime": 9625.891512791002, "examples_seen": 53094400.0, "progress": 0.46046730548919657, "epoch": 41.44221635430822, "img/sec/core": 749.5599290905035, "core_hours_NVIDIA A100-SXM4-40GB": 20.658225002984427, "core_hours": 20.658225002984427} {"step": 51900, "global_schedule": 0.6419669389724731, "l2_grads": 1.5383251905441284, "l2_params": 308.5615234375, "l2_updates": 0.6806886792182922, "train/loss": 2.4158036708831787, "uptime": 9634.660020705001, "examples_seen": 53145600.0, "progress": 0.46091134339227197, "epoch": 41.48217991877718, "img/sec/core": 729.8847264290196, "core_hours_NVIDIA A100-SXM4-40GB": 20.677710576126646, "core_hours": 20.677710576126646} {"step": 51950, "global_schedule": 0.6412328481674194, "l2_grads": 1.2507555484771729, "l2_params": 308.4858093261719, "l2_updates": 0.6816542744636536, "train/loss": 4.141085147857666, "uptime": 9643.387117197, "examples_seen": 53196800.0, "progress": 0.46135538129534737, "epoch": 41.52214348324613, "img/sec/core": 733.3481422908003, "core_hours_NVIDIA A100-SXM4-40GB": 20.69710412388665, "core_hours": 20.69710412388665} {"step": 52000, "global_schedule": 0.6404983997344971, "l2_grads": 1.5693622827529907, "l2_params": 308.4143981933594, "l2_updates": 0.6737325191497803, "train/loss": 2.3001091480255127, "uptime": 9653.063637266, "examples_seen": 53248000.0, "progress": 0.46179941919842277, "epoch": 41.56210704771509, "img/sec/core": 661.3947942405487, "core_hours_NVIDIA A100-SXM4-40GB": 20.718607501817754, "core_hours": 20.718607501817754} {"step": 52050, "global_schedule": 0.6397635340690613, "l2_grads": 1.4774340391159058, "l2_params": 308.345947265625, "l2_updates": 0.6813518404960632, "train/loss": 2.389467477798462, "uptime": 9662.330605297999, "examples_seen": 53299200.0, "progress": 0.46224345710149817, "epoch": 41.60207061218405, "img/sec/core": 741.8628248349391, "core_hours_NVIDIA A100-SXM4-40GB": 20.737778461388867, "core_hours": 20.737778461388867} {"step": 52100, "global_schedule": 0.6390284299850464, "l2_grads": 1.277623176574707, "l2_params": 308.2608947753906, "l2_updates": 0.6688383221626282, "train/loss": 4.4615068435668945, "uptime": 9671.709522808002, "examples_seen": 53350400.0, "progress": 0.46268749500457357, "epoch": 41.642034176653006, "img/sec/core": 682.3815214468278, "core_hours_NVIDIA A100-SXM4-40GB": 20.758620500299983, "core_hours": 20.758620500299983} {"step": 52150, "global_schedule": 0.6382929682731628, "l2_grads": 1.5066944360733032, "l2_params": 308.1698303222656, "l2_updates": 0.676705002784729, "train/loss": 2.3437788486480713, "uptime": 9680.675655443001, "examples_seen": 53401600.0, "progress": 0.463131532907649, "epoch": 41.68199774112196, "img/sec/core": 713.7971587680219, "core_hours_NVIDIA A100-SXM4-40GB": 20.778545239488874, "core_hours": 20.778545239488874} {"step": 52200, "global_schedule": 0.6375571489334106, "l2_grads": 1.5984488725662231, "l2_params": 308.0919494628906, "l2_updates": 0.672659695148468, "train/loss": 2.397078514099121, "uptime": 9690.634102339, "examples_seen": 53452800.0, "progress": 0.4635755708107244, "epoch": 41.721961305590916, "img/sec/core": 642.6704953933873, "core_hours_NVIDIA A100-SXM4-40GB": 20.80067512147998, "core_hours": 20.80067512147998} {"step": 52250, "global_schedule": 0.6368211507797241, "l2_grads": 1.4638842344284058, "l2_params": 307.9975280761719, "l2_updates": 0.6810303330421448, "train/loss": 2.6322951316833496, "uptime": 9700.375431486, "examples_seen": 53504000.0, "progress": 0.4640196087137998, "epoch": 41.76192487005987, "img/sec/core": 656.9945336433727, "core_hours_NVIDIA A100-SXM4-40GB": 20.822322519584425, "core_hours": 20.822322519584425} {"step": 52300, "global_schedule": 0.6360846757888794, "l2_grads": 1.4961605072021484, "l2_params": 307.9372863769531, "l2_updates": 0.679079532623291, "train/loss": 2.576754331588745, "uptime": 9710.119787056, "examples_seen": 53555200.0, "progress": 0.4644636466168752, "epoch": 41.801888434528834, "img/sec/core": 656.7904828619983, "core_hours_NVIDIA A100-SXM4-40GB": 20.843976643073315, "core_hours": 20.843976643073315} {"step": 52350, "global_schedule": 0.6353479623794556, "l2_grads": 1.6756051778793335, "l2_params": 307.86029052734375, "l2_updates": 0.6758036613464355, "train/loss": 2.1148011684417725, "uptime": 9719.434365512001, "examples_seen": 53606400.0, "progress": 0.4649076845199506, "epoch": 41.84185199899779, "img/sec/core": 687.0949694859587, "core_hours_NVIDIA A100-SXM4-40GB": 20.86467570630887, "core_hours": 20.86467570630887} {"step": 52400, "global_schedule": 0.6346108913421631, "l2_grads": 1.772540807723999, "l2_params": 307.7851257324219, "l2_updates": 0.6543031334877014, "train/loss": 2.3543052673339844, "uptime": 9728.087242147, "examples_seen": 53657600.0, "progress": 0.465351722423026, "epoch": 41.881815563466745, "img/sec/core": 739.6384196804383, "core_hours_NVIDIA A100-SXM4-40GB": 20.883904321053315, "core_hours": 20.883904321053315} {"step": 52450, "global_schedule": 0.633873462677002, "l2_grads": 1.4129711389541626, "l2_params": 307.6946716308594, "l2_updates": 0.661363422870636, "train/loss": 4.836592674255371, "uptime": 9736.761439995002, "examples_seen": 53708800.0, "progress": 0.4657957603261014, "epoch": 41.9217791279357, "img/sec/core": 737.8203854865958, "core_hours_NVIDIA A100-SXM4-40GB": 20.903180316271097, "core_hours": 20.903180316271097} {"step": 52500, "global_schedule": 0.6331358551979065, "l2_grads": 1.5094108581542969, "l2_params": 307.638427734375, "l2_updates": 0.6742914319038391, "train/loss": 2.264031410217285, "uptime": 9745.379841651002, "examples_seen": 53760000.0, "progress": 0.4662397982291768, "epoch": 41.96174269240466, "img/sec/core": 742.5970911374701, "core_hours_NVIDIA A100-SXM4-40GB": 20.9223323199511, "core_hours": 20.9223323199511, "val/acc@1": 0.6558, "val/loss": 1.4224783081054688, "z/secs/eval/val": 2.751949677000084} {"step": 52550, "global_schedule": 0.6323978900909424, "l2_grads": 1.3654272556304932, "l2_params": 307.5448303222656, "l2_updates": 0.6715793013572693, "train/loss": 3.0708930492401123, "uptime": 9757.200155188, "examples_seen": 53811200.0, "progress": 0.4666838361322522, "epoch": 42.00170625687362, "img/sec/core": 705.8427883770537, "core_hours_NVIDIA A100-SXM4-40GB": 20.9424815974622, "core_hours": 20.9424815974622} {"step": 52600, "global_schedule": 0.6316596269607544, "l2_grads": 1.3514164686203003, "l2_params": 307.45184326171875, "l2_updates": 0.665386974811554, "train/loss": 2.999256134033203, "uptime": 9765.941809967002, "examples_seen": 53862400.0, "progress": 0.46712787403532763, "epoch": 42.04166982134257, "img/sec/core": 732.126829736336, "core_hours_NVIDIA A100-SXM4-40GB": 20.961907496971094, "core_hours": 20.961907496971094} {"step": 52650, "global_schedule": 0.630920946598053, "l2_grads": 1.5101648569107056, "l2_params": 307.37799072265625, "l2_updates": 0.6676438450813293, "train/loss": 2.2620365619659424, "uptime": 9775.632386316001, "examples_seen": 53913600.0, "progress": 0.4675719119384031, "epoch": 42.08163338581153, "img/sec/core": 660.4354343341812, "core_hours_NVIDIA A100-SXM4-40GB": 20.98344211107998, "core_hours": 20.98344211107998} {"step": 52700, "global_schedule": 0.6301820278167725, "l2_grads": 1.412743091583252, "l2_params": 307.30084228515625, "l2_updates": 0.6577250361442566, "train/loss": 2.733288288116455, "uptime": 9785.360919370001, "examples_seen": 53964800.0, "progress": 0.4680159498414785, "epoch": 42.121596950280484, "img/sec/core": 657.8586889180236, "core_hours_NVIDIA A100-SXM4-40GB": 21.005061073422205, "core_hours": 21.005061073422205} {"step": 52750, "global_schedule": 0.6294428110122681, "l2_grads": 1.4485728740692139, "l2_params": 307.2298889160156, "l2_updates": 0.6714591979980469, "train/loss": 2.374164581298828, "uptime": 9794.306121427, "examples_seen": 54016000.0, "progress": 0.4684599877445539, "epoch": 42.161560514749446, "img/sec/core": 715.4673487775013, "core_hours_NVIDIA A100-SXM4-40GB": 21.024939300215536, "core_hours": 21.024939300215536} {"step": 52800, "global_schedule": 0.628703236579895, "l2_grads": 1.5103075504302979, "l2_params": 307.14569091796875, "l2_updates": 0.6626713275909424, "train/loss": 2.405097007751465, "uptime": 9803.228308083, "examples_seen": 54067200.0, "progress": 0.4689040256476293, "epoch": 42.2015240792184, "img/sec/core": 717.312946562941, "core_hours_NVIDIA A100-SXM4-40GB": 21.044766381673313, "core_hours": 21.044766381673313} {"step": 52850, "global_schedule": 0.6279634237289429, "l2_grads": 1.5243006944656372, "l2_params": 307.0726623535156, "l2_updates": 0.659514844417572, "train/loss": 2.41129207611084, "uptime": 9812.346478559002, "examples_seen": 54118400.0, "progress": 0.4693480635507047, "epoch": 42.24148764368736, "img/sec/core": 701.8951901419365, "core_hours_NVIDIA A100-SXM4-40GB": 21.065028982731096, "core_hours": 21.065028982731096} {"step": 52900, "global_schedule": 0.6272233128547668, "l2_grads": 1.4346935749053955, "l2_params": 306.9937744140625, "l2_updates": 0.6578906178474426, "train/loss": 2.704936981201172, "uptime": 9820.947502218, "examples_seen": 54169600.0, "progress": 0.4697921014537801, "epoch": 42.28145120815631, "img/sec/core": 744.0974765027112, "core_hours_NVIDIA A100-SXM4-40GB": 21.084142368639977, "core_hours": 21.084142368639977} {"step": 52950, "global_schedule": 0.6264828443527222, "l2_grads": 1.5163401365280151, "l2_params": 306.91900634765625, "l2_updates": 0.6750123500823975, "train/loss": 2.390340805053711, "uptime": 9829.643556312001, "examples_seen": 54220800.0, "progress": 0.4702361393568555, "epoch": 42.32141477262527, "img/sec/core": 735.9659830559835, "core_hours_NVIDIA A100-SXM4-40GB": 21.103466933293316, "core_hours": 21.103466933293316} {"step": 53000, "global_schedule": 0.6257421374320984, "l2_grads": 1.4187543392181396, "l2_params": 306.8415222167969, "l2_updates": 0.6534008979797363, "train/loss": 4.500828742980957, "uptime": 9838.361798246, "examples_seen": 54272000.0, "progress": 0.4706801772599309, "epoch": 42.36137833709423, "img/sec/core": 734.0929568657326, "core_hours_NVIDIA A100-SXM4-40GB": 21.122840804257756, "core_hours": 21.122840804257756} {"step": 53050, "global_schedule": 0.625001072883606, "l2_grads": 1.569814682006836, "l2_params": 306.7688903808594, "l2_updates": 0.6692389249801636, "train/loss": 2.3235626220703125, "uptime": 9848.217984301, "examples_seen": 54323200.0, "progress": 0.4711242151630063, "epoch": 42.401341901563185, "img/sec/core": 719.1394023355317, "core_hours_NVIDIA A100-SXM4-40GB": 21.14261752929331, "core_hours": 21.14261752929331} {"step": 53100, "global_schedule": 0.6242598295211792, "l2_grads": 1.3882509469985962, "l2_params": 306.6887512207031, "l2_updates": 0.650177001953125, "train/loss": 4.314540863037109, "uptime": 9856.980967439, "examples_seen": 54374400.0, "progress": 0.47156825306608174, "epoch": 42.44130546603214, "img/sec/core": 730.3448950217544, "core_hours_NVIDIA A100-SXM4-40GB": 21.162090825155534, "core_hours": 21.162090825155534} {"step": 53150, "global_schedule": 0.6235182285308838, "l2_grads": 1.5015348196029663, "l2_params": 306.6195373535156, "l2_updates": 0.6392885446548462, "train/loss": 3.015864849090576, "uptime": 9866.623829738002, "examples_seen": 54425600.0, "progress": 0.47201229096915714, "epoch": 42.481269030501096, "img/sec/core": 663.7033488139804, "core_hours_NVIDIA A100-SXM4-40GB": 21.18351940804221, "core_hours": 21.18351940804221} {"step": 53200, "global_schedule": 0.6227763295173645, "l2_grads": 1.6506741046905518, "l2_params": 306.5337829589844, "l2_updates": 0.6538631916046143, "train/loss": 2.519071340560913, "uptime": 9876.311094745999, "examples_seen": 54476800.0, "progress": 0.47245632887223254, "epoch": 42.52123259497005, "img/sec/core": 660.6611871066656, "core_hours_NVIDIA A100-SXM4-40GB": 21.20504666361553, "core_hours": 21.20504666361553} {"step": 53250, "global_schedule": 0.6220341920852661, "l2_grads": 1.6352880001068115, "l2_params": 306.44744873046875, "l2_updates": 0.6562982797622681, "train/loss": 2.4287943840026855, "uptime": 9885.971455981, "examples_seen": 54528000.0, "progress": 0.47290036677530795, "epoch": 42.561196159439014, "img/sec/core": 662.5011057362815, "core_hours_NVIDIA A100-SXM4-40GB": 21.226514133026644, "core_hours": 21.226514133026644} {"step": 53300, "global_schedule": 0.6212916970252991, "l2_grads": 1.503448724746704, "l2_params": 306.376953125, "l2_updates": 0.6635541319847107, "train/loss": 2.3619070053100586, "uptime": 9894.674658025002, "examples_seen": 54579200.0, "progress": 0.47334440467838335, "epoch": 42.60115972390797, "img/sec/core": 735.361533334818, "core_hours_NVIDIA A100-SXM4-40GB": 21.245854582013315, "core_hours": 21.245854582013315} {"step": 53350, "global_schedule": 0.6205489635467529, "l2_grads": 1.4657336473464966, "l2_params": 306.2914123535156, "l2_updates": 0.6466558575630188, "train/loss": 4.671845436096191, "uptime": 9903.24419006, "examples_seen": 54630400.0, "progress": 0.47378844258145875, "epoch": 42.641123288376924, "img/sec/core": 746.831912625083, "core_hours_NVIDIA A100-SXM4-40GB": 21.264897986535534, "core_hours": 21.264897986535534} {"step": 53400, "global_schedule": 0.6198058724403381, "l2_grads": 1.3039308786392212, "l2_params": 306.2045593261719, "l2_updates": 0.6609634757041931, "train/loss": 4.620832920074463, "uptime": 9911.889227714999, "examples_seen": 54681600.0, "progress": 0.47423248048453415, "epoch": 42.68108685284588, "img/sec/core": 740.3090946977784, "core_hours_NVIDIA A100-SXM4-40GB": 21.28410918132442, "core_hours": 21.28410918132442} {"step": 53450, "global_schedule": 0.619062602519989, "l2_grads": 1.5359930992126465, "l2_params": 306.1252746582031, "l2_updates": 0.6465016603469849, "train/loss": 2.9179275035858154, "uptime": 9920.551950041, "examples_seen": 54732800.0, "progress": 0.47467651838760955, "epoch": 42.72105041731484, "img/sec/core": 738.7977773212348, "core_hours_NVIDIA A100-SXM4-40GB": 21.303359675382197, "core_hours": 21.303359675382197} {"step": 53500, "global_schedule": 0.6183189749717712, "l2_grads": 1.4519723653793335, "l2_params": 306.0487060546875, "l2_updates": 0.647079348564148, "train/loss": 4.739753723144531, "uptime": 9929.152898667, "examples_seen": 54784000.0, "progress": 0.47512055629068495, "epoch": 42.7610139817838, "img/sec/core": 744.1039678638036, "core_hours_NVIDIA A100-SXM4-40GB": 21.32247289455109, "core_hours": 21.32247289455109} {"step": 53550, "global_schedule": 0.6175751090049744, "l2_grads": 1.5101847648620605, "l2_params": 305.9662170410156, "l2_updates": 0.6440611481666565, "train/loss": 2.4448366165161133, "uptime": 9937.636147723, "examples_seen": 54835200.0, "progress": 0.4755645941937604, "epoch": 42.80097754625275, "img/sec/core": 754.4279270538779, "core_hours_NVIDIA A100-SXM4-40GB": 21.34132455911998, "core_hours": 21.34132455911998} {"step": 53600, "global_schedule": 0.6168309450149536, "l2_grads": 1.5642080307006836, "l2_params": 305.87457275390625, "l2_updates": 0.6601574420928955, "train/loss": 2.3956313133239746, "uptime": 9946.305181864, "examples_seen": 54886400.0, "progress": 0.4760086320968358, "epoch": 42.84094111072171, "img/sec/core": 738.2598679282813, "core_hours_NVIDIA A100-SXM4-40GB": 21.360589079433314, "core_hours": 21.360589079433314} {"step": 53650, "global_schedule": 0.6160865426063538, "l2_grads": 1.4128094911575317, "l2_params": 305.7962951660156, "l2_updates": 0.6521305441856384, "train/loss": 3.896117687225342, "uptime": 9955.05647433, "examples_seen": 54937600.0, "progress": 0.4764526699999112, "epoch": 42.88090467519066, "img/sec/core": 731.3205477778934, "core_hours_NVIDIA A100-SXM4-40GB": 21.380036396024423, "core_hours": 21.380036396024423} {"step": 53700, "global_schedule": 0.61534184217453, "l2_grads": 1.566683292388916, "l2_params": 305.722900390625, "l2_updates": 0.6466110944747925, "train/loss": 3.0785014629364014, "uptime": 9963.875972521999, "examples_seen": 54988800.0, "progress": 0.4768967079029866, "epoch": 42.920868239659626, "img/sec/core": 725.6648689838441, "core_hours_NVIDIA A100-SXM4-40GB": 21.39963528089553, "core_hours": 21.39963528089553} {"step": 53750, "global_schedule": 0.6145968437194824, "l2_grads": 1.34964919090271, "l2_params": 305.6392822265625, "l2_updates": 0.6446720361709595, "train/loss": 3.1678214073181152, "uptime": 9972.608081297001, "examples_seen": 55040000.0, "progress": 0.477340745806062, "epoch": 42.96083180412858, "img/sec/core": 732.9271960424278, "core_hours_NVIDIA A100-SXM4-40GB": 21.4190399670622, "core_hours": 21.4190399670622} {"step": 53800, "global_schedule": 0.6138516664505005, "l2_grads": 1.4592223167419434, "l2_params": 305.53753662109375, "l2_updates": 0.6488744020462036, "train/loss": 2.5772480964660645, "uptime": 9982.122145754, "examples_seen": 55091200.0, "progress": 0.4777847837091374, "epoch": 43.00079536859754, "img/sec/core": 672.6883162213934, "core_hours_NVIDIA A100-SXM4-40GB": 21.440182332522202, "core_hours": 21.440182332522202} {"step": 53850, "global_schedule": 0.6131061911582947, "l2_grads": 1.6260361671447754, "l2_params": 305.4508361816406, "l2_updates": 0.6533123850822449, "train/loss": 2.488295316696167, "uptime": 9990.716062583999, "examples_seen": 55142400.0, "progress": 0.4782288216122128, "epoch": 43.04075893306649, "img/sec/core": 744.712815658071, "core_hours_NVIDIA A100-SXM4-40GB": 21.45927992547775, "core_hours": 21.45927992547775} {"step": 53900, "global_schedule": 0.612360417842865, "l2_grads": 1.4425281286239624, "l2_params": 305.382568359375, "l2_updates": 0.6417940855026245, "train/loss": 2.4407284259796143, "uptime": 9999.476990203, "examples_seen": 55193600.0, "progress": 0.4786728595152882, "epoch": 43.08072249753545, "img/sec/core": 730.5162510553257, "core_hours_NVIDIA A100-SXM4-40GB": 21.47874865351998, "core_hours": 21.47874865351998} {"step": 53950, "global_schedule": 0.6116144061088562, "l2_grads": 1.6069616079330444, "l2_params": 305.29547119140625, "l2_updates": 0.6294806003570557, "train/loss": 2.601043939590454, "uptime": 10008.119551519, "examples_seen": 55244800.0, "progress": 0.4791168974183636, "epoch": 43.12068606200441, "img/sec/core": 740.5212142553581, "core_hours_NVIDIA A100-SXM4-40GB": 21.49795434533331, "core_hours": 21.49795434533331} {"step": 54000, "global_schedule": 0.6108680963516235, "l2_grads": 1.5505635738372803, "l2_params": 305.2066345214844, "l2_updates": 0.6371201872825623, "train/loss": 4.673409938812256, "uptime": 10016.796904049, "examples_seen": 55296000.0, "progress": 0.47956093532143906, "epoch": 43.160649626473365, "img/sec/core": 737.5521482932062, "core_hours_NVIDIA A100-SXM4-40GB": 21.517237350955536, "core_hours": 21.517237350955536} {"step": 54050, "global_schedule": 0.6101216077804565, "l2_grads": 1.6109713315963745, "l2_params": 305.1218566894531, "l2_updates": 0.6562816500663757, "train/loss": 2.3011395931243896, "uptime": 10026.569588667002, "examples_seen": 55347200.0, "progress": 0.48000497322451446, "epoch": 43.20061319094232, "img/sec/core": 727.2883334751205, "core_hours_NVIDIA A100-SXM4-40GB": 21.536792486886654, "core_hours": 21.536792486886654} {"step": 54100, "global_schedule": 0.6093747615814209, "l2_grads": 1.4320344924926758, "l2_params": 305.0281677246094, "l2_updates": 0.6443023085594177, "train/loss": 2.8631863594055176, "uptime": 10036.136303276, "examples_seen": 55398400.0, "progress": 0.48044901112758986, "epoch": 43.240576755411276, "img/sec/core": 668.9861944852373, "core_hours_NVIDIA A100-SXM4-40GB": 21.558051852684425, "core_hours": 21.558051852684425} {"step": 54150, "global_schedule": 0.6086276769638062, "l2_grads": 1.388229489326477, "l2_params": 304.952880859375, "l2_updates": 0.6410827040672302, "train/loss": 4.644575119018555, "uptime": 10045.444742587, "examples_seen": 55449600.0, "progress": 0.48089304903066526, "epoch": 43.28054031988023, "img/sec/core": 687.5481255420331, "core_hours_NVIDIA A100-SXM4-40GB": 21.57873727337554, "core_hours": 21.57873727337554} {"step": 54200, "global_schedule": 0.6078803539276123, "l2_grads": 1.3614641427993774, "l2_params": 304.8727111816406, "l2_updates": 0.6330508589744568, "train/loss": 4.608335494995117, "uptime": 10054.025431138, "examples_seen": 55500800.0, "progress": 0.48133708693374067, "epoch": 43.32050388434919, "img/sec/core": 745.8608900628083, "core_hours_NVIDIA A100-SXM4-40GB": 21.59780547015554, "core_hours": 21.59780547015554} {"step": 54250, "global_schedule": 0.6071327924728394, "l2_grads": 1.6203327178955078, "l2_params": 304.7847900390625, "l2_updates": 0.6493428349494934, "train/loss": 2.25481915473938, "uptime": 10062.612150867999, "examples_seen": 55552000.0, "progress": 0.48178112483681607, "epoch": 43.36046744881815, "img/sec/core": 745.3370089209146, "core_hours_NVIDIA A100-SXM4-40GB": 21.61688706955554, "core_hours": 21.61688706955554} {"step": 54300, "global_schedule": 0.6063849925994873, "l2_grads": 1.342129111289978, "l2_params": 304.723388671875, "l2_updates": 0.6456826329231262, "train/loss": 4.634005546569824, "uptime": 10071.474384310002, "examples_seen": 55603200.0, "progress": 0.48222516273989147, "epoch": 43.400431013287104, "img/sec/core": 722.1655852199323, "core_hours_NVIDIA A100-SXM4-40GB": 21.63658092164888, "core_hours": 21.63658092164888} {"step": 54350, "global_schedule": 0.6056368947029114, "l2_grads": 1.5726841688156128, "l2_params": 304.6285705566406, "l2_updates": 0.6474576592445374, "train/loss": 2.304208517074585, "uptime": 10079.974678202, "examples_seen": 55654400.0, "progress": 0.48266920064296687, "epoch": 43.44039457775606, "img/sec/core": 752.9151440311479, "core_hours_NVIDIA A100-SXM4-40GB": 21.655470463631094, "core_hours": 21.655470463631094} {"step": 54400, "global_schedule": 0.6048885583877563, "l2_grads": 1.5318472385406494, "l2_params": 304.55419921875, "l2_updates": 0.6408045887947083, "train/loss": 2.241492748260498, "uptime": 10089.151010847001, "examples_seen": 55705600.0, "progress": 0.48311323854604227, "epoch": 43.48035814222502, "img/sec/core": 697.4463816420127, "core_hours_NVIDIA A100-SXM4-40GB": 21.675862313953317, "core_hours": 21.675862313953317} {"step": 54450, "global_schedule": 0.604140043258667, "l2_grads": 1.4937924146652222, "l2_params": 304.4705505371094, "l2_updates": 0.6392737030982971, "train/loss": 2.5285937786102295, "uptime": 10099.015205204001, "examples_seen": 55756800.0, "progress": 0.4835572764491177, "epoch": 43.52032170669398, "img/sec/core": 648.8112225260712, "core_hours_NVIDIA A100-SXM4-40GB": 21.69778274585776, "core_hours": 21.69778274585776} {"step": 54500, "global_schedule": 0.6033912301063538, "l2_grads": 1.4430066347122192, "l2_params": 304.3947448730469, "l2_updates": 0.6422523260116577, "train/loss": 2.8849945068359375, "uptime": 10108.42384895, "examples_seen": 55808000.0, "progress": 0.4840013143521931, "epoch": 43.56028527116293, "img/sec/core": 680.2255641490821, "core_hours_NVIDIA A100-SXM4-40GB": 21.718690843071094, "core_hours": 21.718690843071094} {"step": 54550, "global_schedule": 0.6026421785354614, "l2_grads": 1.438356876373291, "l2_params": 304.31231689453125, "l2_updates": 0.6331837773323059, "train/loss": 3.4497833251953125, "uptime": 10117.747039181, "examples_seen": 55859200.0, "progress": 0.4844453522552685, "epoch": 43.60024883563189, "img/sec/core": 686.4603039761862, "core_hours_NVIDIA A100-SXM4-40GB": 21.739409043584427, "core_hours": 21.739409043584427} {"step": 54600, "global_schedule": 0.60189288854599, "l2_grads": 1.651167869567871, "l2_params": 304.2444152832031, "l2_updates": 0.6287528276443481, "train/loss": 2.314094305038452, "uptime": 10127.659484746999, "examples_seen": 55910400.0, "progress": 0.4848893901583439, "epoch": 43.64021240010084, "img/sec/core": 645.6529781059452, "core_hours_NVIDIA A100-SXM4-40GB": 21.76143670039776, "core_hours": 21.76143670039776} {"step": 54650, "global_schedule": 0.6011433601379395, "l2_grads": 1.3248943090438843, "l2_params": 304.1644287109375, "l2_updates": 0.6412506699562073, "train/loss": 3.3604369163513184, "uptime": 10137.246039704, "examples_seen": 55961600.0, "progress": 0.4853334280614193, "epoch": 43.680175964569806, "img/sec/core": 667.6016596896754, "core_hours_NVIDIA A100-SXM4-40GB": 21.78274015585776, "core_hours": 21.78274015585776} {"step": 54700, "global_schedule": 0.6003935933113098, "l2_grads": 1.3372749090194702, "l2_params": 304.0826416015625, "l2_updates": 0.6288556456565857, "train/loss": 4.025509834289551, "uptime": 10146.201224518, "examples_seen": 56012800.0, "progress": 0.4857774659644947, "epoch": 43.72013952903876, "img/sec/core": 714.6697843683426, "core_hours_NVIDIA A100-SXM4-40GB": 21.802640566555535, "core_hours": 21.802640566555535} {"step": 54750, "global_schedule": 0.5996435284614563, "l2_grads": 1.2978825569152832, "l2_params": 303.9941711425781, "l2_updates": 0.6260387301445007, "train/loss": 4.273636341094971, "uptime": 10155.970636689, "examples_seen": 56064000.0, "progress": 0.4862215038675701, "epoch": 43.760103093507716, "img/sec/core": 655.1059457801773, "core_hours_NVIDIA A100-SXM4-40GB": 21.824350371379982, "core_hours": 21.824350371379982} {"step": 54800, "global_schedule": 0.5988933444023132, "l2_grads": 1.4775364398956299, "l2_params": 303.9147644042969, "l2_updates": 0.6362437605857849, "train/loss": 2.2354700565338135, "uptime": 10165.787527292001, "examples_seen": 56115200.0, "progress": 0.4866655417706455, "epoch": 43.80006665797667, "img/sec/core": 651.9375898967296, "core_hours_NVIDIA A100-SXM4-40GB": 21.846165683831096, "core_hours": 21.846165683831096} {"step": 54850, "global_schedule": 0.5981428623199463, "l2_grads": 1.6342467069625854, "l2_params": 303.8172912597656, "l2_updates": 0.6394461393356323, "train/loss": 2.248473644256592, "uptime": 10175.652914166001, "examples_seen": 56166400.0, "progress": 0.4871095796737209, "epoch": 43.84003022244563, "img/sec/core": 648.732794946632, "core_hours_NVIDIA A100-SXM4-40GB": 21.86808876577332, "core_hours": 21.86808876577332} {"step": 54900, "global_schedule": 0.597392201423645, "l2_grads": 1.5544674396514893, "l2_params": 303.7635803222656, "l2_updates": 0.6332225799560547, "train/loss": 4.670480251312256, "uptime": 10185.404108533, "examples_seen": 56217600.0, "progress": 0.4875536175767963, "epoch": 43.87999378691459, "img/sec/core": 656.3298565413775, "core_hours_NVIDIA A100-SXM4-40GB": 21.889758086588873, "core_hours": 21.889758086588873} {"step": 54950, "global_schedule": 0.5966412425041199, "l2_grads": 1.4941757917404175, "l2_params": 303.7153625488281, "l2_updates": 0.6428508162498474, "train/loss": 2.710559129714966, "uptime": 10195.333234676002, "examples_seen": 56268800.0, "progress": 0.4879976554798718, "epoch": 43.919957351383545, "img/sec/core": 644.5683041816817, "core_hours_NVIDIA A100-SXM4-40GB": 21.911822811351097, "core_hours": 21.911822811351097} {"step": 55000, "global_schedule": 0.5958901047706604, "l2_grads": 1.4328583478927612, "l2_params": 303.6346130371094, "l2_updates": 0.6267683506011963, "train/loss": 2.961815118789673, "uptime": 10205.085501956999, "examples_seen": 56320000.0, "progress": 0.4884416933829472, "epoch": 43.9599209158525, "img/sec/core": 656.2576491797603, "core_hours_NVIDIA A100-SXM4-40GB": 21.93349451641998, "core_hours": 21.93349451641998, "val/acc@1": 0.66232, "val/loss": 1.3781276879882813, "z/secs/eval/val": 2.644616600999143} {"step": 55050, "global_schedule": 0.5951387882232666, "l2_grads": 1.5226681232452393, "l2_params": 303.5618896484375, "l2_updates": 0.6225785613059998, "train/loss": 2.647831916809082, "uptime": 10216.707097231001, "examples_seen": 56371200.0, "progress": 0.4888857312860226, "epoch": 43.999884480321455, "img/sec/core": 770.451154599291, "core_hours_NVIDIA A100-SXM4-40GB": 21.95195411913109, "core_hours": 21.95195411913109} {"step": 55100, "global_schedule": 0.5943871140480042, "l2_grads": 1.5867042541503906, "l2_params": 303.4727783203125, "l2_updates": 0.6307452321052551, "train/loss": 2.5659611225128174, "uptime": 10226.556921874, "examples_seen": 56422400.0, "progress": 0.489329769189098, "epoch": 44.03984804479041, "img/sec/core": 649.7577603626627, "core_hours_NVIDIA A100-SXM4-40GB": 21.97384261833776, "core_hours": 21.97384261833776} {"step": 55150, "global_schedule": 0.5936353206634521, "l2_grads": 1.4061481952667236, "l2_params": 303.3857116699219, "l2_updates": 0.6147282123565674, "train/loss": 4.574446678161621, "uptime": 10235.562327479, "examples_seen": 56473600.0, "progress": 0.4897738070921734, "epoch": 44.07981160925937, "img/sec/core": 710.6842579580211, "core_hours_NVIDIA A100-SXM4-40GB": 21.99385463079331, "core_hours": 21.99385463079331} {"step": 55200, "global_schedule": 0.592883288860321, "l2_grads": 1.5342578887939453, "l2_params": 303.3073425292969, "l2_updates": 0.6404469609260559, "train/loss": 2.2234954833984375, "uptime": 10244.313341224, "examples_seen": 56524800.0, "progress": 0.4902178449952488, "epoch": 44.11977517372833, "img/sec/core": 731.3438404386144, "core_hours_NVIDIA A100-SXM4-40GB": 22.013301328004427, "core_hours": 22.013301328004427} {"step": 55250, "global_schedule": 0.5921310186386108, "l2_grads": 1.5804336071014404, "l2_params": 303.22454833984375, "l2_updates": 0.6276599168777466, "train/loss": 2.270806074142456, "uptime": 10253.061521365, "examples_seen": 56576000.0, "progress": 0.4906618828983242, "epoch": 44.159738738197284, "img/sec/core": 731.5807284312289, "core_hours_NVIDIA A100-SXM4-40GB": 22.03274172831776, "core_hours": 22.03274172831776} {"step": 55300, "global_schedule": 0.5913785696029663, "l2_grads": 1.5774881839752197, "l2_params": 303.12890625, "l2_updates": 0.6252732872962952, "train/loss": 2.672541856765747, "uptime": 10262.228278159002, "examples_seen": 56627200.0, "progress": 0.4911059208013996, "epoch": 44.19970230266624, "img/sec/core": 698.1749536747343, "core_hours_NVIDIA A100-SXM4-40GB": 22.053112298971097, "core_hours": 22.053112298971097} {"step": 55350, "global_schedule": 0.5906258225440979, "l2_grads": 1.5606142282485962, "l2_params": 303.0549011230469, "l2_updates": 0.6229596138000488, "train/loss": 2.3650999069213867, "uptime": 10271.051711044, "examples_seen": 56678400.0, "progress": 0.491549958704475, "epoch": 44.239665867135194, "img/sec/core": 725.3412683494039, "core_hours_NVIDIA A100-SXM4-40GB": 22.07271992760442, "core_hours": 22.07271992760442} {"step": 55400, "global_schedule": 0.5898729562759399, "l2_grads": 1.585042953491211, "l2_params": 302.9680480957031, "l2_updates": 0.6292617321014404, "train/loss": 2.293130397796631, "uptime": 10279.890825171, "examples_seen": 56729600.0, "progress": 0.49199399660755044, "epoch": 44.27962943160416, "img/sec/core": 724.0544593094766, "core_hours_NVIDIA A100-SXM4-40GB": 22.092362403442205, "core_hours": 22.092362403442205} {"step": 55450, "global_schedule": 0.5891197919845581, "l2_grads": 1.5050840377807617, "l2_params": 302.9043884277344, "l2_updates": 0.6335341334342957, "train/loss": 2.310183048248291, "uptime": 10288.626494364, "examples_seen": 56780800.0, "progress": 0.49243803451062584, "epoch": 44.31959299607311, "img/sec/core": 732.6284751176769, "core_hours_NVIDIA A100-SXM4-40GB": 22.11177500164887, "core_hours": 22.11177500164887} {"step": 55500, "global_schedule": 0.5883665084838867, "l2_grads": 1.5793521404266357, "l2_params": 302.82177734375, "l2_updates": 0.6165016889572144, "train/loss": 4.311335563659668, "uptime": 10297.370350192, "examples_seen": 56832000.0, "progress": 0.49288207241370124, "epoch": 44.35955656054207, "img/sec/core": 731.9425349517894, "core_hours_NVIDIA A100-SXM4-40GB": 22.131205792377763, "core_hours": 22.131205792377763} {"step": 55550, "global_schedule": 0.5876129865646362, "l2_grads": 1.5469443798065186, "l2_params": 302.712158203125, "l2_updates": 0.6265491247177124, "train/loss": 2.3083841800689697, "uptime": 10306.557954163001, "examples_seen": 56883200.0, "progress": 0.49332611031677664, "epoch": 44.39952012501102, "img/sec/core": 696.5907564366928, "core_hours_NVIDIA A100-SXM4-40GB": 22.151622690091095, "core_hours": 22.151622690091095} {"step": 55600, "global_schedule": 0.5868592858314514, "l2_grads": 1.3716306686401367, "l2_params": 302.6331481933594, "l2_updates": 0.6243539452552795, "train/loss": 3.2362289428710938, "uptime": 10316.029042949, "examples_seen": 56934400.0, "progress": 0.49377014821985205, "epoch": 44.439483689479985, "img/sec/core": 675.740682471642, "core_hours_NVIDIA A100-SXM4-40GB": 22.172669554059983, "core_hours": 22.172669554059983} {"step": 55650, "global_schedule": 0.5861052870750427, "l2_grads": 1.4566645622253418, "l2_params": 302.5581970214844, "l2_updates": 0.6301755905151367, "train/loss": 2.527691125869751, "uptime": 10324.794674350002, "examples_seen": 56985600.0, "progress": 0.49421418612292745, "epoch": 44.47944725394894, "img/sec/core": 730.1242440183488, "core_hours_NVIDIA A100-SXM4-40GB": 22.192148734951097, "core_hours": 22.192148734951097} {"step": 55700, "global_schedule": 0.5853512287139893, "l2_grads": 1.4173932075500488, "l2_params": 302.46331787109375, "l2_updates": 0.6024299263954163, "train/loss": 4.689558506011963, "uptime": 10333.829670406, "examples_seen": 57036800.0, "progress": 0.49465822402600285, "epoch": 44.519410818417896, "img/sec/core": 708.3567010249376, "core_hours_NVIDIA A100-SXM4-40GB": 22.212226503964423, "core_hours": 22.212226503964423} {"step": 55750, "global_schedule": 0.5845968723297119, "l2_grads": 1.517661690711975, "l2_params": 302.3753967285156, "l2_updates": 0.6114862561225891, "train/loss": 4.08290958404541, "uptime": 10343.396169638001, "examples_seen": 57088000.0, "progress": 0.49510226192907825, "epoch": 44.55937438288685, "img/sec/core": 669.0012558189362, "core_hours_NVIDIA A100-SXM4-40GB": 22.23348539114665, "core_hours": 22.23348539114665} {"step": 55800, "global_schedule": 0.5838423371315002, "l2_grads": 1.5143524408340454, "l2_params": 302.2916259765625, "l2_updates": 0.6105530858039856, "train/loss": 2.961463212966919, "uptime": 10352.535856672, "examples_seen": 57139200.0, "progress": 0.49554629983215365, "epoch": 44.59933794735581, "img/sec/core": 700.2427956441057, "core_hours_NVIDIA A100-SXM4-40GB": 22.25379580677776, "core_hours": 22.25379580677776} {"step": 55850, "global_schedule": 0.5830876231193542, "l2_grads": 1.6152678728103638, "l2_params": 302.2019958496094, "l2_updates": 0.6177962422370911, "train/loss": 2.469407558441162, "uptime": 10361.309165899, "examples_seen": 57190400.0, "progress": 0.4959903377352291, "epoch": 44.63930151182477, "img/sec/core": 729.4852870687084, "core_hours_NVIDIA A100-SXM4-40GB": 22.273292049504427, "core_hours": 22.273292049504427} {"step": 55900, "global_schedule": 0.5823326706886292, "l2_grads": 1.4598524570465088, "l2_params": 302.127685546875, "l2_updates": 0.6163038015365601, "train/loss": 2.8089284896850586, "uptime": 10369.964433042, "examples_seen": 57241600.0, "progress": 0.4964343756383045, "epoch": 44.679265076293724, "img/sec/core": 739.4341381104659, "core_hours_NVIDIA A100-SXM4-40GB": 22.29252597648887, "core_hours": 22.29252597648887} {"step": 55950, "global_schedule": 0.5815775394439697, "l2_grads": 1.4857264757156372, "l2_params": 302.0369873046875, "l2_updates": 0.602643609046936, "train/loss": 2.7916975021362305, "uptime": 10378.633508247001, "examples_seen": 57292800.0, "progress": 0.4968784135413799, "epoch": 44.71922864076268, "img/sec/core": 738.2563709111037, "core_hours_NVIDIA A100-SXM4-40GB": 22.31179058805554, "core_hours": 22.31179058805554} {"step": 56000, "global_schedule": 0.580822229385376, "l2_grads": 1.4232555627822876, "l2_params": 301.95465087890625, "l2_updates": 0.6096186637878418, "train/loss": 3.363635540008545, "uptime": 10388.544018229002, "examples_seen": 57344000.0, "progress": 0.4973224514444553, "epoch": 44.759192205231635, "img/sec/core": 645.7790781325588, "core_hours_NVIDIA A100-SXM4-40GB": 22.333813943571098, "core_hours": 22.333813943571098} {"step": 56050, "global_schedule": 0.5800666809082031, "l2_grads": 1.4221097230911255, "l2_params": 301.87335205078125, "l2_updates": 0.6145057678222656, "train/loss": 2.7418718338012695, "uptime": 10398.526159523002, "examples_seen": 57395200.0, "progress": 0.4977664893475307, "epoch": 44.79915576970059, "img/sec/core": 688.7247626284382, "core_hours_NVIDIA A100-SXM4-40GB": 22.354464024697766, "core_hours": 22.354464024697766} {"step": 56100, "global_schedule": 0.5793110132217407, "l2_grads": 1.520082712173462, "l2_params": 301.7806701660156, "l2_updates": 0.6080060005187988, "train/loss": 2.176640510559082, "uptime": 10408.447996943001, "examples_seen": 57446400.0, "progress": 0.4982105272506061, "epoch": 44.83911933416955, "img/sec/core": 645.0418132330778, "core_hours_NVIDIA A100-SXM4-40GB": 22.37651255229776, "core_hours": 22.37651255229776} {"step": 56150, "global_schedule": 0.578555166721344, "l2_grads": 1.446927547454834, "l2_params": 301.68914794921875, "l2_updates": 0.6179660558700562, "train/loss": 2.537313222885132, "uptime": 10417.768474416001, "examples_seen": 57497600.0, "progress": 0.4986545651536815, "epoch": 44.87908289863851, "img/sec/core": 686.6601006804295, "core_hours_NVIDIA A100-SXM4-40GB": 22.397224724459985, "core_hours": 22.397224724459985} {"step": 56200, "global_schedule": 0.5777990818023682, "l2_grads": 1.5127285718917847, "l2_params": 301.6171875, "l2_updates": 0.6083469986915588, "train/loss": 2.686537504196167, "uptime": 10426.609120989002, "examples_seen": 57548800.0, "progress": 0.4990986030567569, "epoch": 44.91904646310746, "img/sec/core": 723.9289510278335, "core_hours_NVIDIA A100-SXM4-40GB": 22.41687060573332, "core_hours": 22.41687060573332} {"step": 56250, "global_schedule": 0.577042818069458, "l2_grads": 1.6443532705307007, "l2_params": 301.5328369140625, "l2_updates": 0.6048460006713867, "train/loss": 2.1367456912994385, "uptime": 10435.886326758, "examples_seen": 57600000.0, "progress": 0.4995426409598323, "epoch": 44.95901002757642, "img/sec/core": 689.8628918404569, "core_hours_NVIDIA A100-SXM4-40GB": 22.437486618553315, "core_hours": 22.437486618553315} {"step": 56300, "global_schedule": 0.5762864351272583, "l2_grads": 1.6394308805465698, "l2_params": 301.4425354003906, "l2_updates": 0.5995638370513916, "train/loss": 2.3343844413757324, "uptime": 10444.861950641001, "examples_seen": 57651200.0, "progress": 0.49998667886290776, "epoch": 44.998973592045374, "img/sec/core": 713.0423559882817, "core_hours_NVIDIA A100-SXM4-40GB": 22.45743244940443, "core_hours": 22.45743244940443} {"step": 56350, "global_schedule": 0.5755298733711243, "l2_grads": 1.548143744468689, "l2_params": 301.3521728515625, "l2_updates": 0.6195613741874695, "train/loss": 2.1665146350860596, "uptime": 10454.931263559001, "examples_seen": 57702400.0, "progress": 0.5004307167659832, "epoch": 45.038937156514336, "img/sec/core": 635.5945089917057, "core_hours_NVIDIA A100-SXM4-40GB": 22.47980870033332, "core_hours": 22.47980870033332} {"step": 56400, "global_schedule": 0.5747730731964111, "l2_grads": 1.5999261140823364, "l2_params": 301.2726745605469, "l2_updates": 0.6131128668785095, "train/loss": 2.2096593379974365, "uptime": 10464.486067443, "examples_seen": 57753600.0, "progress": 0.5008747546690585, "epoch": 45.07890072098329, "img/sec/core": 669.8201321241042, "core_hours_NVIDIA A100-SXM4-40GB": 22.501041597853316, "core_hours": 22.501041597853316} {"step": 56450, "global_schedule": 0.5740161538124084, "l2_grads": 1.4433337450027466, "l2_params": 301.2100524902344, "l2_updates": 0.6170706748962402, "train/loss": 3.6140406131744385, "uptime": 10474.004953863, "examples_seen": 57804800.0, "progress": 0.501318792572134, "epoch": 45.11886428545225, "img/sec/core": 672.3475538644623, "core_hours_NVIDIA A100-SXM4-40GB": 22.522194678786647, "core_hours": 22.522194678786647} {"step": 56500, "global_schedule": 0.5732589960098267, "l2_grads": 1.5605039596557617, "l2_params": 301.123779296875, "l2_updates": 0.6134424209594727, "train/loss": 2.1025397777557373, "uptime": 10482.896470796002, "examples_seen": 57856000.0, "progress": 0.5017628304752093, "epoch": 45.1588278499212, "img/sec/core": 719.7871913446918, "core_hours_NVIDIA A100-SXM4-40GB": 22.541953605304432, "core_hours": 22.541953605304432} {"step": 56550, "global_schedule": 0.5725016593933105, "l2_grads": 1.396654725074768, "l2_params": 301.0453186035156, "l2_updates": 0.5973944664001465, "train/loss": 4.497744560241699, "uptime": 10491.540626446002, "examples_seen": 57907200.0, "progress": 0.5022068683782848, "epoch": 45.198791414390165, "img/sec/core": 740.3846320143956, "core_hours_NVIDIA A100-SXM4-40GB": 22.561162840082208, "core_hours": 22.561162840082208} {"step": 56600, "global_schedule": 0.5717442035675049, "l2_grads": 1.539355993270874, "l2_params": 300.9612121582031, "l2_updates": 0.5967110991477966, "train/loss": 2.0760412216186523, "uptime": 10500.245344427001, "examples_seen": 57958400.0, "progress": 0.5026509062813602, "epoch": 45.23875497885912, "img/sec/core": 735.2334692484758, "core_hours_NVIDIA A100-SXM4-40GB": 22.58050665781776, "core_hours": 22.58050665781776} {"step": 56650, "global_schedule": 0.5709865689277649, "l2_grads": 1.441484808921814, "l2_params": 300.8730163574219, "l2_updates": 0.6032845377922058, "train/loss": 2.5200185775756836, "uptime": 10509.038383037, "examples_seen": 58009600.0, "progress": 0.5030949441844356, "epoch": 45.278718543328075, "img/sec/core": 727.8485042386882, "core_hours_NVIDIA A100-SXM4-40GB": 22.60004674361776, "core_hours": 22.60004674361776} {"step": 56700, "global_schedule": 0.5702288150787354, "l2_grads": 1.4555199146270752, "l2_params": 300.7848205566406, "l2_updates": 0.6058158278465271, "train/loss": 2.9425365924835205, "uptime": 10517.639096134002, "examples_seen": 58060800.0, "progress": 0.503538982087511, "epoch": 45.31868210779703, "img/sec/core": 744.1243450185809, "core_hours_NVIDIA A100-SXM4-40GB": 22.619159439388874, "core_hours": 22.619159439388874} {"step": 56750, "global_schedule": 0.5694708228111267, "l2_grads": 1.6779210567474365, "l2_params": 300.69647216796875, "l2_updates": 0.5986951589584351, "train/loss": 2.130650281906128, "uptime": 10526.389760553002, "examples_seen": 58112000.0, "progress": 0.5039830199905864, "epoch": 45.358645672265986, "img/sec/core": 731.3730356410487, "core_hours_NVIDIA A100-SXM4-40GB": 22.63860536031999, "core_hours": 22.63860536031999} {"step": 56800, "global_schedule": 0.5687127113342285, "l2_grads": 1.612148642539978, "l2_params": 300.6031799316406, "l2_updates": 0.5935470461845398, "train/loss": 2.2217297554016113, "uptime": 10535.145618303, "examples_seen": 58163200.0, "progress": 0.5044270578936618, "epoch": 45.39860923673495, "img/sec/core": 730.9392389341943, "core_hours_NVIDIA A100-SXM4-40GB": 22.65806282198665, "core_hours": 22.65806282198665} {"step": 56850, "global_schedule": 0.5679543614387512, "l2_grads": 1.4766030311584473, "l2_params": 300.52947998046875, "l2_updates": 0.5960376858711243, "train/loss": 2.9417059421539307, "uptime": 10544.877006949, "examples_seen": 58214400.0, "progress": 0.5048710957967372, "epoch": 45.438572801203904, "img/sec/core": 657.6656459641932, "core_hours_NVIDIA A100-SXM4-40GB": 22.679688130088874, "core_hours": 22.679688130088874} {"step": 56900, "global_schedule": 0.5671959519386292, "l2_grads": 1.664641261100769, "l2_params": 300.4326171875, "l2_updates": 0.5961818099021912, "train/loss": 2.331864833831787, "uptime": 10553.696405272001, "examples_seen": 58265600.0, "progress": 0.5053151336998126, "epoch": 45.47853636567286, "img/sec/core": 725.6730862590287, "core_hours_NVIDIA A100-SXM4-40GB": 22.699286793028875, "core_hours": 22.699286793028875} {"step": 56950, "global_schedule": 0.566437304019928, "l2_grads": 1.3749382495880127, "l2_params": 300.33514404296875, "l2_updates": 0.5949767231941223, "train/loss": 4.216611385345459, "uptime": 10562.483462720002, "examples_seen": 58316800.0, "progress": 0.505759171602888, "epoch": 45.518499930141815, "img/sec/core": 728.3439351425308, "core_hours_NVIDIA A100-SXM4-40GB": 22.718813587357765, "core_hours": 22.718813587357765} {"step": 57000, "global_schedule": 0.565678596496582, "l2_grads": 1.4359817504882812, "l2_params": 300.265625, "l2_updates": 0.5994187593460083, "train/loss": 4.355073928833008, "uptime": 10571.250750663, "examples_seen": 58368000.0, "progress": 0.5062032095059634, "epoch": 45.55846349461077, "img/sec/core": 729.9862901286884, "core_hours_NVIDIA A100-SXM4-40GB": 22.73829644945332, "core_hours": 22.73829644945332} {"step": 57050, "global_schedule": 0.5649197101593018, "l2_grads": 1.4457124471664429, "l2_params": 300.1805114746094, "l2_updates": 0.5911545157432556, "train/loss": 4.5685834884643555, "uptime": 10580.466421675, "examples_seen": 58419200.0, "progress": 0.5066472474090389, "epoch": 45.59842705907973, "img/sec/core": 750.6772903453218, "core_hours_NVIDIA A100-SXM4-40GB": 22.757242303291097, "core_hours": 22.757242303291097} {"step": 57100, "global_schedule": 0.5641605854034424, "l2_grads": 1.578940510749817, "l2_params": 300.10418701171875, "l2_updates": 0.5948674082756042, "train/loss": 2.4699764251708984, "uptime": 10589.565018604999, "examples_seen": 58470400.0, "progress": 0.5070912853121142, "epoch": 45.63839062354869, "img/sec/core": 703.4051567774296, "core_hours_NVIDIA A100-SXM4-40GB": 22.77746140757998, "core_hours": 22.77746140757998} {"step": 57150, "global_schedule": 0.5634013414382935, "l2_grads": 1.4147109985351562, "l2_params": 300.0318603515625, "l2_updates": 0.5833374261856079, "train/loss": 3.9772567749023438, "uptime": 10598.630461496, "examples_seen": 58521600.0, "progress": 0.5075353232151897, "epoch": 45.67835418801764, "img/sec/core": 705.9776424549949, "core_hours_NVIDIA A100-SXM4-40GB": 22.79760683622665, "core_hours": 22.79760683622665} {"step": 57200, "global_schedule": 0.5626420378684998, "l2_grads": 1.686728596687317, "l2_params": 299.9146728515625, "l2_updates": 0.5993010401725769, "train/loss": 2.1815614700317383, "uptime": 10608.275659208002, "examples_seen": 58572800.0, "progress": 0.507979361118265, "epoch": 45.7183177524866, "img/sec/core": 663.5426448580276, "core_hours_NVIDIA A100-SXM4-40GB": 22.819040608919988, "core_hours": 22.819040608919988} {"step": 57250, "global_schedule": 0.561882495880127, "l2_grads": 1.5727112293243408, "l2_params": 299.8554992675781, "l2_updates": 0.5991101264953613, "train/loss": 2.315150499343872, "uptime": 10617.456440786, "examples_seen": 58624000.0, "progress": 0.5084233990213405, "epoch": 45.758281316955554, "img/sec/core": 697.1084047286446, "core_hours_NVIDIA A100-SXM4-40GB": 22.839442345759984, "core_hours": 22.839442345759984} {"step": 57300, "global_schedule": 0.5611228346824646, "l2_grads": 1.4280571937561035, "l2_params": 299.7751159667969, "l2_updates": 0.5908946394920349, "train/loss": 4.598111152648926, "uptime": 10627.185561532, "examples_seen": 58675200.0, "progress": 0.5088674369244158, "epoch": 45.798244881424516, "img/sec/core": 657.8189506622274, "core_hours_NVIDIA A100-SXM4-40GB": 22.861062614084425, "core_hours": 22.861062614084425} {"step": 57350, "global_schedule": 0.5603629946708679, "l2_grads": 1.6032079458236694, "l2_params": 299.6780700683594, "l2_updates": 0.5935912728309631, "train/loss": 2.305251121520996, "uptime": 10637.051629889002, "examples_seen": 58726400.0, "progress": 0.5093114748274913, "epoch": 45.83820844589347, "img/sec/core": 648.6879847592191, "core_hours_NVIDIA A100-SXM4-40GB": 22.88298721043332, "core_hours": 22.88298721043332} {"step": 57400, "global_schedule": 0.5596030950546265, "l2_grads": 1.6753839254379272, "l2_params": 299.5937805175781, "l2_updates": 0.5956265330314636, "train/loss": 2.2700705528259277, "uptime": 10646.914535652, "examples_seen": 58777600.0, "progress": 0.5097555127305666, "epoch": 45.87817201036243, "img/sec/core": 648.8959900651175, "core_hours_NVIDIA A100-SXM4-40GB": 22.904904778795537, "core_hours": 22.904904778795537} {"step": 57450, "global_schedule": 0.5588430166244507, "l2_grads": 1.4757835865020752, "l2_params": 299.5068054199219, "l2_updates": 0.5914632081985474, "train/loss": 2.4751217365264893, "uptime": 10656.746574638002, "examples_seen": 58828800.0, "progress": 0.5101995506336421, "epoch": 45.91813557483138, "img/sec/core": 650.9331390072651, "core_hours_NVIDIA A100-SXM4-40GB": 22.926753754319986, "core_hours": 22.926753754319986} {"step": 57500, "global_schedule": 0.5580827593803406, "l2_grads": 1.5756462812423706, "l2_params": 299.4075927734375, "l2_updates": 0.5836994051933289, "train/loss": 2.2108681201934814, "uptime": 10666.544715529, "examples_seen": 58880000.0, "progress": 0.5106435885367175, "epoch": 45.958099139300344, "img/sec/core": 653.185136976327, "core_hours_NVIDIA A100-SXM4-40GB": 22.948527400744428, "core_hours": 22.948527400744428, "val/acc@1": 0.6718, "val/loss": 1.3726512329101563, "z/secs/eval/val": 2.675586571000167} {"step": 57550, "global_schedule": 0.5573223829269409, "l2_grads": 1.55401611328125, "l2_params": 299.3213806152344, "l2_updates": 0.5998737215995789, "train/loss": 2.7669382095336914, "uptime": 10678.617848303, "examples_seen": 58931200.0, "progress": 0.5110876264397929, "epoch": 45.9980627037693, "img/sec/core": 681.0824391273145, "core_hours_NVIDIA A100-SXM4-40GB": 22.969409193322203, "core_hours": 22.969409193322203} {"step": 57600, "global_schedule": 0.5565619468688965, "l2_grads": 1.6959872245788574, "l2_params": 299.24932861328125, "l2_updates": 0.585313618183136, "train/loss": 2.103163242340088, "uptime": 10689.248119693, "examples_seen": 58982400.0, "progress": 0.5115316643428683, "epoch": 46.038026268238255, "img/sec/core": 602.0542435088056, "core_hours_NVIDIA A100-SXM4-40GB": 22.993032018633315, "core_hours": 22.993032018633315} {"step": 57650, "global_schedule": 0.5558013319969177, "l2_grads": 1.4393796920776367, "l2_params": 299.15155029296875, "l2_updates": 0.5841436982154846, "train/loss": 3.7557830810546875, "uptime": 10699.132676064002, "examples_seen": 59033600.0, "progress": 0.5119757022459437, "epoch": 46.07798983270721, "img/sec/core": 647.4746827055885, "core_hours_NVIDIA A100-SXM4-40GB": 23.014997699457766, "core_hours": 23.014997699457766} {"step": 57700, "global_schedule": 0.5550405383110046, "l2_grads": 1.575676679611206, "l2_params": 299.0570373535156, "l2_updates": 0.586364209651947, "train/loss": 2.165043354034424, "uptime": 10708.940016417999, "examples_seen": 59084800.0, "progress": 0.5124197401490191, "epoch": 46.117953397176166, "img/sec/core": 652.5724374796436, "core_hours_NVIDIA A100-SXM4-40GB": 23.03679178913331, "core_hours": 23.03679178913331} {"step": 57750, "global_schedule": 0.554279625415802, "l2_grads": 1.471960425376892, "l2_params": 298.9586181640625, "l2_updates": 0.5816581845283508, "train/loss": 3.746616840362549, "uptime": 10718.878856481, "examples_seen": 59136000.0, "progress": 0.5128637780520945, "epoch": 46.15791696164513, "img/sec/core": 643.9383227248833, "core_hours_NVIDIA A100-SXM4-40GB": 23.05887810038443, "core_hours": 23.05887810038443} {"step": 57800, "global_schedule": 0.5535186529159546, "l2_grads": 1.580340027809143, "l2_params": 298.8755798339844, "l2_updates": 0.5815961360931396, "train/loss": 2.236917495727539, "uptime": 10727.943298103999, "examples_seen": 59187200.0, "progress": 0.5133078159551699, "epoch": 46.19788052611408, "img/sec/core": 706.0556255072048, "core_hours_NVIDIA A100-SXM4-40GB": 23.07902130399109, "core_hours": 23.07902130399109} {"step": 57850, "global_schedule": 0.5527575016021729, "l2_grads": 1.609938383102417, "l2_params": 298.795166015625, "l2_updates": 0.5853175520896912, "train/loss": 2.353127956390381, "uptime": 10736.636903232002, "examples_seen": 59238400.0, "progress": 0.5137518538582453, "epoch": 46.23784409058304, "img/sec/core": 736.1733027631057, "core_hours_NVIDIA A100-SXM4-40GB": 23.098340426497764, "core_hours": 23.098340426497764} {"step": 57900, "global_schedule": 0.5519962906837463, "l2_grads": 1.4262399673461914, "l2_params": 298.7156066894531, "l2_updates": 0.5804643034934998, "train/loss": 3.3630547523498535, "uptime": 10745.352113973999, "examples_seen": 59289600.0, "progress": 0.5141958917613207, "epoch": 46.277807655051994, "img/sec/core": 734.3482779090558, "core_hours_NVIDIA A100-SXM4-40GB": 23.11770756147998, "core_hours": 23.11770756147998} {"step": 57950, "global_schedule": 0.5512348413467407, "l2_grads": 1.6577104330062866, "l2_params": 298.643310546875, "l2_updates": 0.5907861590385437, "train/loss": 2.3458948135375977, "uptime": 10754.716590177, "examples_seen": 59340800.0, "progress": 0.5146399296643962, "epoch": 46.31777121952095, "img/sec/core": 683.4338473676238, "core_hours_NVIDIA A100-SXM4-40GB": 23.13851750859776, "core_hours": 23.13851750859776} {"step": 58000, "global_schedule": 0.5504733920097351, "l2_grads": 1.4610222578048706, "l2_params": 298.5628662109375, "l2_updates": 0.5842603445053101, "train/loss": 4.35924768447876, "uptime": 10764.073999372, "examples_seen": 59392000.0, "progress": 0.5150839675674715, "epoch": 46.35773478398991, "img/sec/core": 683.9499979780833, "core_hours_NVIDIA A100-SXM4-40GB": 23.159311751253316, "core_hours": 23.159311751253316} {"step": 58050, "global_schedule": 0.5497117042541504, "l2_grads": 1.6364952325820923, "l2_params": 298.4776916503906, "l2_updates": 0.5801110863685608, "train/loss": 2.1751556396484375, "uptime": 10773.630271856002, "examples_seen": 59443200.0, "progress": 0.515528005470547, "epoch": 46.39769834845887, "img/sec/core": 746.6127968984657, "core_hours_NVIDIA A100-SXM4-40GB": 23.17836074462887, "core_hours": 23.17836074462887} {"step": 58100, "global_schedule": 0.5489499568939209, "l2_grads": 1.6193969249725342, "l2_params": 298.39849853515625, "l2_updates": 0.5926863551139832, "train/loss": 2.192812204360962, "uptime": 10782.758435572001, "examples_seen": 59494400.0, "progress": 0.5159720433736223, "epoch": 46.43766191292782, "img/sec/core": 701.1267763288029, "core_hours_NVIDIA A100-SXM4-40GB": 23.198645552886646, "core_hours": 23.198645552886646} {"step": 58150, "global_schedule": 0.5481881499290466, "l2_grads": 1.569339394569397, "l2_params": 298.3128662109375, "l2_updates": 0.5863422751426697, "train/loss": 2.5671894550323486, "uptime": 10792.747362979999, "examples_seen": 59545600.0, "progress": 0.5164160812766978, "epoch": 46.47762547739678, "img/sec/core": 640.709431412597, "core_hours_NVIDIA A100-SXM4-40GB": 23.220843169348864, "core_hours": 23.220843169348864} {"step": 58200, "global_schedule": 0.5474262237548828, "l2_grads": 1.6461207866668701, "l2_params": 298.2202453613281, "l2_updates": 0.5672675371170044, "train/loss": 1.9781520366668701, "uptime": 10802.560426074002, "examples_seen": 59596800.0, "progress": 0.5168601191797731, "epoch": 46.51758904186573, "img/sec/core": 652.1918730871193, "core_hours_NVIDIA A100-SXM4-40GB": 23.242649976224424, "core_hours": 23.242649976224424} {"step": 58250, "global_schedule": 0.5466641783714294, "l2_grads": 1.5568629503250122, "l2_params": 298.1272277832031, "l2_updates": 0.5795556902885437, "train/loss": 2.944570779800415, "uptime": 10812.551205991002, "examples_seen": 59648000.0, "progress": 0.5173041570828486, "epoch": 46.557552606334696, "img/sec/core": 640.590629877675, "core_hours_NVIDIA A100-SXM4-40GB": 23.264851709373314, "core_hours": 23.264851709373314} {"step": 58300, "global_schedule": 0.5459019541740417, "l2_grads": 1.4166007041931152, "l2_params": 298.0451354980469, "l2_updates": 0.5753706097602844, "train/loss": 4.552915096282959, "uptime": 10822.15108433, "examples_seen": 59699200.0, "progress": 0.517748194985924, "epoch": 46.59751617080365, "img/sec/core": 666.6751154543857, "core_hours_NVIDIA A100-SXM4-40GB": 23.286184772348864, "core_hours": 23.286184772348864} {"step": 58350, "global_schedule": 0.5451396107673645, "l2_grads": 1.6042958498001099, "l2_params": 297.96234130859375, "l2_updates": 0.5785541534423828, "train/loss": 2.1627519130706787, "uptime": 10831.690760528001, "examples_seen": 59750400.0, "progress": 0.5181922328889994, "epoch": 46.637479735272606, "img/sec/core": 670.8823095422379, "core_hours_NVIDIA A100-SXM4-40GB": 23.307384052788866, "core_hours": 23.307384052788866} {"step": 58400, "global_schedule": 0.5443772673606873, "l2_grads": 1.6361188888549805, "l2_params": 297.8718566894531, "l2_updates": 0.5736405253410339, "train/loss": 2.0735585689544678, "uptime": 10841.494555108, "examples_seen": 59801600.0, "progress": 0.5186362707920749, "epoch": 46.67744329974156, "img/sec/core": 652.8084557235579, "core_hours_NVIDIA A100-SXM4-40GB": 23.329170262966645, "core_hours": 23.329170262966645} {"step": 58450, "global_schedule": 0.5436147451400757, "l2_grads": 1.6171793937683105, "l2_params": 297.77911376953125, "l2_updates": 0.5800387263298035, "train/loss": 2.2028145790100098, "uptime": 10851.386777208, "examples_seen": 59852800.0, "progress": 0.5190803086951502, "epoch": 46.717406864210524, "img/sec/core": 646.9729384665175, "core_hours_NVIDIA A100-SXM4-40GB": 23.35115297874442, "core_hours": 23.35115297874442} {"step": 58500, "global_schedule": 0.5428521633148193, "l2_grads": 1.527069330215454, "l2_params": 297.6935729980469, "l2_updates": 0.5693304538726807, "train/loss": 2.212860107421875, "uptime": 10860.525890952, "examples_seen": 59904000.0, "progress": 0.5195243465982257, "epoch": 46.75737042867948, "img/sec/core": 700.2867213685104, "core_hours_NVIDIA A100-SXM4-40GB": 23.371462120397755, "core_hours": 23.371462120397755} {"step": 58550, "global_schedule": 0.5420894026756287, "l2_grads": 1.6340601444244385, "l2_params": 297.6231689453125, "l2_updates": 0.5679994821548462, "train/loss": 2.0113275051116943, "uptime": 10869.321746223, "examples_seen": 59955200.0, "progress": 0.519968384501301, "epoch": 46.797333993148435, "img/sec/core": 727.6154282688572, "core_hours_NVIDIA A100-SXM4-40GB": 23.391008465444422, "core_hours": 23.391008465444422} {"step": 58600, "global_schedule": 0.541326642036438, "l2_grads": 1.4670326709747314, "l2_params": 297.5242614746094, "l2_updates": 0.5814837217330933, "train/loss": 3.7224535942077637, "uptime": 10878.753688170002, "examples_seen": 60006400.0, "progress": 0.5204124224043765, "epoch": 46.83729755761739, "img/sec/core": 678.545312933657, "core_hours_NVIDIA A100-SXM4-40GB": 23.41196833643776, "core_hours": 23.41196833643776} {"step": 58650, "global_schedule": 0.540563702583313, "l2_grads": 1.638258457183838, "l2_params": 297.4429931640625, "l2_updates": 0.5680322051048279, "train/loss": 4.636116981506348, "uptime": 10888.587107813999, "examples_seen": 60057600.0, "progress": 0.5208564603074518, "epoch": 46.877261122086345, "img/sec/core": 650.8417449576442, "core_hours_NVIDIA A100-SXM4-40GB": 23.433820380091085, "core_hours": 23.433820380091085} {"step": 58700, "global_schedule": 0.5398006439208984, "l2_grads": 1.469749927520752, "l2_params": 297.3546447753906, "l2_updates": 0.5722917914390564, "train/loss": 4.56931209564209, "uptime": 10898.003188429999, "examples_seen": 60108800.0, "progress": 0.5213004982105273, "epoch": 46.91722468655531, "img/sec/core": 679.688318420417, "core_hours_NVIDIA A100-SXM4-40GB": 23.454745003682195, "core_hours": 23.454745003682195} {"step": 58750, "global_schedule": 0.5390375852584839, "l2_grads": 1.569490909576416, "l2_params": 297.26641845703125, "l2_updates": 0.5664621591567993, "train/loss": 4.587088584899902, "uptime": 10906.788104915, "examples_seen": 60160000.0, "progress": 0.5217445361136026, "epoch": 46.95718825102426, "img/sec/core": 728.5214390969876, "core_hours_NVIDIA A100-SXM4-40GB": 23.47426704031553, "core_hours": 23.47426704031553} {"step": 58800, "global_schedule": 0.5382744669914246, "l2_grads": 1.7866648435592651, "l2_params": 297.1779479980469, "l2_updates": 0.5688063502311707, "train/loss": 2.2064051628112793, "uptime": 10915.471593803, "examples_seen": 60211200.0, "progress": 0.5221885740166781, "epoch": 46.99715181549322, "img/sec/core": 737.0309425793315, "core_hours_NVIDIA A100-SXM4-40GB": 23.493563682288865, "core_hours": 23.493563682288865} {"step": 58850, "global_schedule": 0.5375111699104309, "l2_grads": 1.5692319869995117, "l2_params": 297.1068420410156, "l2_updates": 0.5770341753959656, "train/loss": 2.1104817390441895, "uptime": 10925.172833413, "examples_seen": 60262400.0, "progress": 0.5226326119197535, "epoch": 47.037115379962174, "img/sec/core": 659.7095069585715, "core_hours_NVIDIA A100-SXM4-40GB": 23.51512199253331, "core_hours": 23.51512199253331} {"step": 58900, "global_schedule": 0.5367478132247925, "l2_grads": 1.4732232093811035, "l2_params": 297.0198059082031, "l2_updates": 0.5642631649971008, "train/loss": 3.8004093170166016, "uptime": 10934.689806029999, "examples_seen": 60313600.0, "progress": 0.5230766498228289, "epoch": 47.07707894443113, "img/sec/core": 672.482758705072, "core_hours_NVIDIA A100-SXM4-40GB": 23.536270820571083, "core_hours": 23.536270820571083} {"step": 58950, "global_schedule": 0.5359843373298645, "l2_grads": 1.4233031272888184, "l2_params": 296.942626953125, "l2_updates": 0.5721193552017212, "train/loss": 4.013753890991211, "uptime": 10944.675649957999, "examples_seen": 60364800.0, "progress": 0.5235206877259043, "epoch": 47.11704250890009, "img/sec/core": 640.9072729501419, "core_hours_NVIDIA A100-SXM4-40GB": 23.55846158485553, "core_hours": 23.55846158485553} {"step": 59000, "global_schedule": 0.5352208614349365, "l2_grads": 1.3842016458511353, "l2_params": 296.86016845703125, "l2_updates": 0.569247305393219, "train/loss": 4.1045427322387695, "uptime": 10953.99573298, "examples_seen": 60416000.0, "progress": 0.5239647256289797, "epoch": 47.15700607336905, "img/sec/core": 686.6891619840741, "core_hours_NVIDIA A100-SXM4-40GB": 23.579172880459975, "core_hours": 23.579172880459975} {"step": 59050, "global_schedule": 0.5344572067260742, "l2_grads": 1.7768328189849854, "l2_params": 296.78668212890625, "l2_updates": 0.5595182776451111, "train/loss": 2.341026544570923, "uptime": 10963.908834263, "examples_seen": 60467200.0, "progress": 0.5244087635320551, "epoch": 47.196969637838, "img/sec/core": 711.8494089685854, "core_hours_NVIDIA A100-SXM4-40GB": 23.599152137368865, "core_hours": 23.599152137368865} {"step": 59100, "global_schedule": 0.5336935520172119, "l2_grads": 1.6462889909744263, "l2_params": 296.6840515136719, "l2_updates": 0.5631344318389893, "train/loss": 2.2587900161743164, "uptime": 10973.461369365, "examples_seen": 60518400.0, "progress": 0.5248528014351305, "epoch": 47.23693320230696, "img/sec/core": 669.9792182558612, "core_hours_NVIDIA A100-SXM4-40GB": 23.620379993151083, "core_hours": 23.620379993151083} {"step": 59150, "global_schedule": 0.5329297184944153, "l2_grads": 1.6045823097229004, "l2_params": 296.590576171875, "l2_updates": 0.5675126314163208, "train/loss": 2.3923561573028564, "uptime": 10982.911831207, "examples_seen": 60569600.0, "progress": 0.5252968393382059, "epoch": 47.27689676677591, "img/sec/core": 677.215580254204, "core_hours_NVIDIA A100-SXM4-40GB": 23.64138101946664, "core_hours": 23.64138101946664} {"step": 59200, "global_schedule": 0.5321659445762634, "l2_grads": 1.485648512840271, "l2_params": 296.498291015625, "l2_updates": 0.5684865117073059, "train/loss": 2.93552827835083, "uptime": 10991.912865659002, "examples_seen": 60620800.0, "progress": 0.5257408772412813, "epoch": 47.316860331244875, "img/sec/core": 711.0293860253907, "core_hours_NVIDIA A100-SXM4-40GB": 23.661383318248866, "core_hours": 23.661383318248866} {"step": 59250, "global_schedule": 0.5314019918441772, "l2_grads": 1.5669784545898438, "l2_params": 296.4069519042969, "l2_updates": 0.5681851506233215, "train/loss": 2.1832518577575684, "uptime": 11001.779367122, "examples_seen": 60672000.0, "progress": 0.5261849151443567, "epoch": 47.35682389571383, "img/sec/core": 648.6595095537397, "core_hours_NVIDIA A100-SXM4-40GB": 23.68330887705553, "core_hours": 23.68330887705553} {"step": 59300, "global_schedule": 0.5306379199028015, "l2_grads": 1.6514384746551514, "l2_params": 296.317626953125, "l2_updates": 0.5703004002571106, "train/loss": 2.194096803665161, "uptime": 11011.594223409002, "examples_seen": 60723200.0, "progress": 0.5266289530474322, "epoch": 47.396787460182786, "img/sec/core": 652.0727163856978, "core_hours_NVIDIA A100-SXM4-40GB": 23.705119668804418, "core_hours": 23.705119668804418} {"step": 59350, "global_schedule": 0.5298739075660706, "l2_grads": 1.5494024753570557, "l2_params": 296.239501953125, "l2_updates": 0.5597413778305054, "train/loss": 2.192133903503418, "uptime": 11020.673237920002, "examples_seen": 60774400.0, "progress": 0.5270729909505075, "epoch": 47.43675102465174, "img/sec/core": 704.9223230390871, "core_hours_NVIDIA A100-SXM4-40GB": 23.725295256606646, "core_hours": 23.725295256606646} {"step": 59400, "global_schedule": 0.5291097164154053, "l2_grads": 1.459877371788025, "l2_params": 296.1606750488281, "l2_updates": 0.5594131946563721, "train/loss": 3.3309836387634277, "uptime": 11029.396615095002, "examples_seen": 60825600.0, "progress": 0.527517028853583, "epoch": 47.476714589120704, "img/sec/core": 733.6608141101235, "core_hours_NVIDIA A100-SXM4-40GB": 23.744680539217754, "core_hours": 23.744680539217754} {"step": 59450, "global_schedule": 0.5283455848693848, "l2_grads": 1.588286280632019, "l2_params": 296.053955078125, "l2_updates": 0.5638666749000549, "train/loss": 2.174464225769043, "uptime": 11038.839051163, "examples_seen": 60876800.0, "progress": 0.5279610667566583, "epoch": 47.51667815358966, "img/sec/core": 677.7911922210666, "core_hours_NVIDIA A100-SXM4-40GB": 23.76566373047997, "core_hours": 23.76566373047997} {"step": 59500, "global_schedule": 0.5275813341140747, "l2_grads": 1.773189663887024, "l2_params": 295.9598693847656, "l2_updates": 0.5629239082336426, "train/loss": 2.238952159881592, "uptime": 11048.532509015002, "examples_seen": 60928000.0, "progress": 0.5284051046597338, "epoch": 47.556641718058614, "img/sec/core": 660.2391115445622, "core_hours_NVIDIA A100-SXM4-40GB": 23.787204747928865, "core_hours": 23.787204747928865} {"step": 59550, "global_schedule": 0.5268169641494751, "l2_grads": 1.561228632926941, "l2_params": 295.85626220703125, "l2_updates": 0.5537832975387573, "train/loss": 4.648093223571777, "uptime": 11058.338102828, "examples_seen": 60979200.0, "progress": 0.5288491425628091, "epoch": 47.59660528252757, "img/sec/core": 652.6886715943891, "core_hours_NVIDIA A100-SXM4-40GB": 23.808994956402195, "core_hours": 23.808994956402195} {"step": 59600, "global_schedule": 0.5260525941848755, "l2_grads": 1.5891636610031128, "l2_params": 295.78350830078125, "l2_updates": 0.5549264550209045, "train/loss": 2.272343158721924, "uptime": 11068.250100506002, "examples_seen": 61030400.0, "progress": 0.5292931804658846, "epoch": 47.636568846996525, "img/sec/core": 645.6821528725399, "core_hours_NVIDIA A100-SXM4-40GB": 23.831021617908863, "core_hours": 23.831021617908863} {"step": 59650, "global_schedule": 0.5252881050109863, "l2_grads": 1.5684410333633423, "l2_params": 295.7117919921875, "l2_updates": 0.5439926385879517, "train/loss": 2.284238338470459, "uptime": 11078.118116735002, "examples_seen": 61081600.0, "progress": 0.5297372183689599, "epoch": 47.67653241146549, "img/sec/core": 648.5599386421385, "core_hours_NVIDIA A100-SXM4-40GB": 23.8529505428622, "core_hours": 23.8529505428622} {"step": 59700, "global_schedule": 0.5245236158370972, "l2_grads": 1.65854012966156, "l2_params": 295.61688232421875, "l2_updates": 0.5642654895782471, "train/loss": 2.2254128456115723, "uptime": 11088.095955632, "examples_seen": 61132800.0, "progress": 0.5301812562720354, "epoch": 47.71649597593444, "img/sec/core": 641.4214607058956, "core_hours_NVIDIA A100-SXM4-40GB": 23.875123518188857, "core_hours": 23.875123518188857} {"step": 59750, "global_schedule": 0.5237589478492737, "l2_grads": 1.4808731079101562, "l2_params": 295.5197448730469, "l2_updates": 0.5559613108634949, "train/loss": 3.1245288848876953, "uptime": 11097.13157692, "examples_seen": 61184000.0, "progress": 0.5306252941751108, "epoch": 47.7564595404034, "img/sec/core": 708.307685327618, "core_hours_NVIDIA A100-SXM4-40GB": 23.895202676606637, "core_hours": 23.895202676606637} {"step": 59800, "global_schedule": 0.5229943990707397, "l2_grads": 1.6394442319869995, "l2_params": 295.4320373535156, "l2_updates": 0.557735025882721, "train/loss": 2.141774892807007, "uptime": 11105.921291790002, "examples_seen": 61235200.0, "progress": 0.5310693320781862, "epoch": 47.79642310487235, "img/sec/core": 728.1237326413702, "core_hours_NVIDIA A100-SXM4-40GB": 23.914735376317754, "core_hours": 23.914735376317754} {"step": 59850, "global_schedule": 0.5222296714782715, "l2_grads": 1.3635926246643066, "l2_params": 295.337646484375, "l2_updates": 0.5550578832626343, "train/loss": 3.5076351165771484, "uptime": 11114.747420943002, "examples_seen": 61286400.0, "progress": 0.5315133699812616, "epoch": 47.83638666934131, "img/sec/core": 725.1196859978871, "core_hours_NVIDIA A100-SXM4-40GB": 23.934348996657757, "core_hours": 23.934348996657757} {"step": 59900, "global_schedule": 0.5214648842811584, "l2_grads": 1.450289011001587, "l2_params": 295.2449645996094, "l2_updates": 0.541169285774231, "train/loss": 3.763767719268799, "uptime": 11123.981423481999, "examples_seen": 61337600.0, "progress": 0.531957407884337, "epoch": 47.87635023381027, "img/sec/core": 693.0905609968962, "core_hours_NVIDIA A100-SXM4-40GB": 23.95486900229997, "core_hours": 23.95486900229997} {"step": 59950, "global_schedule": 0.5207000970840454, "l2_grads": 1.6312766075134277, "l2_params": 295.1590576171875, "l2_updates": 0.5526771545410156, "train/loss": 2.215017557144165, "uptime": 11133.212937180002, "examples_seen": 61388800.0, "progress": 0.5324014457874124, "epoch": 47.916313798279226, "img/sec/core": 693.2774200816382, "core_hours_NVIDIA A100-SXM4-40GB": 23.975383477184423, "core_hours": 23.975383477184423} {"step": 60000, "global_schedule": 0.5199352502822876, "l2_grads": 1.5781383514404297, "l2_params": 295.067138671875, "l2_updates": 0.5471721887588501, "train/loss": 2.1423020362854004, "uptime": 11142.474851481, "examples_seen": 61440000.0, "progress": 0.5328454836904878, "epoch": 47.95627736274818, "img/sec/core": 691.0018590120682, "core_hours_NVIDIA A100-SXM4-40GB": 23.995965508964414, "core_hours": 23.995965508964414, "val/acc@1": 0.67798, "val/loss": 1.3455853540039062, "z/secs/eval/val": 3.024726286999794} {"step": 60050, "global_schedule": 0.5191704034805298, "l2_grads": 1.7068296670913696, "l2_params": 294.9808044433594, "l2_updates": 0.5496967434883118, "train/loss": 2.0674331188201904, "uptime": 11154.543571054002, "examples_seen": 61491200.0, "progress": 0.5332895215935632, "epoch": 47.99624092721714, "img/sec/core": 765.7335373408706, "core_hours_NVIDIA A100-SXM4-40GB": 24.01453883967109, "core_hours": 24.01453883967109} {"step": 60100, "global_schedule": 0.5184054970741272, "l2_grads": 1.670082926750183, "l2_params": 294.87274169921875, "l2_updates": 0.5639182329177856, "train/loss": 2.076134443283081, "uptime": 11164.230362342, "examples_seen": 61542400.0, "progress": 0.5337335594966386, "epoch": 48.03620449168609, "img/sec/core": 660.6934958875679, "core_hours_NVIDIA A100-SXM4-40GB": 24.036065042533306, "core_hours": 24.036065042533306} {"step": 60150, "global_schedule": 0.5176404714584351, "l2_grads": 1.571462631225586, "l2_params": 294.7975769042969, "l2_updates": 0.5514849424362183, "train/loss": 2.089076042175293, "uptime": 11173.884051027, "examples_seen": 61593600.0, "progress": 0.534177597399714, "epoch": 48.076168056155055, "img/sec/core": 662.9590210365748, "core_hours_NVIDIA A100-SXM4-40GB": 24.05751768405553, "core_hours": 24.05751768405553} {"step": 60200, "global_schedule": 0.5168755054473877, "l2_grads": 1.784474492073059, "l2_params": 294.709716796875, "l2_updates": 0.5353713631629944, "train/loss": 2.2623164653778076, "uptime": 11182.949970271, "examples_seen": 61644800.0, "progress": 0.5346216353027895, "epoch": 48.11613162062401, "img/sec/core": 705.9405480846053, "core_hours_NVIDIA A100-SXM4-40GB": 24.077664171264416, "core_hours": 24.077664171264416} {"step": 60250, "global_schedule": 0.5161104202270508, "l2_grads": 1.4677491188049316, "l2_params": 294.622314453125, "l2_updates": 0.5408992171287537, "train/loss": 3.143773078918457, "uptime": 11192.831038153001, "examples_seen": 61696000.0, "progress": 0.5350656732058648, "epoch": 48.156095185092965, "img/sec/core": 647.7032721997643, "core_hours_NVIDIA A100-SXM4-40GB": 24.099622099891086, "core_hours": 24.099622099891086} {"step": 60300, "global_schedule": 0.5153453350067139, "l2_grads": 1.8048558235168457, "l2_params": 294.53192138671875, "l2_updates": 0.5269392132759094, "train/loss": 2.093621015548706, "uptime": 11202.561577213999, "examples_seen": 61747200.0, "progress": 0.5355097111089403, "epoch": 48.19605874956192, "img/sec/core": 657.7230675382037, "core_hours_NVIDIA A100-SXM4-40GB": 24.12124552002664, "core_hours": 24.12124552002664} {"step": 60350, "global_schedule": 0.5145801901817322, "l2_grads": 1.6785085201263428, "l2_params": 294.4440002441406, "l2_updates": 0.5457051992416382, "train/loss": 4.67310094833374, "uptime": 11211.721010694999, "examples_seen": 61798400.0, "progress": 0.5359537490120156, "epoch": 48.236022314030876, "img/sec/core": 698.7331709189355, "core_hours_NVIDIA A100-SXM4-40GB": 24.14159981665108, "core_hours": 24.14159981665108} {"step": 60400, "global_schedule": 0.5138149857521057, "l2_grads": 1.508156180381775, "l2_params": 294.36566162109375, "l2_updates": 0.5418408513069153, "train/loss": 4.160609245300293, "uptime": 11221.057496305, "examples_seen": 61849600.0, "progress": 0.5363977869150911, "epoch": 48.27598587849984, "img/sec/core": 685.4827680711159, "core_hours_NVIDIA A100-SXM4-40GB": 24.162347562451085, "core_hours": 24.162347562451085} {"step": 60450, "global_schedule": 0.513049840927124, "l2_grads": 1.7231625318527222, "l2_params": 294.2826843261719, "l2_updates": 0.5466393828392029, "train/loss": 2.146012306213379, "uptime": 11230.826122498, "examples_seen": 61900800.0, "progress": 0.5368418248181664, "epoch": 48.315949442968794, "img/sec/core": 655.1586552248798, "core_hours_NVIDIA A100-SXM4-40GB": 24.18405562065775, "core_hours": 24.18405562065775} {"step": 60500, "global_schedule": 0.5122845768928528, "l2_grads": 1.412792444229126, "l2_params": 294.20050048828125, "l2_updates": 0.5456413626670837, "train/loss": 3.1798582077026367, "uptime": 11240.543299485, "examples_seen": 61952000.0, "progress": 0.5372858627212419, "epoch": 48.35591300743775, "img/sec/core": 658.627501440189, "core_hours_NVIDIA A100-SXM4-40GB": 24.20564934729553, "core_hours": 24.20564934729553} {"step": 60550, "global_schedule": 0.5115193724632263, "l2_grads": 1.6844221353530884, "l2_params": 294.1084289550781, "l2_updates": 0.5427906513214111, "train/loss": 2.424774408340454, "uptime": 11250.472482449999, "examples_seen": 62003200.0, "progress": 0.5377299006243172, "epoch": 48.395876571906705, "img/sec/core": 644.5646154935686, "core_hours_NVIDIA A100-SXM4-40GB": 24.227714198328858, "core_hours": 24.227714198328858} {"step": 60600, "global_schedule": 0.5107540488243103, "l2_grads": 1.6283880472183228, "l2_params": 294.0263671875, "l2_updates": 0.5381343364715576, "train/loss": 2.0416808128356934, "uptime": 11259.424381122002, "examples_seen": 62054400.0, "progress": 0.5381739385273927, "epoch": 48.43584013637567, "img/sec/core": 714.9321316622858, "core_hours_NVIDIA A100-SXM4-40GB": 24.247607306488867, "core_hours": 24.247607306488867} {"step": 60650, "global_schedule": 0.5099887251853943, "l2_grads": 1.4377628564834595, "l2_params": 293.9279479980469, "l2_updates": 0.5392786264419556, "train/loss": 4.563318252563477, "uptime": 11267.949721161001, "examples_seen": 62105600.0, "progress": 0.5386179764304682, "epoch": 48.47580370084462, "img/sec/core": 750.7031943269266, "core_hours_NVIDIA A100-SXM4-40GB": 24.266552506575533, "core_hours": 24.266552506575533} {"step": 60700, "global_schedule": 0.509223461151123, "l2_grads": 1.644106149673462, "l2_params": 293.85565185546875, "l2_updates": 0.5408337116241455, "train/loss": 2.1676721572875977, "uptime": 11276.806222392, "examples_seen": 62156800.0, "progress": 0.5390620143335435, "epoch": 48.51576726531358, "img/sec/core": 722.6329938959424, "core_hours_NVIDIA A100-SXM4-40GB": 24.286233620422195, "core_hours": 24.286233620422195} {"step": 60750, "global_schedule": 0.5084580779075623, "l2_grads": 1.547994613647461, "l2_params": 293.7611389160156, "l2_updates": 0.538081705570221, "train/loss": 4.556400299072266, "uptime": 11285.806409511, "examples_seen": 62208000.0, "progress": 0.539506052236619, "epoch": 48.55573082978253, "img/sec/core": 711.0963267074025, "core_hours_NVIDIA A100-SXM4-40GB": 24.306234036242195, "core_hours": 24.306234036242195} {"step": 60800, "global_schedule": 0.5076927542686462, "l2_grads": 1.6008884906768799, "l2_params": 293.67657470703125, "l2_updates": 0.533514142036438, "train/loss": 3.727517604827881, "uptime": 11295.400001388001, "examples_seen": 62259200.0, "progress": 0.5399500901396943, "epoch": 48.59569439425149, "img/sec/core": 667.1119724555822, "core_hours_NVIDIA A100-SXM4-40GB": 24.3275531293022, "core_hours": 24.3275531293022} {"step": 60850, "global_schedule": 0.5069273114204407, "l2_grads": 1.6661053895950317, "l2_params": 293.5828857421875, "l2_updates": 0.5419501066207886, "train/loss": 2.272733688354492, "uptime": 11304.333625785, "examples_seen": 62310400.0, "progress": 0.5403941280427698, "epoch": 48.63565795872045, "img/sec/core": 716.3945690564002, "core_hours_NVIDIA A100-SXM4-40GB": 24.347405627962196, "core_hours": 24.347405627962196} {"step": 60900, "global_schedule": 0.5061619281768799, "l2_grads": 1.7681121826171875, "l2_params": 293.4971618652344, "l2_updates": 0.5319827198982239, "train/loss": 2.1828577518463135, "uptime": 11313.038888529, "examples_seen": 62361600.0, "progress": 0.5408381659458451, "epoch": 48.675621523189406, "img/sec/core": 735.1874593804688, "core_hours_NVIDIA A100-SXM4-40GB": 24.366750656282193, "core_hours": 24.366750656282193} {"step": 60950, "global_schedule": 0.5053964853286743, "l2_grads": 1.6052879095077515, "l2_params": 293.39019775390625, "l2_updates": 0.5282848477363586, "train/loss": 2.4868247509002686, "uptime": 11321.691357131001, "examples_seen": 62412800.0, "progress": 0.5412822038489206, "epoch": 48.71558508765836, "img/sec/core": 739.6732995389478, "core_hours_NVIDIA A100-SXM4-40GB": 24.385978364286643, "core_hours": 24.385978364286643} {"step": 61000, "global_schedule": 0.5046310424804688, "l2_grads": 1.4258862733840942, "l2_params": 293.3011169433594, "l2_updates": 0.5266477465629578, "train/loss": 3.5659196376800537, "uptime": 11330.500459926001, "examples_seen": 62464000.0, "progress": 0.5417262417519959, "epoch": 48.75554865212732, "img/sec/core": 726.521207543744, "core_hours_NVIDIA A100-SXM4-40GB": 24.40555414827553, "core_hours": 24.40555414827553} {"step": 61050, "global_schedule": 0.5038655996322632, "l2_grads": 1.5121040344238281, "l2_params": 293.21160888671875, "l2_updates": 0.5236237645149231, "train/loss": 4.6815338134765625, "uptime": 11339.961303418002, "examples_seen": 62515200.0, "progress": 0.5421702796550714, "epoch": 48.79551221659627, "img/sec/core": 728.7158445812094, "core_hours_NVIDIA A100-SXM4-40GB": 24.42507097685553, "core_hours": 24.42507097685553} {"step": 61100, "global_schedule": 0.5031000971794128, "l2_grads": 1.6391469240188599, "l2_params": 293.1274719238281, "l2_updates": 0.5375751852989197, "train/loss": 2.5049822330474854, "uptime": 11348.641385232002, "examples_seen": 62566400.0, "progress": 0.5426143175581467, "epoch": 48.835475781065234, "img/sec/core": 737.320239272113, "core_hours_NVIDIA A100-SXM4-40GB": 24.444360047553307, "core_hours": 24.444360047553307} {"step": 61150, "global_schedule": 0.5023346543312073, "l2_grads": 1.5884462594985962, "l2_params": 293.0348205566406, "l2_updates": 0.5276637077331543, "train/loss": 2.4497883319854736, "uptime": 11357.429959068, "examples_seen": 62617600.0, "progress": 0.5430583554612222, "epoch": 48.87543934553419, "img/sec/core": 728.2182660610322, "core_hours_NVIDIA A100-SXM4-40GB": 24.463890211633306, "core_hours": 24.463890211633306} {"step": 61200, "global_schedule": 0.5015692114830017, "l2_grads": 1.4464274644851685, "l2_params": 292.94085693359375, "l2_updates": 0.5295217037200928, "train/loss": 3.9596505165100098, "uptime": 11366.173633651999, "examples_seen": 62668800.0, "progress": 0.5435023933642976, "epoch": 48.915402910003145, "img/sec/core": 731.9577070848803, "core_hours_NVIDIA A100-SXM4-40GB": 24.483320599597747, "core_hours": 24.483320599597747} {"step": 61250, "global_schedule": 0.5008037686347961, "l2_grads": 1.5530787706375122, "l2_params": 292.8519592285156, "l2_updates": 0.5243369936943054, "train/loss": 2.6914119720458984, "uptime": 11375.189552408001, "examples_seen": 62720000.0, "progress": 0.543946431267373, "epoch": 48.9553664744721, "img/sec/core": 709.855553627233, "core_hours_NVIDIA A100-SXM4-40GB": 24.503355974611086, "core_hours": 24.503355974611086} {"step": 61300, "global_schedule": 0.5000382661819458, "l2_grads": 1.5589301586151123, "l2_params": 292.7694091796875, "l2_updates": 0.5243014097213745, "train/loss": 2.3926198482513428, "uptime": 11384.921463681001, "examples_seen": 62771200.0, "progress": 0.5443904691704484, "epoch": 48.995330038941056, "img/sec/core": 657.6303277400319, "core_hours_NVIDIA A100-SXM4-40GB": 24.52498244410664, "core_hours": 24.52498244410664} {"step": 61350, "global_schedule": 0.49927279353141785, "l2_grads": 1.6684353351593018, "l2_params": 292.6858215332031, "l2_updates": 0.5347222089767456, "train/loss": 2.166851043701172, "uptime": 11395.485876844, "examples_seen": 62822400.0, "progress": 0.5448345070735238, "epoch": 49.03529360341002, "img/sec/core": 605.8074311609714, "core_hours_NVIDIA A100-SXM4-40GB": 24.548458917802193, "core_hours": 24.548458917802193} {"step": 61400, "global_schedule": 0.4985072910785675, "l2_grads": 1.630683183670044, "l2_params": 292.60345458984375, "l2_updates": 0.536857545375824, "train/loss": 2.095633029937744, "uptime": 11404.784854218002, "examples_seen": 62873600.0, "progress": 0.5452785449765992, "epoch": 49.07525716787897, "img/sec/core": 688.2477225822458, "core_hours_NVIDIA A100-SXM4-40GB": 24.569123311966642, "core_hours": 24.569123311966642} {"step": 61450, "global_schedule": 0.4977419376373291, "l2_grads": 1.6543561220169067, "l2_params": 292.52972412109375, "l2_updates": 0.5265747308731079, "train/loss": 2.0690200328826904, "uptime": 11414.499540117, "examples_seen": 62924800.0, "progress": 0.5457225828796746, "epoch": 49.11522073234793, "img/sec/core": 658.7963899748958, "core_hours_NVIDIA A100-SXM4-40GB": 24.590711502853306, "core_hours": 24.590711502853306} {"step": 61500, "global_schedule": 0.49697643518447876, "l2_grads": 1.6765222549438477, "l2_params": 292.4413146972656, "l2_updates": 0.5245898365974426, "train/loss": 2.098067283630371, "uptime": 11423.141639866999, "examples_seen": 62976000.0, "progress": 0.54616662078275, "epoch": 49.155184296816884, "img/sec/core": 740.5607647609849, "core_hours_NVIDIA A100-SXM4-40GB": 24.60991616896441, "core_hours": 24.60991616896441} {"step": 61550, "global_schedule": 0.4962109327316284, "l2_grads": 1.6133732795715332, "l2_params": 292.3465576171875, "l2_updates": 0.5160700082778931, "train/loss": 2.783623218536377, "uptime": 11432.053019281999, "examples_seen": 63027200.0, "progress": 0.5466106586858254, "epoch": 49.19514786128585, "img/sec/core": 718.1828650710776, "core_hours_NVIDIA A100-SXM4-40GB": 24.62971923433108, "core_hours": 24.62971923433108} {"step": 61600, "global_schedule": 0.49544546008110046, "l2_grads": 1.6757265329360962, "l2_params": 292.2434997558594, "l2_updates": 0.5210773944854736, "train/loss": 2.183758020401001, "uptime": 11440.802577449, "examples_seen": 63078400.0, "progress": 0.5470546965889008, "epoch": 49.2351114257548, "img/sec/core": 731.4655069255581, "core_hours_NVIDIA A100-SXM4-40GB": 24.649162696924414, "core_hours": 24.649162696924414} {"step": 61650, "global_schedule": 0.4946800172328949, "l2_grads": 1.5976688861846924, "l2_params": 292.1671142578125, "l2_updates": 0.5147562623023987, "train/loss": 4.632476806640625, "uptime": 11449.671514826, "examples_seen": 63129600.0, "progress": 0.5474987344919763, "epoch": 49.27507499022376, "img/sec/core": 721.6197079706187, "core_hours_NVIDIA A100-SXM4-40GB": 24.668871446651078, "core_hours": 24.668871446651078} {"step": 61700, "global_schedule": 0.4939146637916565, "l2_grads": 1.5862892866134644, "l2_params": 292.0691833496094, "l2_updates": 0.5298694372177124, "train/loss": 2.6671862602233887, "uptime": 11458.453858427, "examples_seen": 63180800.0, "progress": 0.5479427723950516, "epoch": 49.31503855469271, "img/sec/core": 728.7348674528097, "core_hours_NVIDIA A100-SXM4-40GB": 24.688387765764414, "core_hours": 24.688387765764414} {"step": 61750, "global_schedule": 0.4931492209434509, "l2_grads": 1.7687864303588867, "l2_params": 291.98455810546875, "l2_updates": 0.5173996686935425, "train/loss": 2.1692442893981934, "uptime": 11467.304365068, "examples_seen": 63232000.0, "progress": 0.5483868102981271, "epoch": 49.35500211916167, "img/sec/core": 723.1224448046981, "core_hours_NVIDIA A100-SXM4-40GB": 24.70805555829997, "core_hours": 24.70805555829997} {"step": 61800, "global_schedule": 0.49238380789756775, "l2_grads": 1.6999567747116089, "l2_params": 291.9090270996094, "l2_updates": 0.5260985493659973, "train/loss": 2.160996913909912, "uptime": 11476.089684917, "examples_seen": 63283200.0, "progress": 0.5488308482012024, "epoch": 49.39496568363063, "img/sec/core": 728.4879901928315, "core_hours_NVIDIA A100-SXM4-40GB": 24.727578491297752, "core_hours": 24.727578491297752} {"step": 61850, "global_schedule": 0.49161839485168457, "l2_grads": 1.6589664220809937, "l2_params": 291.8172302246094, "l2_updates": 0.5021741390228271, "train/loss": 4.396081924438477, "uptime": 11484.991840679, "examples_seen": 63334400.0, "progress": 0.5492748861042779, "epoch": 49.434929248099586, "img/sec/core": 718.926984778148, "core_hours_NVIDIA A100-SXM4-40GB": 24.74736105965775, "core_hours": 24.74736105965775} {"step": 61900, "global_schedule": 0.49085307121276855, "l2_grads": 1.6122936010360718, "l2_params": 291.71624755859375, "l2_updates": 0.5262173414230347, "train/loss": 2.019509792327881, "uptime": 11493.728665019002, "examples_seen": 63385600.0, "progress": 0.5497189240073532, "epoch": 49.47489281256854, "img/sec/core": 732.5316099921632, "core_hours_NVIDIA A100-SXM4-40GB": 24.766776224857754, "core_hours": 24.766776224857754} {"step": 61950, "global_schedule": 0.4900877773761749, "l2_grads": 1.6764156818389893, "l2_params": 291.6340637207031, "l2_updates": 0.5331822633743286, "train/loss": 2.172581195831299, "uptime": 11502.714316198, "examples_seen": 63436800.0, "progress": 0.5501629619104287, "epoch": 49.514856377037496, "img/sec/core": 712.2466555298998, "core_hours_NVIDIA A100-SXM4-40GB": 24.78674433858886, "core_hours": 24.78674433858886} {"step": 62000, "global_schedule": 0.4893224835395813, "l2_grads": 1.6477559804916382, "l2_params": 291.542724609375, "l2_updates": 0.521976888179779, "train/loss": 2.1647586822509766, "uptime": 11511.561838815001, "examples_seen": 63488000.0, "progress": 0.550606999813504, "epoch": 49.55481994150645, "img/sec/core": 723.3663339500123, "core_hours_NVIDIA A100-SXM4-40GB": 24.806405499959975, "core_hours": 24.806405499959975} {"step": 62050, "global_schedule": 0.48855718970298767, "l2_grads": 1.7133346796035767, "l2_params": 291.4578857421875, "l2_updates": 0.5248113870620728, "train/loss": 2.08998703956604, "uptime": 11521.683339271001, "examples_seen": 63539200.0, "progress": 0.5510510377165795, "epoch": 49.594783505975414, "img/sec/core": 702.9745130053416, "core_hours_NVIDIA A100-SXM4-40GB": 24.826636990517745, "core_hours": 24.826636990517745} {"step": 62100, "global_schedule": 0.48779189586639404, "l2_grads": 1.673596978187561, "l2_params": 291.3644714355469, "l2_updates": 0.5116366147994995, "train/loss": 2.13344407081604, "uptime": 11531.416273761, "examples_seen": 63590400.0, "progress": 0.5514950756196549, "epoch": 49.63474707044437, "img/sec/core": 657.561191496383, "core_hours_NVIDIA A100-SXM4-40GB": 24.848265733828857, "core_hours": 24.848265733828857} {"step": 62150, "global_schedule": 0.48702675104141235, "l2_grads": 1.4923608303070068, "l2_params": 291.2796325683594, "l2_updates": 0.5078017115592957, "train/loss": 3.1419053077697754, "uptime": 11540.722768522, "examples_seen": 63641600.0, "progress": 0.5519391135227303, "epoch": 49.674710634913325, "img/sec/core": 687.6917856140567, "core_hours_NVIDIA A100-SXM4-40GB": 24.868946833297745, "core_hours": 24.868946833297745} {"step": 62200, "global_schedule": 0.4862615168094635, "l2_grads": 1.5369727611541748, "l2_params": 291.1910705566406, "l2_updates": 0.5126484632492065, "train/loss": 3.1679978370666504, "uptime": 11549.636735286002, "examples_seen": 63692800.0, "progress": 0.5523831514258057, "epoch": 49.71467419938228, "img/sec/core": 717.9744068427871, "core_hours_NVIDIA A100-SXM4-40GB": 24.88875564832886, "core_hours": 24.88875564832886} {"step": 62250, "global_schedule": 0.4854963421821594, "l2_grads": 1.650309443473816, "l2_params": 291.08380126953125, "l2_updates": 0.5219364762306213, "train/loss": 2.4132988452911377, "uptime": 11558.889863068, "examples_seen": 63744000.0, "progress": 0.5528271893288811, "epoch": 49.754637763851235, "img/sec/core": 691.6580156226953, "core_hours_NVIDIA A100-SXM4-40GB": 24.909318154511077, "core_hours": 24.909318154511077} {"step": 62300, "global_schedule": 0.48473116755485535, "l2_grads": 1.6137535572052002, "l2_params": 291.00299072265625, "l2_updates": 0.5056082606315613, "train/loss": 2.5832948684692383, "uptime": 11568.599492426, "examples_seen": 63795200.0, "progress": 0.5532712272319565, "epoch": 49.7946013283202, "img/sec/core": 659.1394752598887, "core_hours_NVIDIA A100-SXM4-40GB": 24.930895108639966, "core_hours": 24.930895108639966} {"step": 62350, "global_schedule": 0.48396605253219604, "l2_grads": 1.7839871644973755, "l2_params": 290.9041748046875, "l2_updates": 0.5072832703590393, "train/loss": 4.653111934661865, "uptime": 11578.40602168, "examples_seen": 63846400.0, "progress": 0.5537152651350319, "epoch": 49.83456489278915, "img/sec/core": 652.6264118764144, "core_hours_NVIDIA A100-SXM4-40GB": 24.952687395871077, "core_hours": 24.952687395871077} {"step": 62400, "global_schedule": 0.4832010567188263, "l2_grads": 1.4919865131378174, "l2_params": 290.82196044921875, "l2_updates": 0.5105322599411011, "train/loss": 4.512603282928467, "uptime": 11587.437833355, "examples_seen": 63897600.0, "progress": 0.5541593030381073, "epoch": 49.87452845725811, "img/sec/core": 708.6064491043528, "core_hours_NVIDIA A100-SXM4-40GB": 24.972758088482188, "core_hours": 24.972758088482188} {"step": 62450, "global_schedule": 0.48243603110313416, "l2_grads": 1.4879941940307617, "l2_params": 290.7393798828125, "l2_updates": 0.5112389326095581, "train/loss": 3.2689993381500244, "uptime": 11596.01639712, "examples_seen": 63948800.0, "progress": 0.5546033409411827, "epoch": 49.914492021727064, "img/sec/core": 746.0456290027432, "core_hours_NVIDIA A100-SXM4-40GB": 24.991821563515522, "core_hours": 24.991821563515522} {"step": 62500, "global_schedule": 0.481671005487442, "l2_grads": 1.675563097000122, "l2_params": 290.6316833496094, "l2_updates": 0.5149970650672913, "train/loss": 2.1252870559692383, "uptime": 11605.172979152, "examples_seen": 64000000.0, "progress": 0.5550473788442581, "epoch": 49.954455586196026, "img/sec/core": 698.950763247037, "core_hours_NVIDIA A100-SXM4-40GB": 25.012169523586632, "core_hours": 25.012169523586632, "val/acc@1": 0.68242, "val/loss": 1.279830390625, "z/secs/eval/val": 5.32851047299846} {"step": 62550, "global_schedule": 0.48090609908103943, "l2_grads": 1.6789871454238892, "l2_params": 290.5427551269531, "l2_updates": 0.499982088804245, "train/loss": 2.1705322265625, "uptime": 11618.956716477, "examples_seen": 64051200.0, "progress": 0.5554914167473336, "epoch": 49.99441915066498, "img/sec/core": 757.0216002903038, "core_hours_NVIDIA A100-SXM4-40GB": 25.030956599433303, "core_hours": 25.030956599433303} {"step": 62600, "global_schedule": 0.48014119267463684, "l2_grads": 1.5658149719238281, "l2_params": 290.45513916015625, "l2_updates": 0.5084957480430603, "train/loss": 2.726487159729004, "uptime": 11628.393106921, "examples_seen": 64102400.0, "progress": 0.5559354546504089, "epoch": 50.03438271513394, "img/sec/core": 678.2254335469509, "core_hours_NVIDIA A100-SXM4-40GB": 25.051926355975525, "core_hours": 25.051926355975525} {"step": 62650, "global_schedule": 0.4793763756752014, "l2_grads": 1.505605697631836, "l2_params": 290.3702392578125, "l2_updates": 0.5092558860778809, "train/loss": 3.8133087158203125, "uptime": 11637.38136039, "examples_seen": 64153600.0, "progress": 0.5563794925534844, "epoch": 50.07434627960289, "img/sec/core": 712.0404450178124, "core_hours_NVIDIA A100-SXM4-40GB": 25.071900252573304, "core_hours": 25.071900252573304} {"step": 62700, "global_schedule": 0.4786115884780884, "l2_grads": 1.698696494102478, "l2_params": 290.27777099609375, "l2_updates": 0.514374315738678, "train/loss": 2.0754342079162598, "uptime": 11646.011285303002, "examples_seen": 64204800.0, "progress": 0.5568235304565597, "epoch": 50.11430984407185, "img/sec/core": 741.6055254846189, "core_hours_NVIDIA A100-SXM4-40GB": 25.091077863491087, "core_hours": 25.091077863491087} {"step": 62750, "global_schedule": 0.47784683108329773, "l2_grads": 1.5609723329544067, "l2_params": 290.1966857910156, "l2_updates": 0.5048277378082275, "train/loss": 4.1668243408203125, "uptime": 11654.46910067, "examples_seen": 64256000.0, "progress": 0.5572675683596352, "epoch": 50.15427340854081, "img/sec/core": 756.69658443634, "core_hours_NVIDIA A100-SXM4-40GB": 25.10987300875108, "core_hours": 25.10987300875108} {"step": 62800, "global_schedule": 0.47708210349082947, "l2_grads": 1.5870428085327148, "l2_params": 290.1036376953125, "l2_updates": 0.5093359351158142, "train/loss": 3.513751983642578, "uptime": 11663.100394063002, "examples_seen": 64307200.0, "progress": 0.5577116062627105, "epoch": 50.194236973009765, "img/sec/core": 741.4879449224655, "core_hours_NVIDIA A100-SXM4-40GB": 25.12905366073553, "core_hours": 25.12905366073553} {"step": 62850, "global_schedule": 0.476317435503006, "l2_grads": 1.4784296751022339, "l2_params": 290.023681640625, "l2_updates": 0.507732629776001, "train/loss": 3.757829427719116, "uptime": 11672.487805903, "examples_seen": 64358400.0, "progress": 0.558155644165786, "epoch": 50.23420053747872, "img/sec/core": 681.7640590488144, "core_hours_NVIDIA A100-SXM4-40GB": 25.149914575935522, "core_hours": 25.149914575935522} {"step": 62900, "global_schedule": 0.47555291652679443, "l2_grads": 1.4803229570388794, "l2_params": 289.9324951171875, "l2_updates": 0.511328935623169, "train/loss": 2.891477108001709, "uptime": 11682.058266676, "examples_seen": 64409600.0, "progress": 0.5585996820688613, "epoch": 50.274164101947676, "img/sec/core": 668.7243333210565, "core_hours_NVIDIA A100-SXM4-40GB": 25.171182266542193, "core_hours": 25.171182266542193} {"step": 62950, "global_schedule": 0.4747883677482605, "l2_grads": 1.7114088535308838, "l2_params": 289.84136962890625, "l2_updates": 0.5132813453674316, "train/loss": 2.4864025115966797, "uptime": 11691.621589842, "examples_seen": 64460800.0, "progress": 0.5590437199719368, "epoch": 50.31412766641663, "img/sec/core": 669.2234371786113, "core_hours_NVIDIA A100-SXM4-40GB": 25.192434095799968, "core_hours": 25.192434095799968} {"step": 63000, "global_schedule": 0.47402387857437134, "l2_grads": 1.7872835397720337, "l2_params": 289.7613830566406, "l2_updates": 0.5031929612159729, "train/loss": 2.165510416030884, "uptime": 11701.240920485, "examples_seen": 64512000.0, "progress": 0.5594877578750123, "epoch": 50.354091230885594, "img/sec/core": 665.3269585506538, "core_hours_NVIDIA A100-SXM4-40GB": 25.213810386117746, "core_hours": 25.213810386117746} {"step": 63050, "global_schedule": 0.47325944900512695, "l2_grads": 1.7122201919555664, "l2_params": 289.6705017089844, "l2_updates": 0.5104068517684937, "train/loss": 2.1431632041931152, "uptime": 11710.490279497999, "examples_seen": 64563200.0, "progress": 0.5599317957780876, "epoch": 50.39405479535455, "img/sec/core": 745.8680120090219, "core_hours_NVIDIA A100-SXM4-40GB": 25.232878400824415, "core_hours": 25.232878400824415} {"step": 63100, "global_schedule": 0.47249510884284973, "l2_grads": 1.5781421661376953, "l2_params": 289.5827941894531, "l2_updates": 0.504723072052002, "train/loss": 2.625422239303589, "uptime": 11720.093699613999, "examples_seen": 64614400.0, "progress": 0.5603758336811631, "epoch": 50.434018359823504, "img/sec/core": 666.4292431960878, "core_hours_NVIDIA A100-SXM4-40GB": 25.254219334415527, "core_hours": 25.254219334415527} {"step": 63150, "global_schedule": 0.4717308580875397, "l2_grads": 1.7845070362091064, "l2_params": 289.497802734375, "l2_updates": 0.5009999871253967, "train/loss": 2.171513557434082, "uptime": 11728.699624873001, "examples_seen": 64665600.0, "progress": 0.5608198715842384, "epoch": 50.47398192429246, "img/sec/core": 743.6736675472949, "core_hours_NVIDIA A100-SXM4-40GB": 25.273343612768866, "core_hours": 25.273343612768866} {"step": 63200, "global_schedule": 0.470966637134552, "l2_grads": 1.741355299949646, "l2_params": 289.4144592285156, "l2_updates": 0.5008387565612793, "train/loss": 2.1033546924591064, "uptime": 11736.789300126, "examples_seen": 64716800.0, "progress": 0.5612639094873139, "epoch": 50.513945488761415, "img/sec/core": 791.1318810514065, "core_hours_NVIDIA A100-SXM4-40GB": 25.291320668886637, "core_hours": 25.291320668886637} {"step": 63250, "global_schedule": 0.4702025055885315, "l2_grads": 1.7176525592803955, "l2_params": 289.3423156738281, "l2_updates": 0.49952542781829834, "train/loss": 2.220961332321167, "uptime": 11745.349366099, "examples_seen": 64768000.0, "progress": 0.5617079473903892, "epoch": 50.55390905323038, "img/sec/core": 747.6577891088926, "core_hours_NVIDIA A100-SXM4-40GB": 25.31034303771553, "core_hours": 25.31034303771553} {"step": 63300, "global_schedule": 0.4694384038448334, "l2_grads": 1.7216277122497559, "l2_params": 289.2537536621094, "l2_updates": 0.5030471086502075, "train/loss": 2.1916606426239014, "uptime": 11754.109776029001, "examples_seen": 64819200.0, "progress": 0.5621519852934647, "epoch": 50.59387261769933, "img/sec/core": 730.5594202941091, "core_hours_NVIDIA A100-SXM4-40GB": 25.329810615337752, "core_hours": 25.329810615337752} {"step": 63350, "global_schedule": 0.4686744809150696, "l2_grads": 1.753218650817871, "l2_params": 289.1451110839844, "l2_updates": 0.49540990591049194, "train/loss": 2.3224971294403076, "uptime": 11763.512178519, "examples_seen": 64870400.0, "progress": 0.56259602319654, "epoch": 50.63383618216829, "img/sec/core": 680.6770936265917, "core_hours_NVIDIA A100-SXM4-40GB": 25.350704843093308, "core_hours": 25.350704843093308} {"step": 63400, "global_schedule": 0.4679105281829834, "l2_grads": 1.6431552171707153, "l2_params": 289.0600891113281, "l2_updates": 0.4959113597869873, "train/loss": 2.047410488128662, "uptime": 11773.238534598999, "examples_seen": 64921600.0, "progress": 0.5630400610996155, "epoch": 50.67379974663724, "img/sec/core": 658.0059322690429, "core_hours_NVIDIA A100-SXM4-40GB": 25.372318967715525, "core_hours": 25.372318967715525} {"step": 63450, "global_schedule": 0.467146635055542, "l2_grads": 1.81376051902771, "l2_params": 288.9745178222656, "l2_updates": 0.4982103705406189, "train/loss": 2.115041971206665, "uptime": 11782.831473575001, "examples_seen": 64972800.0, "progress": 0.5634840990026909, "epoch": 50.713763311106206, "img/sec/core": 667.157376483924, "core_hours_NVIDIA A100-SXM4-40GB": 25.39363660988442, "core_hours": 25.39363660988442} {"step": 63500, "global_schedule": 0.46638283133506775, "l2_grads": 1.730592966079712, "l2_params": 288.8861999511719, "l2_updates": 0.4912271201610565, "train/loss": 2.286778211593628, "uptime": 11791.894872452, "examples_seen": 65024000.0, "progress": 0.5639281369057663, "epoch": 50.75372687557516, "img/sec/core": 706.1368573595578, "core_hours_NVIDIA A100-SXM4-40GB": 25.41377749627775, "core_hours": 25.41377749627775} {"step": 63550, "global_schedule": 0.4656190872192383, "l2_grads": 1.71208655834198, "l2_params": 288.7911376953125, "l2_updates": 0.49747002124786377, "train/loss": 2.155242919921875, "uptime": 11801.599975873001, "examples_seen": 65075200.0, "progress": 0.5643721748088417, "epoch": 50.79369044004412, "img/sec/core": 659.4468623745419, "core_hours_NVIDIA A100-SXM4-40GB": 25.435344392768865, "core_hours": 25.435344392768865} {"step": 63600, "global_schedule": 0.4648555517196655, "l2_grads": 1.60942542552948, "l2_params": 288.69390869140625, "l2_updates": 0.4802576005458832, "train/loss": 3.9981932640075684, "uptime": 11811.151845497001, "examples_seen": 65126400.0, "progress": 0.5648162127119171, "epoch": 50.83365400451307, "img/sec/core": 670.025895654983, "core_hours_NVIDIA A100-SXM4-40GB": 25.45657076971109, "core_hours": 25.45657076971109} {"step": 63650, "global_schedule": 0.4640919864177704, "l2_grads": 1.577750325202942, "l2_params": 288.59393310546875, "l2_updates": 0.4789760708808899, "train/loss": 4.4117937088012695, "uptime": 11820.923991004, "examples_seen": 65177600.0, "progress": 0.5652602506149925, "epoch": 50.87361756898203, "img/sec/core": 654.9227081623408, "core_hours_NVIDIA A100-SXM4-40GB": 25.47828664861553, "core_hours": 25.47828664861553} {"step": 63700, "global_schedule": 0.4633285105228424, "l2_grads": 1.617362141609192, "l2_params": 288.4862365722656, "l2_updates": 0.4890870749950409, "train/loss": 2.087843656539917, "uptime": 11830.652633030999, "examples_seen": 65228800.0, "progress": 0.5657042885180679, "epoch": 50.91358113345099, "img/sec/core": 657.8513200751428, "core_hours_NVIDIA A100-SXM4-40GB": 25.49990585311997, "core_hours": 25.49990585311997} {"step": 63750, "global_schedule": 0.4625651240348816, "l2_grads": 1.6480505466461182, "l2_params": 288.4093933105469, "l2_updates": 0.4851861000061035, "train/loss": 2.5115110874176025, "uptime": 11839.609790235, "examples_seen": 65280000.0, "progress": 0.5661483264211433, "epoch": 50.953544697919945, "img/sec/core": 714.5124121681897, "core_hours_NVIDIA A100-SXM4-40GB": 25.519810646906638, "core_hours": 25.519810646906638} {"step": 63800, "global_schedule": 0.4618018567562103, "l2_grads": 1.5461432933807373, "l2_params": 288.3057861328125, "l2_updates": 0.4908742904663086, "train/loss": 4.036013126373291, "uptime": 11848.127252312, "examples_seen": 65331200.0, "progress": 0.5665923643242187, "epoch": 50.9935082623889, "img/sec/core": 751.397533929878, "core_hours_NVIDIA A100-SXM4-40GB": 25.538738340411086, "core_hours": 25.538738340411086} {"step": 63850, "global_schedule": 0.4610387086868286, "l2_grads": 1.7409712076187134, "l2_params": 288.2254638671875, "l2_updates": 0.487287312746048, "train/loss": 2.067500591278076, "uptime": 11857.609681930999, "examples_seen": 65382400.0, "progress": 0.5670364022272941, "epoch": 51.033471826857856, "img/sec/core": 674.9325075060444, "core_hours_NVIDIA A100-SXM4-40GB": 25.55981040623108, "core_hours": 25.55981040623108} {"step": 63900, "global_schedule": 0.46027565002441406, "l2_grads": 1.7243577241897583, "l2_params": 288.13934326171875, "l2_updates": 0.4916769862174988, "train/loss": 2.134110450744629, "uptime": 11867.093076736002, "examples_seen": 65433600.0, "progress": 0.5674804401303696, "epoch": 51.07343539132681, "img/sec/core": 674.8638152893553, "core_hours_NVIDIA A100-SXM4-40GB": 25.580884616908868, "core_hours": 25.580884616908868} {"step": 63950, "global_schedule": 0.4595125913619995, "l2_grads": 1.8360947370529175, "l2_params": 288.0559997558594, "l2_updates": 0.4949309527873993, "train/loss": 2.171231508255005, "uptime": 11876.054793796002, "examples_seen": 65484800.0, "progress": 0.5679244780334449, "epoch": 51.11339895579577, "img/sec/core": 714.1488575405165, "core_hours_NVIDIA A100-SXM4-40GB": 25.600799543708867, "core_hours": 25.600799543708867} {"step": 64000, "global_schedule": 0.4587496519088745, "l2_grads": 1.8446133136749268, "l2_params": 287.9627990722656, "l2_updates": 0.47624263167381287, "train/loss": 2.2201852798461914, "uptime": 11884.738397957002, "examples_seen": 65536000.0, "progress": 0.5683685159365204, "epoch": 51.15336252026473, "img/sec/core": 737.0211586501753, "core_hours_NVIDIA A100-SXM4-40GB": 25.62009644184442, "core_hours": 25.62009644184442} {"step": 64050, "global_schedule": 0.45798683166503906, "l2_grads": 1.62282133102417, "l2_params": 287.8699645996094, "l2_updates": 0.48356494307518005, "train/loss": 2.523153066635132, "uptime": 11893.620437542, "examples_seen": 65587200.0, "progress": 0.5688125538395957, "epoch": 51.193326084733684, "img/sec/core": 783.284829895125, "core_hours_NVIDIA A100-SXM4-40GB": 25.638253594491086, "core_hours": 25.638253594491086} {"step": 64100, "global_schedule": 0.45722419023513794, "l2_grads": 1.7638205289840698, "l2_params": 287.7843322753906, "l2_updates": 0.48728007078170776, "train/loss": 2.0769851207733154, "uptime": 11902.657400180002, "examples_seen": 65638400.0, "progress": 0.5692565917426712, "epoch": 51.23328964920264, "img/sec/core": 708.2025517165681, "core_hours_NVIDIA A100-SXM4-40GB": 25.65833573368665, "core_hours": 25.65833573368665} {"step": 64150, "global_schedule": 0.4564615488052368, "l2_grads": 1.6118230819702148, "l2_params": 287.6978454589844, "l2_updates": 0.47614917159080505, "train/loss": 4.450575828552246, "uptime": 11911.184684085, "examples_seen": 65689600.0, "progress": 0.5697006296457465, "epoch": 51.273253213671595, "img/sec/core": 750.5320652276089, "core_hours_NVIDIA A100-SXM4-40GB": 25.677285253475528, "core_hours": 25.677285253475528} {"step": 64200, "global_schedule": 0.45569899678230286, "l2_grads": 1.5207756757736206, "l2_params": 287.6111755371094, "l2_updates": 0.4824886620044708, "train/loss": 2.98306941986084, "uptime": 11919.886010306001, "examples_seen": 65740800.0, "progress": 0.570144667548822, "epoch": 51.31321677814056, "img/sec/core": 735.5200618214428, "core_hours_NVIDIA A100-SXM4-40GB": 25.696621533966646, "core_hours": 25.696621533966646} {"step": 64250, "global_schedule": 0.45493656396865845, "l2_grads": 1.827038049697876, "l2_params": 287.510986328125, "l2_updates": 0.48116108775138855, "train/loss": 2.151526689529419, "uptime": 11928.570534616001, "examples_seen": 65792000.0, "progress": 0.5705887054518973, "epoch": 51.35318034260951, "img/sec/core": 736.9430692514499, "core_hours_NVIDIA A100-SXM4-40GB": 25.715920476877752, "core_hours": 25.715920476877752} {"step": 64300, "global_schedule": 0.4541742205619812, "l2_grads": 1.6497273445129395, "l2_params": 287.4195556640625, "l2_updates": 0.4741954207420349, "train/loss": 3.1882848739624023, "uptime": 11937.134973080001, "examples_seen": 65843200.0, "progress": 0.5710327433549728, "epoch": 51.39314390707847, "img/sec/core": 747.2760796755042, "core_hours_NVIDIA A100-SXM4-40GB": 25.73495256235331, "core_hours": 25.73495256235331} {"step": 64350, "global_schedule": 0.45341211557388306, "l2_grads": 1.6543800830841064, "l2_params": 287.32379150390625, "l2_updates": 0.4875575602054596, "train/loss": 2.004314661026001, "uptime": 11945.764478817002, "examples_seen": 65894400.0, "progress": 0.5714767812580482, "epoch": 51.43310747154742, "img/sec/core": 741.6415487805662, "core_hours_NVIDIA A100-SXM4-40GB": 25.75412924176887, "core_hours": 25.75412924176887} {"step": 64400, "global_schedule": 0.4526500105857849, "l2_grads": 1.6139886379241943, "l2_params": 287.2471618652344, "l2_updates": 0.47197601199150085, "train/loss": 4.024373531341553, "uptime": 11954.390825495002, "examples_seen": 65945600.0, "progress": 0.5719208191611236, "epoch": 51.473071036016385, "img/sec/core": 741.9131457262205, "core_hours_NVIDIA A100-SXM4-40GB": 25.773298901053312, "core_hours": 25.773298901053312} {"step": 64450, "global_schedule": 0.4518880546092987, "l2_grads": 1.568906307220459, "l2_params": 287.1490478515625, "l2_updates": 0.475285142660141, "train/loss": 4.610140323638916, "uptime": 11964.059293311, "examples_seen": 65996800.0, "progress": 0.572364857064199, "epoch": 51.51303460048534, "img/sec/core": 661.9456279732442, "core_hours_NVIDIA A100-SXM4-40GB": 25.794784385088864, "core_hours": 25.794784385088864} {"step": 64500, "global_schedule": 0.4511261582374573, "l2_grads": 1.6455914974212646, "l2_params": 287.0628967285156, "l2_updates": 0.4786751866340637, "train/loss": 3.917559862136841, "uptime": 11973.504508154, "examples_seen": 66048000.0, "progress": 0.5728088949672744, "epoch": 51.552998164954296, "img/sec/core": 677.5917865694435, "core_hours_NVIDIA A100-SXM4-40GB": 25.815773751406642, "core_hours": 25.815773751406642} {"step": 64550, "global_schedule": 0.45036444067955017, "l2_grads": 1.7066789865493774, "l2_params": 286.97674560546875, "l2_updates": 0.470653235912323, "train/loss": 2.8350977897644043, "uptime": 11982.151362233, "examples_seen": 66099200.0, "progress": 0.5732529328703498, "epoch": 51.59296172942325, "img/sec/core": 740.1535797328235, "core_hours_NVIDIA A100-SXM4-40GB": 25.834988982693307, "core_hours": 25.834988982693307} {"step": 64600, "global_schedule": 0.4496028423309326, "l2_grads": 1.5512113571166992, "l2_params": 286.8908386230469, "l2_updates": 0.47613218426704407, "train/loss": 3.3775503635406494, "uptime": 11990.658236592002, "examples_seen": 66150400.0, "progress": 0.5736969707734252, "epoch": 51.63292529389221, "img/sec/core": 752.3327287921728, "core_hours_NVIDIA A100-SXM4-40GB": 25.853893147935537, "core_hours": 25.853893147935537} {"step": 64650, "global_schedule": 0.44884130358695984, "l2_grads": 1.7151811122894287, "l2_params": 286.8102111816406, "l2_updates": 0.48089689016342163, "train/loss": 2.1910762786865234, "uptime": 11999.196972994001, "examples_seen": 66201600.0, "progress": 0.5741410086765006, "epoch": 51.67288885836117, "img/sec/core": 749.5254214079932, "core_hours_NVIDIA A100-SXM4-40GB": 25.872868117717754, "core_hours": 25.872868117717754} {"step": 64700, "global_schedule": 0.4480798542499542, "l2_grads": 1.7003848552703857, "l2_params": 286.7137756347656, "l2_updates": 0.47903352975845337, "train/loss": 2.167238473892212, "uptime": 12007.842057005999, "examples_seen": 66252800.0, "progress": 0.574585046579576, "epoch": 51.712852422830125, "img/sec/core": 740.3051249840892, "core_hours_NVIDIA A100-SXM4-40GB": 25.892079415522193, "core_hours": 25.892079415522193} {"step": 64750, "global_schedule": 0.44731855392456055, "l2_grads": 1.7103608846664429, "l2_params": 286.61102294921875, "l2_updates": 0.47654837369918823, "train/loss": 2.0705924034118652, "uptime": 12016.390742129, "examples_seen": 66304000.0, "progress": 0.5750290844826514, "epoch": 51.75281598729908, "img/sec/core": 748.6531446549312, "core_hours_NVIDIA A100-SXM4-40GB": 25.91107649357331, "core_hours": 25.91107649357331} {"step": 64800, "global_schedule": 0.44655749201774597, "l2_grads": 1.5581690073013306, "l2_params": 286.5229797363281, "l2_updates": 0.47530150413513184, "train/loss": 2.7470245361328125, "uptime": 12025.768905821, "examples_seen": 66355200.0, "progress": 0.5754731223857269, "epoch": 51.792779551768035, "img/sec/core": 682.4363713612642, "core_hours_NVIDIA A100-SXM4-40GB": 25.93191685733331, "core_hours": 25.93191685733331} {"step": 64850, "global_schedule": 0.4457964599132538, "l2_grads": 1.557999849319458, "l2_params": 286.4271240234375, "l2_updates": 0.47188156843185425, "train/loss": 3.714937448501587, "uptime": 12034.465199361, "examples_seen": 66406400.0, "progress": 0.5759171602888022, "epoch": 51.83274311623699, "img/sec/core": 735.9457187779726, "core_hours_NVIDIA A100-SXM4-40GB": 25.951241954088864, "core_hours": 25.951241954088864} {"step": 64900, "global_schedule": 0.44503551721572876, "l2_grads": 1.6692562103271484, "l2_params": 286.3435974121094, "l2_updates": 0.4661714732646942, "train/loss": 2.439120292663574, "uptime": 12043.362156825, "examples_seen": 66457600.0, "progress": 0.5763611981918777, "epoch": 51.87270668070595, "img/sec/core": 719.3470381191327, "core_hours_NVIDIA A100-SXM4-40GB": 25.97101297067553, "core_hours": 25.97101297067553} {"step": 64950, "global_schedule": 0.4442747235298157, "l2_grads": 1.5818543434143066, "l2_params": 286.23968505859375, "l2_updates": 0.4820958375930786, "train/loss": 2.691359519958496, "uptime": 12053.000328158001, "examples_seen": 66508800.0, "progress": 0.576805236094953, "epoch": 51.91267024517491, "img/sec/core": 664.0263779173971, "core_hours_NVIDIA A100-SXM4-40GB": 25.992431129193314, "core_hours": 25.992431129193314} {"step": 65000, "global_schedule": 0.4435141086578369, "l2_grads": 1.6838563680648804, "l2_params": 286.15240478515625, "l2_updates": 0.4664704501628876, "train/loss": 2.0249366760253906, "uptime": 12062.102148970002, "examples_seen": 66560000.0, "progress": 0.5772492739980285, "epoch": 51.952633809643864, "img/sec/core": 703.1560093516529, "core_hours_NVIDIA A100-SXM4-40GB": 26.012657397664423, "core_hours": 26.012657397664423, "val/acc@1": 0.68678, "val/loss": 1.2913129931640626, "z/secs/eval/val": 2.6491948069997306} {"step": 65050, "global_schedule": 0.4427536427974701, "l2_grads": 1.5272914171218872, "l2_params": 286.0513916015625, "l2_updates": 0.4643000066280365, "train/loss": 3.954793691635132, "uptime": 12073.803499177002, "examples_seen": 66611200.0, "progress": 0.5776933119011038, "epoch": 51.99259737411282, "img/sec/core": 762.3072526921868, "core_hours_NVIDIA A100-SXM4-40GB": 26.031314208513322, "core_hours": 26.031314208513322} {"step": 65100, "global_schedule": 0.44199323654174805, "l2_grads": 1.5805121660232544, "l2_params": 285.979248046875, "l2_updates": 0.4666621685028076, "train/loss": 3.7351019382476807, "uptime": 12083.098937542001, "examples_seen": 66662400.0, "progress": 0.5781373498041793, "epoch": 52.032560938581774, "img/sec/core": 688.5097559355819, "core_hours_NVIDIA A100-SXM4-40GB": 26.05197073821332, "core_hours": 26.05197073821332} {"step": 65150, "global_schedule": 0.4412330389022827, "l2_grads": 1.7495629787445068, "l2_params": 285.88458251953125, "l2_updates": 0.4674721360206604, "train/loss": 2.275722026824951, "uptime": 12092.031133526, "examples_seen": 66713600.0, "progress": 0.5785813877072546, "epoch": 52.07252450305074, "img/sec/core": 716.50913296859, "core_hours_NVIDIA A100-SXM4-40GB": 26.071820062622205, "core_hours": 26.071820062622205} {"step": 65200, "global_schedule": 0.44047290086746216, "l2_grads": 1.7167881727218628, "l2_params": 285.7965087890625, "l2_updates": 0.4681723117828369, "train/loss": 2.0296781063079834, "uptime": 12101.554488603999, "examples_seen": 66764800.0, "progress": 0.5790254256103301, "epoch": 52.11248806751969, "img/sec/core": 672.0320672265052, "core_hours_NVIDIA A100-SXM4-40GB": 26.092983073906648, "core_hours": 26.092983073906648} {"step": 65250, "global_schedule": 0.43971291184425354, "l2_grads": 1.5700703859329224, "l2_params": 285.7068786621094, "l2_updates": 0.46150800585746765, "train/loss": 4.0578718185424805, "uptime": 12110.542103724, "examples_seen": 66816000.0, "progress": 0.5794694635134056, "epoch": 52.15245163198865, "img/sec/core": 712.0910179784829, "core_hours_NVIDIA A100-SXM4-40GB": 26.112955551951092, "core_hours": 26.112955551951092} {"step": 65300, "global_schedule": 0.4389531910419464, "l2_grads": 1.5922026634216309, "l2_params": 285.61029052734375, "l2_updates": 0.4692150354385376, "train/loss": 2.4624407291412354, "uptime": 12119.706719081, "examples_seen": 66867200.0, "progress": 0.5799135014164809, "epoch": 52.1924151964576, "img/sec/core": 698.3380917467127, "core_hours_NVIDIA A100-SXM4-40GB": 26.13332136385554, "core_hours": 26.13332136385554} {"step": 65350, "global_schedule": 0.43819350004196167, "l2_grads": 1.6953405141830444, "l2_params": 285.52581787109375, "l2_updates": 0.46772050857543945, "train/loss": 2.1252424716949463, "uptime": 12128.908897798, "examples_seen": 66918400.0, "progress": 0.5803575393195564, "epoch": 52.23237876092656, "img/sec/core": 695.4874706112432, "core_hours_NVIDIA A100-SXM4-40GB": 26.15377064989332, "core_hours": 26.15377064989332} {"step": 65400, "global_schedule": 0.4374339282512665, "l2_grads": 1.7293410301208496, "l2_params": 285.4352111816406, "l2_updates": 0.46733710169792175, "train/loss": 2.16120982170105, "uptime": 12138.632802544, "examples_seen": 66969600.0, "progress": 0.5808015772226317, "epoch": 52.27234232539552, "img/sec/core": 658.1718113429098, "core_hours_NVIDIA A100-SXM4-40GB": 26.17537932710665, "core_hours": 26.17537932710665} {"step": 65450, "global_schedule": 0.4366745054721832, "l2_grads": 1.7236493825912476, "l2_params": 285.3540344238281, "l2_updates": 0.4663788676261902, "train/loss": 2.0584840774536133, "uptime": 12147.987898246001, "examples_seen": 67020800.0, "progress": 0.5812456151257072, "epoch": 52.312305889864476, "img/sec/core": 684.1191371917972, "core_hours_NVIDIA A100-SXM4-40GB": 26.196168428666656, "core_hours": 26.196168428666656} {"step": 65500, "global_schedule": 0.4359152317047119, "l2_grads": 1.5405510663986206, "l2_params": 285.27166748046875, "l2_updates": 0.45552557706832886, "train/loss": 3.5063672065734863, "uptime": 12157.216293781, "examples_seen": 67072000.0, "progress": 0.5816896530287825, "epoch": 52.35226945433343, "img/sec/core": 693.5116701194138, "core_hours_NVIDIA A100-SXM4-40GB": 26.216675974299985, "core_hours": 26.216675974299985} {"step": 65550, "global_schedule": 0.4351562559604645, "l2_grads": 1.5415648221969604, "l2_params": 285.1905822753906, "l2_updates": 0.47068336606025696, "train/loss": 2.7326412200927734, "uptime": 12165.947995755001, "examples_seen": 67123200.0, "progress": 0.582133690931858, "epoch": 52.392233018802386, "img/sec/core": 732.9613423656423, "core_hours_NVIDIA A100-SXM4-40GB": 26.236079756464434, "core_hours": 26.236079756464434} {"step": 65600, "global_schedule": 0.43439728021621704, "l2_grads": 1.8208796977996826, "l2_params": 285.0943908691406, "l2_updates": 0.45770764350891113, "train/loss": 4.457228660583496, "uptime": 12174.935097797, "examples_seen": 67174400.0, "progress": 0.5825777288349333, "epoch": 52.43219658327135, "img/sec/core": 712.1316715990039, "core_hours_NVIDIA A100-SXM4-40GB": 26.25605109433554, "core_hours": 26.25605109433554} {"step": 65650, "global_schedule": 0.43363848328590393, "l2_grads": 1.7309566736221313, "l2_params": 285.0043640136719, "l2_updates": 0.46244099736213684, "train/loss": 2.098846435546875, "uptime": 12184.395055130999, "examples_seen": 67225600.0, "progress": 0.5830217667380088, "epoch": 52.472160147740304, "img/sec/core": 676.5358208328192, "core_hours_NVIDIA A100-SXM4-40GB": 26.277073221744427, "core_hours": 26.277073221744427} {"step": 65700, "global_schedule": 0.43287989497184753, "l2_grads": 1.709912896156311, "l2_params": 284.922119140625, "l2_updates": 0.4522880017757416, "train/loss": 2.2969422340393066, "uptime": 12194.017776742001, "examples_seen": 67276800.0, "progress": 0.5834658046410842, "epoch": 52.51212371220926, "img/sec/core": 665.0925027990744, "core_hours_NVIDIA A100-SXM4-40GB": 26.298457047546655, "core_hours": 26.298457047546655} {"step": 65750, "global_schedule": 0.4321214556694031, "l2_grads": 1.6104649305343628, "l2_params": 284.8275451660156, "l2_updates": 0.45738378167152405, "train/loss": 2.817919969558716, "uptime": 12202.723552626, "examples_seen": 67328000.0, "progress": 0.5839098425441596, "epoch": 52.552087276678215, "img/sec/core": 735.1441256101672, "core_hours_NVIDIA A100-SXM4-40GB": 26.31780321617776, "core_hours": 26.31780321617776} {"step": 65800, "global_schedule": 0.4313631057739258, "l2_grads": 1.758495807647705, "l2_params": 284.7439270019531, "l2_updates": 0.4568568766117096, "train/loss": 2.025193214416504, "uptime": 12211.473230894999, "examples_seen": 67379200.0, "progress": 0.584353880447235, "epoch": 52.59205084114717, "img/sec/core": 731.4554665027446, "core_hours_NVIDIA A100-SXM4-40GB": 26.33724694566443, "core_hours": 26.33724694566443} {"step": 65850, "global_schedule": 0.4306049942970276, "l2_grads": 1.6269476413726807, "l2_params": 284.6401672363281, "l2_updates": 0.45487359166145325, "train/loss": 3.8699231147766113, "uptime": 12220.723332222, "examples_seen": 67430400.0, "progress": 0.5847979183503104, "epoch": 52.63201440561613, "img/sec/core": 691.8843128040457, "core_hours_NVIDIA A100-SXM4-40GB": 26.357802726391093, "core_hours": 26.357802726391093} {"step": 65900, "global_schedule": 0.42984700202941895, "l2_grads": 1.8535600900650024, "l2_params": 284.5458679199219, "l2_updates": 0.4534273147583008, "train/loss": 2.085303783416748, "uptime": 12230.355287248001, "examples_seen": 67481600.0, "progress": 0.5852419562533858, "epoch": 52.67197797008509, "img/sec/core": 664.45492973371, "core_hours_NVIDIA A100-SXM4-40GB": 26.37920707089332, "core_hours": 26.37920707089332} {"step": 65950, "global_schedule": 0.42908912897109985, "l2_grads": 1.8636131286621094, "l2_params": 284.45806884765625, "l2_updates": 0.44243595004081726, "train/loss": 2.0904669761657715, "uptime": 12239.705458130002, "examples_seen": 67532800.0, "progress": 0.5856859941564612, "epoch": 52.71194153455404, "img/sec/core": 684.479468960334, "core_hours_NVIDIA A100-SXM4-40GB": 26.399985228408877, "core_hours": 26.399985228408877} {"step": 66000, "global_schedule": 0.428331583738327, "l2_grads": 1.7001526355743408, "l2_params": 284.3641052246094, "l2_updates": 0.4499160051345825, "train/loss": 4.63353967666626, "uptime": 12248.308430882002, "examples_seen": 67584000.0, "progress": 0.5861300320595366, "epoch": 52.751905099023, "img/sec/core": 743.928893476061, "core_hours_NVIDIA A100-SXM4-40GB": 26.419102945635544, "core_hours": 26.419102945635544} {"step": 66050, "global_schedule": 0.4275740683078766, "l2_grads": 1.6314244270324707, "l2_params": 284.27679443359375, "l2_updates": 0.4480111002922058, "train/loss": 2.8891420364379883, "uptime": 12257.548951237999, "examples_seen": 67635200.0, "progress": 0.586574069962612, "epoch": 52.791868663491954, "img/sec/core": 776.0122987378436, "core_hours_NVIDIA A100-SXM4-40GB": 26.437430261124426, "core_hours": 26.437430261124426} {"step": 66100, "global_schedule": 0.4268167316913605, "l2_grads": 1.7993319034576416, "l2_params": 284.1799011230469, "l2_updates": 0.4545363187789917, "train/loss": 2.0776586532592773, "uptime": 12266.378494949002, "examples_seen": 67686400.0, "progress": 0.5870181078656874, "epoch": 52.831832227960916, "img/sec/core": 724.8392679708646, "core_hours_NVIDIA A100-SXM4-40GB": 26.4570514693711, "core_hours": 26.4570514693711} {"step": 66150, "global_schedule": 0.4260595440864563, "l2_grads": 1.8442503213882446, "l2_params": 284.0934753417969, "l2_updates": 0.4462603032588959, "train/loss": 4.414790630340576, "uptime": 12275.026273051002, "examples_seen": 67737600.0, "progress": 0.5874621457687628, "epoch": 52.87179579242987, "img/sec/core": 740.0744936459027, "core_hours_NVIDIA A100-SXM4-40GB": 26.476268754042213, "core_hours": 26.476268754042213} {"step": 66200, "global_schedule": 0.42530256509780884, "l2_grads": 1.8386774063110352, "l2_params": 284.0086669921875, "l2_updates": 0.46510523557662964, "train/loss": 2.1443898677825928, "uptime": 12284.061187061, "examples_seen": 67788800.0, "progress": 0.5879061836718382, "epoch": 52.91175935689883, "img/sec/core": 708.3631336079665, "core_hours_NVIDIA A100-SXM4-40GB": 26.496346340731098, "core_hours": 26.496346340731098} {"step": 66250, "global_schedule": 0.42454585433006287, "l2_grads": 1.77524733543396, "l2_params": 283.9229431152344, "l2_updates": 0.45367464423179626, "train/loss": 2.2390427589416504, "uptime": 12293.227193646, "examples_seen": 67840000.0, "progress": 0.5883502215749137, "epoch": 52.95172292136778, "img/sec/core": 698.2320971133463, "core_hours_NVIDIA A100-SXM4-40GB": 26.51671524425332, "core_hours": 26.51671524425332} {"step": 66300, "global_schedule": 0.42378920316696167, "l2_grads": 1.629040002822876, "l2_params": 283.819091796875, "l2_updates": 0.44717609882354736, "train/loss": 4.488638401031494, "uptime": 12301.938914559001, "examples_seen": 67891200.0, "progress": 0.588794259477989, "epoch": 52.99168648583674, "img/sec/core": 734.6424505460087, "core_hours_NVIDIA A100-SXM4-40GB": 26.53607462405999, "core_hours": 26.53607462405999} {"step": 66350, "global_schedule": 0.4230327308177948, "l2_grads": 1.6603641510009766, "l2_params": 283.73114013671875, "l2_updates": 0.4506077468395233, "train/loss": 2.353626251220703, "uptime": 12311.984630844001, "examples_seen": 67942400.0, "progress": 0.5892382973810645, "epoch": 53.0316500503057, "img/sec/core": 637.0874727525842, "core_hours_NVIDIA A100-SXM4-40GB": 26.558398438026654, "core_hours": 26.558398438026654} {"step": 66400, "global_schedule": 0.42227649688720703, "l2_grads": 1.705607533454895, "l2_params": 283.6302185058594, "l2_updates": 0.44212064146995544, "train/loss": 2.866266965866089, "uptime": 12321.305626422001, "examples_seen": 67993600.0, "progress": 0.5896823352841398, "epoch": 53.071613614774655, "img/sec/core": 686.6219328657854, "core_hours_NVIDIA A100-SXM4-40GB": 26.579111761533323, "core_hours": 26.579111761533323} {"step": 66450, "global_schedule": 0.4215204119682312, "l2_grads": 1.747627854347229, "l2_params": 283.5421142578125, "l2_updates": 0.4440673589706421, "train/loss": 2.470625877380371, "uptime": 12329.879568915001, "examples_seen": 68044800.0, "progress": 0.5901263731872153, "epoch": 53.11157717924361, "img/sec/core": 746.4477403744311, "core_hours_NVIDIA A100-SXM4-40GB": 26.59816496707332, "core_hours": 26.59816496707332} {"step": 66500, "global_schedule": 0.42076459527015686, "l2_grads": 1.800994634628296, "l2_params": 283.454345703125, "l2_updates": 0.4458102285861969, "train/loss": 2.107034683227539, "uptime": 12338.518612201, "examples_seen": 68096000.0, "progress": 0.5905704110902906, "epoch": 53.151540743712566, "img/sec/core": 740.8227726295013, "core_hours_NVIDIA A100-SXM4-40GB": 26.61736284104221, "core_hours": 26.61736284104221} {"step": 66550, "global_schedule": 0.4200088381767273, "l2_grads": 1.7860641479492188, "l2_params": 283.3655700683594, "l2_updates": 0.4480479955673218, "train/loss": 2.034843921661377, "uptime": 12347.596083496, "examples_seen": 68147200.0, "progress": 0.5910144489933661, "epoch": 53.19150430818153, "img/sec/core": 705.0421633968485, "core_hours_NVIDIA A100-SXM4-40GB": 26.63753499947554, "core_hours": 26.63753499947554} {"step": 66600, "global_schedule": 0.41925328969955444, "l2_grads": 1.9117765426635742, "l2_params": 283.27392578125, "l2_updates": 0.4380185604095459, "train/loss": 2.180025100708008, "uptime": 12356.909920660999, "examples_seen": 68198400.0, "progress": 0.5914584868964414, "epoch": 53.231467872650484, "img/sec/core": 687.1496555738954, "core_hours_NVIDIA A100-SXM4-40GB": 26.658232415397762, "core_hours": 26.658232415397762} {"step": 66650, "global_schedule": 0.4184979498386383, "l2_grads": 1.7522249221801758, "l2_params": 283.1805419921875, "l2_updates": 0.4503691792488098, "train/loss": 2.141879081726074, "uptime": 12366.607800925, "examples_seen": 68249600.0, "progress": 0.5919025247995169, "epoch": 53.27143143711944, "img/sec/core": 659.9380303505499, "core_hours_NVIDIA A100-SXM4-40GB": 26.67978326042887, "core_hours": 26.67978326042887} {"step": 66700, "global_schedule": 0.4177427887916565, "l2_grads": 1.6219079494476318, "l2_params": 283.0965270996094, "l2_updates": 0.44012656807899475, "train/loss": 4.004917144775391, "uptime": 12375.423022033001, "examples_seen": 68300800.0, "progress": 0.5923465627025923, "epoch": 53.311395001588394, "img/sec/core": 726.0169565333796, "core_hours_NVIDIA A100-SXM4-40GB": 26.699372640668876, "core_hours": 26.699372640668876} {"step": 66750, "global_schedule": 0.41698792576789856, "l2_grads": 1.807450771331787, "l2_params": 283.0085754394531, "l2_updates": 0.44192758202552795, "train/loss": 2.106719732284546, "uptime": 12384.012415615, "examples_seen": 68352000.0, "progress": 0.5927906006056677, "epoch": 53.35135856605735, "img/sec/core": 745.10498778551, "core_hours_NVIDIA A100-SXM4-40GB": 26.718460181962207, "core_hours": 26.718460181962207} {"step": 66800, "global_schedule": 0.4162331521511078, "l2_grads": 1.9100099802017212, "l2_params": 282.9178771972656, "l2_updates": 0.43443480134010315, "train/loss": 2.0712618827819824, "uptime": 12392.782046636, "examples_seen": 68403200.0, "progress": 0.5932346385087431, "epoch": 53.39132213052631, "img/sec/core": 729.79125172695, "core_hours_NVIDIA A100-SXM4-40GB": 26.737948250897766, "core_hours": 26.737948250897766} {"step": 66850, "global_schedule": 0.41547855734825134, "l2_grads": 1.6894081830978394, "l2_params": 282.82427978515625, "l2_updates": 0.4296998679637909, "train/loss": 3.8230807781219482, "uptime": 12401.567201110001, "examples_seen": 68454400.0, "progress": 0.5936786764118185, "epoch": 53.43128569499527, "img/sec/core": 728.5017035204803, "core_hours_NVIDIA A100-SXM4-40GB": 26.757470816395543, "core_hours": 26.757470816395543} {"step": 66900, "global_schedule": 0.4147241711616516, "l2_grads": 1.848323106765747, "l2_params": 282.73907470703125, "l2_updates": 0.4417897164821625, "train/loss": 2.3171463012695312, "uptime": 12411.243958723999, "examples_seen": 68505600.0, "progress": 0.5941227143148939, "epoch": 53.47124925946422, "img/sec/core": 661.3785583243782, "core_hours_NVIDIA A100-SXM4-40GB": 26.778974722204428, "core_hours": 26.778974722204428} {"step": 66950, "global_schedule": 0.41397011280059814, "l2_grads": 1.6776611804962158, "l2_params": 282.6535949707031, "l2_updates": 0.44003167748451233, "train/loss": 4.430534362792969, "uptime": 12421.089143959, "examples_seen": 68556800.0, "progress": 0.5945667522179693, "epoch": 53.51121282393318, "img/sec/core": 650.0639497616788, "core_hours_NVIDIA A100-SXM4-40GB": 26.80085291161554, "core_hours": 26.80085291161554} {"step": 67000, "global_schedule": 0.41321611404418945, "l2_grads": 1.5994961261749268, "l2_params": 282.56231689453125, "l2_updates": 0.4412795603275299, "train/loss": 4.2732439041137695, "uptime": 12430.455804137002, "examples_seen": 68608000.0, "progress": 0.5950107901210447, "epoch": 53.55117638840213, "img/sec/core": 683.2744946838612, "core_hours_NVIDIA A100-SXM4-40GB": 26.821667712011102, "core_hours": 26.821667712011102} {"step": 67050, "global_schedule": 0.41246238350868225, "l2_grads": 1.810502529144287, "l2_params": 282.4751281738281, "l2_updates": 0.43670111894607544, "train/loss": 2.082655191421509, "uptime": 12440.543581223, "examples_seen": 68659200.0, "progress": 0.5954548280241201, "epoch": 53.591139952871096, "img/sec/core": 696.5737459004736, "core_hours_NVIDIA A100-SXM4-40GB": 26.842085108311096, "core_hours": 26.842085108311096} {"step": 67100, "global_schedule": 0.4117088317871094, "l2_grads": 1.7913329601287842, "l2_params": 282.3752136230469, "l2_updates": 0.4340771436691284, "train/loss": 2.1977882385253906, "uptime": 12449.705683344002, "examples_seen": 68710400.0, "progress": 0.5958988659271955, "epoch": 53.63110351734005, "img/sec/core": 698.5296513264157, "core_hours_NVIDIA A100-SXM4-40GB": 26.862445335246655, "core_hours": 26.862445335246655} {"step": 67150, "global_schedule": 0.41095542907714844, "l2_grads": 1.7314749956130981, "l2_params": 282.28460693359375, "l2_updates": 0.4300495386123657, "train/loss": 4.295117378234863, "uptime": 12459.343365667, "examples_seen": 68761600.0, "progress": 0.596342903830271, "epoch": 53.67106708180901, "img/sec/core": 664.060070202527, "core_hours_NVIDIA A100-SXM4-40GB": 26.88386240707554, "core_hours": 26.88386240707554} {"step": 67200, "global_schedule": 0.41020241379737854, "l2_grads": 1.910962700843811, "l2_params": 282.1925354003906, "l2_updates": 0.4290095567703247, "train/loss": 2.195584297180176, "uptime": 12468.332880779, "examples_seen": 68812800.0, "progress": 0.5967869417333463, "epoch": 53.71103064627796, "img/sec/core": 711.9405129489976, "core_hours_NVIDIA A100-SXM4-40GB": 26.903839107324426, "core_hours": 26.903839107324426} {"step": 67250, "global_schedule": 0.4094494581222534, "l2_grads": 1.7176496982574463, "l2_params": 282.09271240234375, "l2_updates": 0.4365096688270569, "train/loss": 1.9619946479797363, "uptime": 12477.148408946001, "examples_seen": 68864000.0, "progress": 0.5972309796364218, "epoch": 53.75099421074692, "img/sec/core": 725.9916681971812, "core_hours_NVIDIA A100-SXM4-40GB": 26.923429169917764, "core_hours": 26.923429169917764} {"step": 67300, "global_schedule": 0.408696711063385, "l2_grads": 1.6271370649337769, "l2_params": 282.0060729980469, "l2_updates": 0.4312559962272644, "train/loss": 3.828608751296997, "uptime": 12485.730286263, "examples_seen": 68915200.0, "progress": 0.5976750175394971, "epoch": 53.79095777521588, "img/sec/core": 745.757573033878, "core_hours_NVIDIA A100-SXM4-40GB": 26.942500008399982, "core_hours": 26.942500008399982} {"step": 67350, "global_schedule": 0.4079442024230957, "l2_grads": 1.653425693511963, "l2_params": 281.93377685546875, "l2_updates": 0.4275990128517151, "train/loss": 2.830893039703369, "uptime": 12494.586439055, "examples_seen": 68966400.0, "progress": 0.5981190554425726, "epoch": 53.830921339684835, "img/sec/core": 722.6614253744441, "core_hours_NVIDIA A100-SXM4-40GB": 26.96218034793776, "core_hours": 26.96218034793776} {"step": 67400, "global_schedule": 0.4071918725967407, "l2_grads": 1.7458441257476807, "l2_params": 281.8443603515625, "l2_updates": 0.43750864267349243, "train/loss": 2.182955265045166, "uptime": 12503.336714084, "examples_seen": 69017600.0, "progress": 0.598563093345648, "epoch": 53.87088490415379, "img/sec/core": 731.4055819718683, "core_hours_NVIDIA A100-SXM4-40GB": 26.98162540355776, "core_hours": 26.98162540355776} {"step": 67450, "global_schedule": 0.4064399003982544, "l2_grads": 1.825801134109497, "l2_params": 281.75750732421875, "l2_updates": 0.429517924785614, "train/loss": 2.1398985385894775, "uptime": 12512.021443407999, "examples_seen": 69068800.0, "progress": 0.5990071312487234, "epoch": 53.910848468622746, "img/sec/core": 736.9256727799896, "core_hours_NVIDIA A100-SXM4-40GB": 27.000924802055536, "core_hours": 27.000924802055536} {"step": 67500, "global_schedule": 0.4056880474090576, "l2_grads": 1.7964693307876587, "l2_params": 281.66375732421875, "l2_updates": 0.4325694143772125, "train/loss": 2.0537261962890625, "uptime": 12520.685384659, "examples_seen": 69120000.0, "progress": 0.5994511691517987, "epoch": 53.95081203309171, "img/sec/core": 738.6938362792332, "core_hours_NVIDIA A100-SXM4-40GB": 27.02017800483554, "core_hours": 27.02017800483554, "val/acc@1": 0.6943, "val/loss": 1.2439434130859375, "z/secs/eval/val": 2.704806904999714} {"step": 67550, "global_schedule": 0.40493637323379517, "l2_grads": 1.5874383449554443, "l2_params": 281.57159423828125, "l2_updates": 0.4271712303161621, "train/loss": 3.185248613357544, "uptime": 12531.585864319002, "examples_seen": 69171200.0, "progress": 0.5998952070548742, "epoch": 53.99077559756066, "img/sec/core": 781.009580806203, "core_hours_NVIDIA A100-SXM4-40GB": 27.038388053177766, "core_hours": 27.038388053177766} {"step": 67600, "global_schedule": 0.404185026884079, "l2_grads": 1.700709342956543, "l2_params": 281.4886779785156, "l2_updates": 0.42277032136917114, "train/loss": 2.441164016723633, "uptime": 12541.536814417, "examples_seen": 69222400.0, "progress": 0.6003392449579497, "epoch": 54.03073916202962, "img/sec/core": 643.1546673404904, "core_hours_NVIDIA A100-SXM4-40GB": 27.06050127561776, "core_hours": 27.06050127561776} {"step": 67650, "global_schedule": 0.40343379974365234, "l2_grads": 1.9055041074752808, "l2_params": 281.39776611328125, "l2_updates": 0.42851781845092773, "train/loss": 2.046224355697632, "uptime": 12550.751559377999, "examples_seen": 69273600.0, "progress": 0.600783282861025, "epoch": 54.070702726498574, "img/sec/core": 694.5390270797685, "core_hours_NVIDIA A100-SXM4-40GB": 27.080978486642202, "core_hours": 27.080978486642202} {"step": 67700, "global_schedule": 0.402682900428772, "l2_grads": 1.7789806127548218, "l2_params": 281.31768798828125, "l2_updates": 0.4312342405319214, "train/loss": 2.1242098808288574, "uptime": 12559.408676863002, "examples_seen": 69324800.0, "progress": 0.6012273207641005, "epoch": 54.11066629096753, "img/sec/core": 739.2760940447828, "core_hours_NVIDIA A100-SXM4-40GB": 27.100216525497768, "core_hours": 27.100216525497768} {"step": 67750, "global_schedule": 0.4019322097301483, "l2_grads": 1.6289087533950806, "l2_params": 281.2349853515625, "l2_updates": 0.41629573702812195, "train/loss": 3.4042367935180664, "uptime": 12568.031486858, "examples_seen": 69376000.0, "progress": 0.6016713586671758, "epoch": 54.15062985543649, "img/sec/core": 742.2174446279317, "core_hours_NVIDIA A100-SXM4-40GB": 27.11937832548665, "core_hours": 27.11937832548665} {"step": 67800, "global_schedule": 0.401181697845459, "l2_grads": 1.8005650043487549, "l2_params": 281.1326599121094, "l2_updates": 0.416263610124588, "train/loss": 3.354412794113159, "uptime": 12577.049379445, "examples_seen": 69427200.0, "progress": 0.6021153965702513, "epoch": 54.19059341990545, "img/sec/core": 709.7001808634388, "core_hours_NVIDIA A100-SXM4-40GB": 27.13941808679109, "core_hours": 27.13941808679109} {"step": 67850, "global_schedule": 0.40043139457702637, "l2_grads": 1.7710983753204346, "l2_params": 281.03759765625, "l2_updates": 0.43320322036743164, "train/loss": 2.0695202350616455, "uptime": 12585.595340807, "examples_seen": 69478400.0, "progress": 0.6025594344733266, "epoch": 54.2305569843744, "img/sec/core": 748.8917547015241, "core_hours_NVIDIA A100-SXM4-40GB": 27.15840911203998, "core_hours": 27.15840911203998} {"step": 67900, "global_schedule": 0.39968132972717285, "l2_grads": 1.7344822883605957, "l2_params": 280.9579772949219, "l2_updates": 0.42233073711395264, "train/loss": 4.539651870727539, "uptime": 12594.247442427999, "examples_seen": 69529600.0, "progress": 0.6030034723764021, "epoch": 54.27052054884336, "img/sec/core": 739.7046729625698, "core_hours_NVIDIA A100-SXM4-40GB": 27.17763600453109, "core_hours": 27.17763600453109} {"step": 67950, "global_schedule": 0.3989316523075104, "l2_grads": 1.7615888118743896, "l2_params": 280.8518981933594, "l2_updates": 0.42166727781295776, "train/loss": 2.417410373687744, "uptime": 12603.885106961001, "examples_seen": 69580800.0, "progress": 0.6034475102794774, "epoch": 54.31048411331231, "img/sec/core": 664.0612959794025, "core_hours_NVIDIA A100-SXM4-40GB": 27.199053036826648, "core_hours": 27.199053036826648} {"step": 68000, "global_schedule": 0.39818206429481506, "l2_grads": 1.726137399673462, "l2_params": 280.77239990234375, "l2_updates": 0.41347846388816833, "train/loss": 4.357414245605469, "uptime": 12613.670881583, "examples_seen": 69632000.0, "progress": 0.6038915481825529, "epoch": 54.350447677781276, "img/sec/core": 654.0105660733225, "core_hours_NVIDIA A100-SXM4-40GB": 27.220799202653318, "core_hours": 27.220799202653318} {"step": 68050, "global_schedule": 0.39743271470069885, "l2_grads": 1.646644949913025, "l2_params": 280.683837890625, "l2_updates": 0.42454126477241516, "train/loss": 4.171911239624023, "uptime": 12623.638197437, "examples_seen": 69683200.0, "progress": 0.6043355860856283, "epoch": 54.39041124225023, "img/sec/core": 689.629571179265, "core_hours_NVIDIA A100-SXM4-40GB": 27.241422190437763, "core_hours": 27.241422190437763} {"step": 68100, "global_schedule": 0.39668363332748413, "l2_grads": 1.852604866027832, "l2_params": 280.58966064453125, "l2_updates": 0.42044469714164734, "train/loss": 2.019975423812866, "uptime": 12632.663736003002, "examples_seen": 69734400.0, "progress": 0.6047796239887037, "epoch": 54.430374806719186, "img/sec/core": 709.0989588264458, "core_hours_NVIDIA A100-SXM4-40GB": 27.261478942806654, "core_hours": 27.261478942806654} {"step": 68150, "global_schedule": 0.3959348201751709, "l2_grads": 1.6425349712371826, "l2_params": 280.50311279296875, "l2_updates": 0.414885550737381, "train/loss": 4.072420120239258, "uptime": 12641.338606309999, "examples_seen": 69785600.0, "progress": 0.6052236618917791, "epoch": 54.47033837118814, "img/sec/core": 737.7631910920725, "core_hours_NVIDIA A100-SXM4-40GB": 27.28075643237776, "core_hours": 27.28075643237776} {"step": 68200, "global_schedule": 0.39518624544143677, "l2_grads": 2.003324508666992, "l2_params": 280.409912109375, "l2_updates": 0.41300103068351746, "train/loss": 2.045823574066162, "uptime": 12649.992314748002, "examples_seen": 69836800.0, "progress": 0.6056676997948545, "epoch": 54.5103019356571, "img/sec/core": 739.5673249047708, "core_hours_NVIDIA A100-SXM4-40GB": 27.299986895573323, "core_hours": 27.299986895573323} {"step": 68250, "global_schedule": 0.39443787932395935, "l2_grads": 1.600383996963501, "l2_params": 280.3221130371094, "l2_updates": 0.4180936813354492, "train/loss": 3.5892679691314697, "uptime": 12658.740332897001, "examples_seen": 69888000.0, "progress": 0.6061117376979299, "epoch": 54.55026550012606, "img/sec/core": 731.5942755253939, "core_hours_NVIDIA A100-SXM4-40GB": 27.319426935904435, "core_hours": 27.319426935904435} {"step": 68300, "global_schedule": 0.3936898112297058, "l2_grads": 1.8163294792175293, "l2_params": 280.23114013671875, "l2_updates": 0.42090803384780884, "train/loss": 2.184225082397461, "uptime": 12667.457774354001, "examples_seen": 69939200.0, "progress": 0.6065557756010053, "epoch": 54.590229064595015, "img/sec/core": 734.1603647777771, "core_hours_NVIDIA A100-SXM4-40GB": 27.338799028031097, "core_hours": 27.338799028031097} {"step": 68350, "global_schedule": 0.392941951751709, "l2_grads": 1.8005417585372925, "l2_params": 280.1493835449219, "l2_updates": 0.41762611269950867, "train/loss": 2.42037034034729, "uptime": 12675.934581583, "examples_seen": 69990400.0, "progress": 0.6069998135040807, "epoch": 54.63019262906397, "img/sec/core": 755.0012436410913, "core_hours_NVIDIA A100-SXM4-40GB": 27.357636377428875, "core_hours": 27.357636377428875} {"step": 68400, "global_schedule": 0.3921944499015808, "l2_grads": 1.799272060394287, "l2_params": 280.04986572265625, "l2_updates": 0.4221642315387726, "train/loss": 2.136491298675537, "uptime": 12684.602003101, "examples_seen": 70041600.0, "progress": 0.6074438514071561, "epoch": 54.670156193532925, "img/sec/core": 738.3972253696743, "core_hours_NVIDIA A100-SXM4-40GB": 27.37689731413554, "core_hours": 27.37689731413554} {"step": 68450, "global_schedule": 0.3914470672607422, "l2_grads": 1.8004673719406128, "l2_params": 279.96966552734375, "l2_updates": 0.4088169038295746, "train/loss": 4.314343452453613, "uptime": 12693.113522228, "examples_seen": 70092800.0, "progress": 0.6078878893102315, "epoch": 54.71011975800189, "img/sec/core": 751.9221779925228, "core_hours_NVIDIA A100-SXM4-40GB": 27.39581180108443, "core_hours": 27.39581180108443} {"step": 68500, "global_schedule": 0.39069995284080505, "l2_grads": 1.769273042678833, "l2_params": 279.8828430175781, "l2_updates": 0.421127051115036, "train/loss": 2.140737295150757, "uptime": 12702.093772608, "examples_seen": 70144000.0, "progress": 0.608331927213307, "epoch": 54.75008332247084, "img/sec/core": 712.6750067297338, "core_hours_NVIDIA A100-SXM4-40GB": 27.415767913039982, "core_hours": 27.415767913039982} {"step": 68550, "global_schedule": 0.389953076839447, "l2_grads": 1.67966628074646, "l2_params": 279.7850646972656, "l2_updates": 0.4104534387588501, "train/loss": 4.3508620262146, "uptime": 12710.826554315, "examples_seen": 70195200.0, "progress": 0.6087759651163823, "epoch": 54.7900468869398, "img/sec/core": 732.8707180290486, "core_hours_NVIDIA A100-SXM4-40GB": 27.435174094611096, "core_hours": 27.435174094611096} {"step": 68600, "global_schedule": 0.38920649886131287, "l2_grads": 1.8026460409164429, "l2_params": 279.69329833984375, "l2_updates": 0.4101168215274811, "train/loss": 1.9240854978561401, "uptime": 12719.873405698001, "examples_seen": 70246400.0, "progress": 0.6092200030194578, "epoch": 54.830010451408754, "img/sec/core": 707.428444334227, "core_hours_NVIDIA A100-SXM4-40GB": 27.455278208795544, "core_hours": 27.455278208795544} {"step": 68650, "global_schedule": 0.38846027851104736, "l2_grads": 1.832720160484314, "l2_params": 279.5936279296875, "l2_updates": 0.41463473439216614, "train/loss": 2.191143751144409, "uptime": 12728.406298135002, "examples_seen": 70297600.0, "progress": 0.6096640409225331, "epoch": 54.86997401587771, "img/sec/core": 750.0387526565024, "core_hours_NVIDIA A100-SXM4-40GB": 27.474240191988876, "core_hours": 27.474240191988876} {"step": 68700, "global_schedule": 0.3877141773700714, "l2_grads": 1.8244789838790894, "l2_params": 279.5091552734375, "l2_updates": 0.4113408029079437, "train/loss": 2.0105366706848145, "uptime": 12737.569321919002, "examples_seen": 70348800.0, "progress": 0.6101080788256086, "epoch": 54.90993758034667, "img/sec/core": 698.4593897022703, "core_hours_NVIDIA A100-SXM4-40GB": 27.494602467064436, "core_hours": 27.494602467064436} {"step": 68750, "global_schedule": 0.38696837425231934, "l2_grads": 1.8015189170837402, "l2_params": 279.412353515625, "l2_updates": 0.40738213062286377, "train/loss": 2.0173423290252686, "uptime": 12747.180914296, "examples_seen": 70400000.0, "progress": 0.6105521167286839, "epoch": 54.94990114481563, "img/sec/core": 665.8626114145719, "core_hours_NVIDIA A100-SXM4-40GB": 27.51596156123554, "core_hours": 27.51596156123554} {"step": 68800, "global_schedule": 0.38622280955314636, "l2_grads": 1.743340253829956, "l2_params": 279.3265075683594, "l2_updates": 0.40934741497039795, "train/loss": 4.141500473022461, "uptime": 12756.331782796, "examples_seen": 70451200.0, "progress": 0.6109961546317594, "epoch": 54.98986470928458, "img/sec/core": 699.3871674584158, "core_hours_NVIDIA A100-SXM4-40GB": 27.536296824568872, "core_hours": 27.536296824568872} {"step": 68850, "global_schedule": 0.38547760248184204, "l2_grads": 1.8964871168136597, "l2_params": 279.2398376464844, "l2_updates": 0.407662957906723, "train/loss": 2.0683140754699707, "uptime": 12765.779649028, "examples_seen": 70502400.0, "progress": 0.6114401925348347, "epoch": 55.02982827375354, "img/sec/core": 677.4016315264166, "core_hours_NVIDIA A100-SXM4-40GB": 27.557292082862208, "core_hours": 27.557292082862208} {"step": 68900, "global_schedule": 0.3847326338291168, "l2_grads": 1.795406460762024, "l2_params": 279.1517028808594, "l2_updates": 0.40473830699920654, "train/loss": 2.192089319229126, "uptime": 12775.260011156, "examples_seen": 70553600.0, "progress": 0.6118842304379102, "epoch": 55.06979183822249, "img/sec/core": 675.0796977572504, "core_hours_NVIDIA A100-SXM4-40GB": 27.578359554257762, "core_hours": 27.578359554257762} {"step": 68950, "global_schedule": 0.3839879333972931, "l2_grads": 1.7110085487365723, "l2_params": 279.06683349609375, "l2_updates": 0.40478697419166565, "train/loss": 4.09429407119751, "uptime": 12784.658174434002, "examples_seen": 70604800.0, "progress": 0.6123282683409856, "epoch": 55.109755402691455, "img/sec/core": 680.984125374866, "core_hours_NVIDIA A100-SXM4-40GB": 27.599244361542212, "core_hours": 27.599244361542212} {"step": 69000, "global_schedule": 0.38324347138404846, "l2_grads": 1.725740909576416, "l2_params": 278.9742431640625, "l2_updates": 0.40546759963035583, "train/loss": 3.090743064880371, "uptime": 12793.81811757, "examples_seen": 70656000.0, "progress": 0.612772306244061, "epoch": 55.14971896716041, "img/sec/core": 698.6942937286243, "core_hours_NVIDIA A100-SXM4-40GB": 27.619599790733318, "core_hours": 27.619599790733318} {"step": 69050, "global_schedule": 0.38249924778938293, "l2_grads": 1.564782738685608, "l2_params": 278.8865966796875, "l2_updates": 0.4075380265712738, "train/loss": 3.202540159225464, "uptime": 12802.788891022, "examples_seen": 70707200.0, "progress": 0.6132163441471364, "epoch": 55.189682531629366, "img/sec/core": 772.6404556135002, "core_hours_NVIDIA A100-SXM4-40GB": 27.638007087579982, "core_hours": 27.638007087579982} {"step": 69100, "global_schedule": 0.3817553222179413, "l2_grads": 1.997327446937561, "l2_params": 278.798095703125, "l2_updates": 0.40361565351486206, "train/loss": 2.195157289505005, "uptime": 12811.891122808001, "examples_seen": 70758400.0, "progress": 0.6136603820502118, "epoch": 55.22964609609832, "img/sec/core": 703.1242612216596, "core_hours_NVIDIA A100-SXM4-40GB": 27.658234269326652, "core_hours": 27.658234269326652} {"step": 69150, "global_schedule": 0.3810117840766907, "l2_grads": 1.877076268196106, "l2_params": 278.7073059082031, "l2_updates": 0.4021584987640381, "train/loss": 1.9681941270828247, "uptime": 12820.741704854, "examples_seen": 70809600.0, "progress": 0.6141044199532872, "epoch": 55.269609660567276, "img/sec/core": 723.1162839616983, "core_hours_NVIDIA A100-SXM4-40GB": 27.67790222942887, "core_hours": 27.67790222942887} {"step": 69200, "global_schedule": 0.3802684247493744, "l2_grads": 1.8151297569274902, "l2_params": 278.6225280761719, "l2_updates": 0.4075155258178711, "train/loss": 2.1048359870910645, "uptime": 12829.46051984, "examples_seen": 70860800.0, "progress": 0.6145484578563626, "epoch": 55.30957322503624, "img/sec/core": 734.0447079420449, "core_hours_NVIDIA A100-SXM4-40GB": 27.697277373842205, "core_hours": 27.697277373842205} {"step": 69250, "global_schedule": 0.3795253336429596, "l2_grads": 1.7722270488739014, "l2_params": 278.5299072265625, "l2_updates": 0.4055575728416443, "train/loss": 1.9978935718536377, "uptime": 12838.952608761001, "examples_seen": 70912000.0, "progress": 0.614992495759438, "epoch": 55.349536789505194, "img/sec/core": 674.2456853559787, "core_hours_NVIDIA A100-SXM4-40GB": 27.718370904777764, "core_hours": 27.718370904777764} {"step": 69300, "global_schedule": 0.3787825405597687, "l2_grads": 1.7259883880615234, "l2_params": 278.44232177734375, "l2_updates": 0.40791356563568115, "train/loss": 2.0525312423706055, "uptime": 12847.646314847001, "examples_seen": 70963200.0, "progress": 0.6154365336625134, "epoch": 55.38950035397415, "img/sec/core": 736.1647537528663, "core_hours_NVIDIA A100-SXM4-40GB": 27.737690251635538, "core_hours": 27.737690251635538} {"step": 69350, "global_schedule": 0.37804001569747925, "l2_grads": 1.6320749521255493, "l2_params": 278.35791015625, "l2_updates": 0.3993804156780243, "train/loss": 3.5486252307891846, "uptime": 12856.368017634, "examples_seen": 71014400.0, "progress": 0.6158805715655888, "epoch": 55.429463918443105, "img/sec/core": 733.8016619346381, "core_hours_NVIDIA A100-SXM4-40GB": 27.757071813384428, "core_hours": 27.757071813384428} {"step": 69400, "global_schedule": 0.37729787826538086, "l2_grads": 2.0040807723999023, "l2_params": 278.2626037597656, "l2_updates": 0.3951523005962372, "train/loss": 2.0293691158294678, "uptime": 12865.131688204, "examples_seen": 71065600.0, "progress": 0.6163246094686643, "epoch": 55.46942748291207, "img/sec/core": 730.2876059615372, "core_hours_NVIDIA A100-SXM4-40GB": 27.776546636873313, "core_hours": 27.776546636873313} {"step": 69450, "global_schedule": 0.3765559196472168, "l2_grads": 1.8968912363052368, "l2_params": 278.17901611328125, "l2_updates": 0.4023352265357971, "train/loss": 2.050996780395508, "uptime": 12873.700339822002, "examples_seen": 71116800.0, "progress": 0.6167686473717396, "epoch": 55.50939104738102, "img/sec/core": 746.9086485618529, "core_hours_NVIDIA A100-SXM4-40GB": 27.795588084913323, "core_hours": 27.795588084913323} {"step": 69500, "global_schedule": 0.3758143186569214, "l2_grads": 1.8086297512054443, "l2_params": 278.08856201171875, "l2_updates": 0.398031622171402, "train/loss": 4.5234527587890625, "uptime": 12882.463355378002, "examples_seen": 71168000.0, "progress": 0.6172126852748151, "epoch": 55.54935461184998, "img/sec/core": 730.3421931754905, "core_hours_NVIDIA A100-SXM4-40GB": 27.81506145281554, "core_hours": 27.81506145281554} {"step": 69550, "global_schedule": 0.3750729560852051, "l2_grads": 1.9777491092681885, "l2_params": 277.9996032714844, "l2_updates": 0.3904946744441986, "train/loss": 2.1176886558532715, "uptime": 12891.313250500001, "examples_seen": 71219200.0, "progress": 0.6176567231778904, "epoch": 55.58931817631893, "img/sec/core": 723.1724118505011, "core_hours_NVIDIA A100-SXM4-40GB": 27.834727886419987, "core_hours": 27.834727886419987} {"step": 69600, "global_schedule": 0.3743319511413574, "l2_grads": 1.7511707544326782, "l2_params": 277.91668701171875, "l2_updates": 0.39824116230010986, "train/loss": 4.477716445922852, "uptime": 12900.022929517001, "examples_seen": 71270400.0, "progress": 0.6181007610809659, "epoch": 55.62928174078789, "img/sec/core": 734.8146800253195, "core_hours_NVIDIA A100-SXM4-40GB": 27.854082728679984, "core_hours": 27.854082728679984} {"step": 69650, "global_schedule": 0.37359121441841125, "l2_grads": 1.7160515785217285, "l2_params": 277.821533203125, "l2_updates": 0.3988970220088959, "train/loss": 3.1881625652313232, "uptime": 12908.625694281001, "examples_seen": 71321600.0, "progress": 0.6185447989840412, "epoch": 55.66924530525685, "img/sec/core": 743.9468793546297, "core_hours_NVIDIA A100-SXM4-40GB": 27.873199983711096, "core_hours": 27.873199983711096} {"step": 69700, "global_schedule": 0.3728507161140442, "l2_grads": 1.9482216835021973, "l2_params": 277.73077392578125, "l2_updates": 0.3913937211036682, "train/loss": 2.0529165267944336, "uptime": 12918.357166294, "examples_seen": 71372800.0, "progress": 0.6189888368871167, "epoch": 55.709208869725806, "img/sec/core": 657.660011913074, "core_hours_NVIDIA A100-SXM4-40GB": 27.894825477073315, "core_hours": 27.894825477073315} {"step": 69750, "global_schedule": 0.3721105456352234, "l2_grads": 1.736875057220459, "l2_params": 277.6436462402344, "l2_updates": 0.3914230763912201, "train/loss": 4.078206539154053, "uptime": 12927.226827607, "examples_seen": 71424000.0, "progress": 0.619432874790192, "epoch": 55.74917243419476, "img/sec/core": 721.5608098382165, "core_hours_NVIDIA A100-SXM4-40GB": 27.91453583554665, "core_hours": 27.91453583554665} {"step": 69800, "global_schedule": 0.37137067317962646, "l2_grads": 1.6602919101715088, "l2_params": 277.551025390625, "l2_updates": 0.3927270174026489, "train/loss": 2.5316147804260254, "uptime": 12935.947350402, "examples_seen": 71475200.0, "progress": 0.6198769126932675, "epoch": 55.78913599866372, "img/sec/core": 733.9009541571995, "core_hours_NVIDIA A100-SXM4-40GB": 27.933914775091093, "core_hours": 27.933914775091093} {"step": 69850, "global_schedule": 0.3706311881542206, "l2_grads": 1.6861995458602905, "l2_params": 277.4670715332031, "l2_updates": 0.3901733458042145, "train/loss": 3.2432491779327393, "uptime": 12944.659284160001, "examples_seen": 71526400.0, "progress": 0.620320950596343, "epoch": 55.82909956313267, "img/sec/core": 734.6245021804158, "core_hours_NVIDIA A100-SXM4-40GB": 27.95327462788665, "core_hours": 27.95327462788665} {"step": 69900, "global_schedule": 0.369891881942749, "l2_grads": 1.737028956413269, "l2_params": 277.36700439453125, "l2_updates": 0.39128488302230835, "train/loss": 2.4939141273498535, "uptime": 12953.408925247999, "examples_seen": 71577600.0, "progress": 0.6207649884994183, "epoch": 55.869063127601635, "img/sec/core": 731.4585747727717, "core_hours_NVIDIA A100-SXM4-40GB": 27.972718274748868, "core_hours": 27.972718274748868} {"step": 69950, "global_schedule": 0.36915290355682373, "l2_grads": 1.8413187265396118, "l2_params": 277.2734069824219, "l2_updates": 0.39412721991539, "train/loss": 2.127910614013672, "uptime": 12962.090685762001, "examples_seen": 71628800.0, "progress": 0.6212090264024938, "epoch": 55.90902669207059, "img/sec/core": 737.1776714731839, "core_hours_NVIDIA A100-SXM4-40GB": 27.992011075891096, "core_hours": 27.992011075891096} {"step": 70000, "global_schedule": 0.3684142529964447, "l2_grads": 1.6829928159713745, "l2_params": 277.1761474609375, "l2_updates": 0.39330586791038513, "train/loss": 2.736626625061035, "uptime": 12970.844278224, "examples_seen": 71680000.0, "progress": 0.6216530643055691, "epoch": 55.948990256539545, "img/sec/core": 731.1283941745943, "core_hours_NVIDIA A100-SXM4-40GB": 28.011463503584427, "core_hours": 28.011463503584427, "val/acc@1": 0.69946, "val/loss": 1.2172532580566406, "z/secs/eval/val": 2.6555571050012077} {"step": 70050, "global_schedule": 0.3676759600639343, "l2_grads": 1.8637853860855103, "l2_params": 277.0935363769531, "l2_updates": 0.38692620396614075, "train/loss": 4.134464263916016, "uptime": 12983.326153802, "examples_seen": 71731200.0, "progress": 0.6220971022086446, "epoch": 55.9889538210085, "img/sec/core": 724.8251953743274, "core_hours_NVIDIA A100-SXM4-40GB": 28.03108509277998, "core_hours": 28.03108509277998} {"step": 70100, "global_schedule": 0.36693793535232544, "l2_grads": 1.8216803073883057, "l2_params": 277.0052795410156, "l2_updates": 0.40011176466941833, "train/loss": 2.043478488922119, "uptime": 12993.426232608, "examples_seen": 71782400.0, "progress": 0.6225411401117199, "epoch": 56.028917385477456, "img/sec/core": 633.6584221696803, "core_hours_NVIDIA A100-SXM4-40GB": 28.05352971234887, "core_hours": 28.05352971234887} {"step": 70150, "global_schedule": 0.36620020866394043, "l2_grads": 1.7405788898468018, "l2_params": 276.9267578125, "l2_updates": 0.3889901041984558, "train/loss": 2.6317620277404785, "uptime": 13002.58525917, "examples_seen": 71833600.0, "progress": 0.6229851780147954, "epoch": 56.06888094994642, "img/sec/core": 698.7642143711204, "core_hours_NVIDIA A100-SXM4-40GB": 28.073883104708873, "core_hours": 28.073883104708873} {"step": 70200, "global_schedule": 0.3654628396034241, "l2_grads": 1.766477346420288, "l2_params": 276.8427734375, "l2_updates": 0.39375537633895874, "train/loss": 2.143489122390747, "uptime": 13011.806336543, "examples_seen": 71884800.0, "progress": 0.6234292159178707, "epoch": 56.108844514415374, "img/sec/core": 694.0620646714741, "core_hours_NVIDIA A100-SXM4-40GB": 28.09437438775998, "core_hours": 28.09437438775998} {"step": 70250, "global_schedule": 0.3647257089614868, "l2_grads": 1.8653262853622437, "l2_params": 276.7591857910156, "l2_updates": 0.38894718885421753, "train/loss": 2.0374560356140137, "uptime": 13020.921300966, "examples_seen": 71936000.0, "progress": 0.6238732538209462, "epoch": 56.14880807888433, "img/sec/core": 702.1420713230003, "core_hours_NVIDIA A100-SXM4-40GB": 28.114629864255537, "core_hours": 28.114629864255537} {"step": 70300, "global_schedule": 0.3639889359474182, "l2_grads": 1.7734202146530151, "l2_params": 276.6648864746094, "l2_updates": 0.39175504446029663, "train/loss": 1.9308593273162842, "uptime": 13030.183975941001, "examples_seen": 71987200.0, "progress": 0.6243172917240216, "epoch": 56.188771643353284, "img/sec/core": 690.9451122135388, "core_hours_NVIDIA A100-SXM4-40GB": 28.135213586422207, "core_hours": 28.135213586422207} {"step": 70350, "global_schedule": 0.36325258016586304, "l2_grads": 1.7532191276550293, "l2_params": 276.5800476074219, "l2_updates": 0.3809680938720703, "train/loss": 2.6214537620544434, "uptime": 13039.143784407, "examples_seen": 72038400.0, "progress": 0.624761329627097, "epoch": 56.22873520782224, "img/sec/core": 714.300983585395, "core_hours_NVIDIA A100-SXM4-40GB": 28.155124271902203, "core_hours": 28.155124271902203} {"step": 70400, "global_schedule": 0.3625164031982422, "l2_grads": 1.9857672452926636, "l2_params": 276.4797668457031, "l2_updates": 0.3850158751010895, "train/loss": 2.0653369426727295, "uptime": 13047.778011725002, "examples_seen": 72089600.0, "progress": 0.6252053675301724, "epoch": 56.2686987722912, "img/sec/core": 741.23598606867, "core_hours_NVIDIA A100-SXM4-40GB": 28.174311443719986, "core_hours": 28.174311443719986} {"step": 70450, "global_schedule": 0.36178058385849, "l2_grads": 1.8820879459381104, "l2_params": 276.3938903808594, "l2_updates": 0.3856833875179291, "train/loss": 1.9910807609558105, "uptime": 13057.205739859002, "examples_seen": 72140800.0, "progress": 0.6256494054332478, "epoch": 56.30866233676016, "img/sec/core": 678.8485952325148, "core_hours_NVIDIA A100-SXM4-40GB": 28.19526195068443, "core_hours": 28.19526195068443} {"step": 70500, "global_schedule": 0.36104506254196167, "l2_grads": 1.7672284841537476, "l2_params": 276.3042297363281, "l2_updates": 0.3863987326622009, "train/loss": 1.907996416091919, "uptime": 13066.869447455001, "examples_seen": 72192000.0, "progress": 0.6260934433363232, "epoch": 56.34862590122911, "img/sec/core": 662.2716940079854, "core_hours_NVIDIA A100-SXM4-40GB": 28.21673685645332, "core_hours": 28.21673685645332} {"step": 70550, "global_schedule": 0.360309898853302, "l2_grads": 1.948943853378296, "l2_params": 276.2126159667969, "l2_updates": 0.3820798993110657, "train/loss": 2.0283305644989014, "uptime": 13076.375606908, "examples_seen": 72243200.0, "progress": 0.6265374812393986, "epoch": 56.38858946569807, "img/sec/core": 673.24770130819, "core_hours_NVIDIA A100-SXM4-40GB": 28.237861655237754, "core_hours": 28.237861655237754} {"step": 70600, "global_schedule": 0.35957515239715576, "l2_grads": 1.7892171144485474, "l2_params": 276.1358947753906, "l2_updates": 0.37943434715270996, "train/loss": 2.9679603576660156, "uptime": 13085.393113812, "examples_seen": 72294400.0, "progress": 0.626981519142474, "epoch": 56.42855303016703, "img/sec/core": 709.7305350728391, "core_hours_NVIDIA A100-SXM4-40GB": 28.25790055946887, "core_hours": 28.25790055946887} {"step": 70650, "global_schedule": 0.35884061455726624, "l2_grads": 1.9675865173339844, "l2_params": 276.0417175292969, "l2_updates": 0.37583500146865845, "train/loss": 1.959899663925171, "uptime": 13094.150721724001, "examples_seen": 72345600.0, "progress": 0.6274255570455494, "epoch": 56.468516594635986, "img/sec/core": 730.7931645615101, "core_hours_NVIDIA A100-SXM4-40GB": 28.277361910384432, "core_hours": 28.277361910384432} {"step": 70700, "global_schedule": 0.35810643434524536, "l2_grads": 1.8472905158996582, "l2_params": 275.9469299316406, "l2_updates": 0.37910744547843933, "train/loss": 1.964661955833435, "uptime": 13102.759398201999, "examples_seen": 72396800.0, "progress": 0.6278695949486248, "epoch": 56.50848015910494, "img/sec/core": 743.4359992918129, "core_hours_NVIDIA A100-SXM4-40GB": 28.296492302557755, "core_hours": 28.296492302557755} {"step": 70750, "global_schedule": 0.35737261176109314, "l2_grads": 1.9701385498046875, "l2_params": 275.8583068847656, "l2_updates": 0.38142600655555725, "train/loss": 1.9693711996078491, "uptime": 13111.444083366, "examples_seen": 72448000.0, "progress": 0.6283136328517002, "epoch": 56.5484437235739, "img/sec/core": 736.9294199091142, "core_hours_NVIDIA A100-SXM4-40GB": 28.315791602922204, "core_hours": 28.315791602922204} {"step": 70800, "global_schedule": 0.35663914680480957, "l2_grads": 1.8594406843185425, "l2_params": 275.7725830078125, "l2_updates": 0.38262173533439636, "train/loss": 2.073606014251709, "uptime": 13120.971970437002, "examples_seen": 72499200.0, "progress": 0.6287576707547756, "epoch": 56.58840728804285, "img/sec/core": 671.7124113989446, "core_hours_NVIDIA A100-SXM4-40GB": 28.33696468530221, "core_hours": 28.33696468530221} {"step": 70850, "global_schedule": 0.35590600967407227, "l2_grads": 2.0667052268981934, "l2_params": 275.68560791015625, "l2_updates": 0.37236592173576355, "train/loss": 1.965219497680664, "uptime": 13129.737388643001, "examples_seen": 72550400.0, "progress": 0.6292017086578511, "epoch": 56.628370852511814, "img/sec/core": 730.1420023085087, "core_hours_NVIDIA A100-SXM4-40GB": 28.356443392426648, "core_hours": 28.356443392426648} {"step": 70900, "global_schedule": 0.35517317056655884, "l2_grads": 1.9944889545440674, "l2_params": 275.5975646972656, "l2_updates": 0.384432852268219, "train/loss": 1.9972678422927856, "uptime": 13138.833427927, "examples_seen": 72601600.0, "progress": 0.6296457465609264, "epoch": 56.66833441698077, "img/sec/core": 703.6029419154409, "core_hours_NVIDIA A100-SXM4-40GB": 28.37665681305776, "core_hours": 28.37665681305776} {"step": 70950, "global_schedule": 0.3544406294822693, "l2_grads": 1.8672372102737427, "l2_params": 275.5119934082031, "l2_updates": 0.3814842104911804, "train/loss": 1.966841697692871, "uptime": 13147.575016745, "examples_seen": 72652800.0, "progress": 0.6300897844640019, "epoch": 56.708297981449725, "img/sec/core": 732.1323541118053, "core_hours_NVIDIA A100-SXM4-40GB": 28.39608256598665, "core_hours": 28.39608256598665} {"step": 71000, "global_schedule": 0.3537084460258484, "l2_grads": 1.9133132696151733, "l2_params": 275.4203186035156, "l2_updates": 0.37478554248809814, "train/loss": 2.0195281505584717, "uptime": 13156.862738566999, "examples_seen": 72704000.0, "progress": 0.6305338223670772, "epoch": 56.74826154591868, "img/sec/core": 689.0817923552995, "core_hours_NVIDIA A100-SXM4-40GB": 28.41672194781331, "core_hours": 28.41672194781331} {"step": 71050, "global_schedule": 0.3529767394065857, "l2_grads": 1.6217269897460938, "l2_params": 275.33026123046875, "l2_updates": 0.3769034445285797, "train/loss": 3.2961575984954834, "uptime": 13166.993238139, "examples_seen": 72755200.0, "progress": 0.6309778602701527, "epoch": 56.788225110387636, "img/sec/core": 701.3223693860102, "core_hours_NVIDIA A100-SXM4-40GB": 28.437001098804423, "core_hours": 28.437001098804423} {"step": 71100, "global_schedule": 0.3522452712059021, "l2_grads": 1.8286043405532837, "l2_params": 275.2432556152344, "l2_updates": 0.3730210065841675, "train/loss": 2.90816068649292, "uptime": 13176.674501885, "examples_seen": 72806400.0, "progress": 0.631421898173228, "epoch": 56.8281886748566, "img/sec/core": 661.0707205084693, "core_hours_NVIDIA A100-SXM4-40GB": 28.458515018239975, "core_hours": 28.458515018239975} {"step": 71150, "global_schedule": 0.3515141010284424, "l2_grads": 1.8710227012634277, "l2_params": 275.1488342285156, "l2_updates": 0.37095555663108826, "train/loss": 1.9014129638671875, "uptime": 13186.251791592002, "examples_seen": 72857600.0, "progress": 0.6318659360763035, "epoch": 56.86815223932555, "img/sec/core": 668.247510078033, "core_hours_NVIDIA A100-SXM4-40GB": 28.479797884255536, "core_hours": 28.479797884255536} {"step": 71200, "global_schedule": 0.3507833182811737, "l2_grads": 1.8027442693710327, "l2_params": 275.0584411621094, "l2_updates": 0.3714371621608734, "train/loss": 2.1363213062286377, "uptime": 13195.809153212, "examples_seen": 72908800.0, "progress": 0.6323099739793788, "epoch": 56.90811580379451, "img/sec/core": 669.640875218998, "core_hours_NVIDIA A100-SXM4-40GB": 28.50103646563331, "core_hours": 28.50103646563331} {"step": 71250, "global_schedule": 0.3500528931617737, "l2_grads": 1.7325043678283691, "l2_params": 274.9706726074219, "l2_updates": 0.37182363867759705, "train/loss": 2.601119041442871, "uptime": 13205.129582854, "examples_seen": 72960000.0, "progress": 0.6327540118824543, "epoch": 56.948079368263464, "img/sec/core": 686.6636245135703, "core_hours_NVIDIA A100-SXM4-40GB": 28.52174853150442, "core_hours": 28.52174853150442} {"step": 71300, "global_schedule": 0.3493229150772095, "l2_grads": 1.6593821048736572, "l2_params": 274.8778381347656, "l2_updates": 0.37282541394233704, "train/loss": 3.1845428943634033, "uptime": 13213.808106373, "examples_seen": 73011200.0, "progress": 0.6331980497855297, "epoch": 56.98804293273242, "img/sec/core": 737.4526307370595, "core_hours_NVIDIA A100-SXM4-40GB": 28.541034139324424, "core_hours": 28.541034139324424} {"step": 71350, "global_schedule": 0.34859317541122437, "l2_grads": 1.8524669408798218, "l2_params": 274.78424072265625, "l2_updates": 0.3735615313053131, "train/loss": 2.065863609313965, "uptime": 13223.696167804, "examples_seen": 73062400.0, "progress": 0.6336420876886051, "epoch": 57.02800649720138, "img/sec/core": 647.2451698100638, "core_hours_NVIDIA A100-SXM4-40GB": 28.56300760917109, "core_hours": 28.56300760917109} {"step": 71400, "global_schedule": 0.3478638231754303, "l2_grads": 1.9022668600082397, "l2_params": 274.7049560546875, "l2_updates": 0.3656359016895294, "train/loss": 3.12876033782959, "uptime": 13232.977929875002, "examples_seen": 73113600.0, "progress": 0.6340861255916805, "epoch": 57.06797006167034, "img/sec/core": 689.5242466939998, "core_hours_NVIDIA A100-SXM4-40GB": 28.58363374710665, "core_hours": 28.58363374710665} {"step": 71450, "global_schedule": 0.3471347987651825, "l2_grads": 1.7062280178070068, "l2_params": 274.62060546875, "l2_updates": 0.36966264247894287, "train/loss": 4.212663173675537, "uptime": 13241.573953150002, "examples_seen": 73164800.0, "progress": 0.6345301634947559, "epoch": 57.10793362613929, "img/sec/core": 744.5303246924667, "core_hours_NVIDIA A100-SXM4-40GB": 28.602736021051093, "core_hours": 28.602736021051093} {"step": 71500, "global_schedule": 0.34640613198280334, "l2_grads": 1.7980480194091797, "l2_params": 274.5288391113281, "l2_updates": 0.37067338824272156, "train/loss": 2.3018105030059814, "uptime": 13250.954502564002, "examples_seen": 73216000.0, "progress": 0.6349742013978313, "epoch": 57.14789719060825, "img/sec/core": 682.2628097293036, "core_hours_NVIDIA A100-SXM4-40GB": 28.623581686415537, "core_hours": 28.623581686415537} {"step": 71550, "global_schedule": 0.34567791223526, "l2_grads": 1.766745924949646, "l2_params": 274.4375, "l2_updates": 0.3648148477077484, "train/loss": 2.163115978240967, "uptime": 13259.527080458001, "examples_seen": 73267200.0, "progress": 0.6354182393009067, "epoch": 57.18786075507721, "img/sec/core": 746.5665613233722, "core_hours_NVIDIA A100-SXM4-40GB": 28.642631859513312, "core_hours": 28.642631859513312} {"step": 71600, "global_schedule": 0.34494999051094055, "l2_grads": 1.8673830032348633, "l2_params": 274.3481750488281, "l2_updates": 0.3615713119506836, "train/loss": 3.853630542755127, "uptime": 13269.054772564, "examples_seen": 73318400.0, "progress": 0.6358622772039821, "epoch": 57.227824319546166, "img/sec/core": 671.7261566387114, "core_hours_NVIDIA A100-SXM4-40GB": 28.663804508637757, "core_hours": 28.663804508637757} {"step": 71650, "global_schedule": 0.34422239661216736, "l2_grads": 1.847347617149353, "l2_params": 274.2595520019531, "l2_updates": 0.3719368577003479, "train/loss": 2.0055246353149414, "uptime": 13278.780651797, "examples_seen": 73369600.0, "progress": 0.6363063151070575, "epoch": 57.26778788401512, "img/sec/core": 658.0381934298663, "core_hours_NVIDIA A100-SXM4-40GB": 28.685417573599977, "core_hours": 28.685417573599977} {"step": 71700, "global_schedule": 0.3434951901435852, "l2_grads": 1.9209948778152466, "l2_params": 274.1785888671875, "l2_updates": 0.372852087020874, "train/loss": 2.0596020221710205, "uptime": 13288.170372079001, "examples_seen": 73420800.0, "progress": 0.6367503530101329, "epoch": 57.307751448484076, "img/sec/core": 681.5964488599521, "core_hours_NVIDIA A100-SXM4-40GB": 28.70628361867109, "core_hours": 28.70628361867109} {"step": 71750, "global_schedule": 0.3427683115005493, "l2_grads": 1.898488163948059, "l2_params": 274.0779113769531, "l2_updates": 0.3668248653411865, "train/loss": 1.9963760375976562, "uptime": 13297.09518342, "examples_seen": 73472000.0, "progress": 0.6371943909132084, "epoch": 57.34771501295303, "img/sec/core": 717.1019930246839, "core_hours_NVIDIA A100-SXM4-40GB": 28.726116532762198, "core_hours": 28.726116532762198} {"step": 71800, "global_schedule": 0.3420419692993164, "l2_grads": 1.8412976264953613, "l2_params": 273.9956970214844, "l2_updates": 0.3670302629470825, "train/loss": 2.0541510581970215, "uptime": 13305.735616078002, "examples_seen": 73523200.0, "progress": 0.6376384288162837, "epoch": 57.387678577421994, "img/sec/core": 740.703649148096, "core_hours_NVIDIA A100-SXM4-40GB": 28.745317494224423, "core_hours": 28.745317494224423} {"step": 71850, "global_schedule": 0.3413158655166626, "l2_grads": 1.8626856803894043, "l2_params": 273.91888427734375, "l2_updates": 0.36448362469673157, "train/loss": 1.938254714012146, "uptime": 13314.335199987001, "examples_seen": 73574400.0, "progress": 0.6380824667193592, "epoch": 57.42764214189095, "img/sec/core": 744.2220539650299, "core_hours_NVIDIA A100-SXM4-40GB": 28.76442768068887, "core_hours": 28.76442768068887} {"step": 71900, "global_schedule": 0.34059011936187744, "l2_grads": 1.7220826148986816, "l2_params": 273.8330993652344, "l2_updates": 0.3622918128967285, "train/loss": 2.137444496154785, "uptime": 13322.902023704, "examples_seen": 73625600.0, "progress": 0.6385265046224345, "epoch": 57.467605706359905, "img/sec/core": 747.0680162707595, "core_hours_NVIDIA A100-SXM4-40GB": 28.783465066726645, "core_hours": 28.783465066726645} {"step": 71950, "global_schedule": 0.3398647904396057, "l2_grads": 1.566850185394287, "l2_params": 273.7509765625, "l2_updates": 0.3641916811466217, "train/loss": 3.330990791320801, "uptime": 13331.486439415, "examples_seen": 73676800.0, "progress": 0.63897054252551, "epoch": 57.50756927082886, "img/sec/core": 745.5370540593391, "core_hours_NVIDIA A100-SXM4-40GB": 28.80254154608442, "core_hours": 28.80254154608442} {"step": 72000, "global_schedule": 0.3391398787498474, "l2_grads": 1.9046047925949097, "l2_params": 273.66717529296875, "l2_updates": 0.3604777455329895, "train/loss": 2.1021745204925537, "uptime": 13341.316609821, "examples_seen": 73728000.0, "progress": 0.6394145804285853, "epoch": 57.547532835297815, "img/sec/core": 651.0568724316283, "core_hours_NVIDIA A100-SXM4-40GB": 28.824386369208867, "core_hours": 28.824386369208867} {"step": 72050, "global_schedule": 0.3384152352809906, "l2_grads": 1.8401768207550049, "l2_params": 273.5701599121094, "l2_updates": 0.3552772104740143, "train/loss": 3.5711846351623535, "uptime": 13350.441691955, "examples_seen": 73779200.0, "progress": 0.6398586183316608, "epoch": 57.58749639976678, "img/sec/core": 759.5831596376908, "core_hours_NVIDIA A100-SXM4-40GB": 28.843110088977753, "core_hours": 28.843110088977753} {"step": 72100, "global_schedule": 0.337691068649292, "l2_grads": 1.9515364170074463, "l2_params": 273.4872131347656, "l2_updates": 0.36001136898994446, "train/loss": 1.9424734115600586, "uptime": 13359.697883556002, "examples_seen": 73830400.0, "progress": 0.6403026562347361, "epoch": 57.62745996423573, "img/sec/core": 691.429075356148, "core_hours_NVIDIA A100-SXM4-40GB": 28.863679403646646, "core_hours": 28.863679403646646} {"step": 72150, "global_schedule": 0.33696720004081726, "l2_grads": 1.8331671953201294, "l2_params": 273.4000549316406, "l2_updates": 0.3620109260082245, "train/loss": 2.541011333465576, "uptime": 13369.175793017, "examples_seen": 73881600.0, "progress": 0.6407466941378116, "epoch": 57.66742352870469, "img/sec/core": 675.2543930004756, "core_hours_NVIDIA A100-SXM4-40GB": 28.884741424671084, "core_hours": 28.884741424671084} {"step": 72200, "global_schedule": 0.33624374866485596, "l2_grads": 1.8845747709274292, "l2_params": 273.3043212890625, "l2_updates": 0.36137109994888306, "train/loss": 2.1077048778533936, "uptime": 13377.883484239, "examples_seen": 73932800.0, "progress": 0.6411907320408871, "epoch": 57.707387093173644, "img/sec/core": 734.9824237945405, "core_hours_NVIDIA A100-SXM4-40GB": 28.904091849608864, "core_hours": 28.904091849608864} {"step": 72250, "global_schedule": 0.33552074432373047, "l2_grads": 1.8273546695709229, "l2_params": 273.21051025390625, "l2_updates": 0.3534119129180908, "train/loss": 4.480133533477783, "uptime": 13386.486862827, "examples_seen": 73984000.0, "progress": 0.6416347699439624, "epoch": 57.7473506576426, "img/sec/core": 743.8938010850117, "core_hours_NVIDIA A100-SXM4-40GB": 28.923210468693306, "core_hours": 28.923210468693306} {"step": 72300, "global_schedule": 0.33479803800582886, "l2_grads": 1.8903335332870483, "l2_params": 273.1317443847656, "l2_updates": 0.35548245906829834, "train/loss": 2.3510453701019287, "uptime": 13395.698482277001, "examples_seen": 74035200.0, "progress": 0.6420788078470379, "epoch": 57.78731422211156, "img/sec/core": 694.7746848138729, "core_hours_NVIDIA A100-SXM4-40GB": 28.943680734137754, "core_hours": 28.943680734137754} {"step": 72350, "global_schedule": 0.3340757489204407, "l2_grads": 1.7457497119903564, "l2_params": 273.054931640625, "l2_updates": 0.3586035370826721, "train/loss": 2.690624952316284, "uptime": 13405.278058728001, "examples_seen": 74086400.0, "progress": 0.6425228457501132, "epoch": 57.82727778658052, "img/sec/core": 668.0879924844378, "core_hours_NVIDIA A100-SXM4-40GB": 28.964968681806642, "core_hours": 28.964968681806642} {"step": 72400, "global_schedule": 0.33335381746292114, "l2_grads": 1.8683205842971802, "l2_params": 272.96649169921875, "l2_updates": 0.3540065586566925, "train/loss": 2.0435690879821777, "uptime": 13413.992911387, "examples_seen": 74137600.0, "progress": 0.6429668836531887, "epoch": 57.86724135104947, "img/sec/core": 734.3784514120641, "core_hours_NVIDIA A100-SXM4-40GB": 28.984335021048864, "core_hours": 28.984335021048864} {"step": 72450, "global_schedule": 0.33263224363327026, "l2_grads": 1.941962718963623, "l2_params": 272.868896484375, "l2_updates": 0.34706956148147583, "train/loss": 1.914127230644226, "uptime": 13422.714883196002, "examples_seen": 74188800.0, "progress": 0.643410921556264, "epoch": 57.90720491551843, "img/sec/core": 733.7790284296306, "core_hours_NVIDIA A100-SXM4-40GB": 29.003717180624424, "core_hours": 29.003717180624424} {"step": 72500, "global_schedule": 0.33191123604774475, "l2_grads": 1.8284544944763184, "l2_params": 272.7875671386719, "l2_updates": 0.3507925868034363, "train/loss": 2.7271311283111572, "uptime": 13432.24834802, "examples_seen": 74240000.0, "progress": 0.6438549594593395, "epoch": 57.94716847998739, "img/sec/core": 671.3194120032033, "core_hours_NVIDIA A100-SXM4-40GB": 29.02490265801109, "core_hours": 29.02490265801109, "val/acc@1": 0.70684, "val/loss": 1.1856632861328125, "z/secs/eval/val": 2.567218205000245} {"step": 72550, "global_schedule": 0.33119046688079834, "l2_grads": 1.991281270980835, "l2_params": 272.69622802734375, "l2_updates": 0.348245233297348, "train/loss": 4.041046142578125, "uptime": 13444.288432801002, "examples_seen": 74291200.0, "progress": 0.6442989973624148, "epoch": 57.987132044456345, "img/sec/core": 675.6746242854526, "core_hours_NVIDIA A100-SXM4-40GB": 29.04595157965331, "core_hours": 29.04595157965331} {"step": 72600, "global_schedule": 0.33047014474868774, "l2_grads": 1.9585319757461548, "l2_params": 272.6023864746094, "l2_updates": 0.3547860383987427, "train/loss": 1.9298381805419922, "uptime": 13454.551322526999, "examples_seen": 74342400.0, "progress": 0.6447430352654903, "epoch": 58.0270956089253, "img/sec/core": 623.6060379552189, "core_hours_NVIDIA A100-SXM4-40GB": 29.068758001266637, "core_hours": 29.068758001266637} {"step": 72650, "global_schedule": 0.3297502398490906, "l2_grads": 2.035393714904785, "l2_params": 272.5141296386719, "l2_updates": 0.3454529941082001, "train/loss": 2.0942840576171875, "uptime": 13464.116146118, "examples_seen": 74393600.0, "progress": 0.6451870731685657, "epoch": 58.067059173394256, "img/sec/core": 669.1184567189794, "core_hours_NVIDIA A100-SXM4-40GB": 29.090013164802194, "core_hours": 29.090013164802194} {"step": 72700, "global_schedule": 0.3290306627750397, "l2_grads": 2.075786828994751, "l2_params": 272.425048828125, "l2_updates": 0.3489980399608612, "train/loss": 2.00453519821167, "uptime": 13473.065931539002, "examples_seen": 74444800.0, "progress": 0.6456311110716411, "epoch": 58.10702273786321, "img/sec/core": 715.1009436473565, "core_hours_NVIDIA A100-SXM4-40GB": 29.109901576848866, "core_hours": 29.109901576848866} {"step": 72750, "global_schedule": 0.32831162214279175, "l2_grads": 1.7682219743728638, "l2_params": 272.3462219238281, "l2_updates": 0.3507789671421051, "train/loss": 4.111292839050293, "uptime": 13481.717746953002, "examples_seen": 74496000.0, "progress": 0.6460751489747165, "epoch": 58.146986302332174, "img/sec/core": 739.7291428159938, "core_hours_NVIDIA A100-SXM4-40GB": 29.12912783332442, "core_hours": 29.12912783332442} {"step": 72800, "global_schedule": 0.3275928497314453, "l2_grads": 1.9170836210250854, "l2_params": 272.2535095214844, "l2_updates": 0.3480551838874817, "train/loss": 2.783001661300659, "uptime": 13490.482940061001, "examples_seen": 74547200.0, "progress": 0.6465191868777919, "epoch": 58.18694986680113, "img/sec/core": 730.1607530082539, "core_hours_NVIDIA A100-SXM4-40GB": 29.148606040231083, "core_hours": 29.148606040231083} {"step": 72850, "global_schedule": 0.3268744945526123, "l2_grads": 2.0183308124542236, "l2_params": 272.1661071777344, "l2_updates": 0.3423866927623749, "train/loss": 4.407421112060547, "uptime": 13499.184172532, "examples_seen": 74598400.0, "progress": 0.6469632247808673, "epoch": 58.226913431270084, "img/sec/core": 735.5279865619093, "core_hours_NVIDIA A100-SXM4-40GB": 29.167942112388857, "core_hours": 29.167942112388857} {"step": 72900, "global_schedule": 0.3261565566062927, "l2_grads": 1.7881664037704468, "l2_params": 272.0887756347656, "l2_updates": 0.3480437099933624, "train/loss": 2.4670181274414062, "uptime": 13508.565127120999, "examples_seen": 74649600.0, "progress": 0.6474072626839427, "epoch": 58.26687699573904, "img/sec/core": 682.2333419569737, "core_hours_NVIDIA A100-SXM4-40GB": 29.188788678142192, "core_hours": 29.188788678142192} {"step": 72950, "global_schedule": 0.3254390358924866, "l2_grads": 1.9762920141220093, "l2_params": 272.0064392089844, "l2_updates": 0.3465907573699951, "train/loss": 1.906649112701416, "uptime": 13517.756666023999, "examples_seen": 74700800.0, "progress": 0.6478513005870181, "epoch": 58.306840560207995, "img/sec/core": 696.2925433423446, "core_hours_NVIDIA A100-SXM4-40GB": 29.20921432014886, "core_hours": 29.20921432014886} {"step": 73000, "global_schedule": 0.3247219920158386, "l2_grads": 1.8877894878387451, "l2_params": 271.9186706542969, "l2_updates": 0.3471395969390869, "train/loss": 2.102266788482666, "uptime": 13527.186044147, "examples_seen": 74752000.0, "progress": 0.6482953384900935, "epoch": 58.34680412467696, "img/sec/core": 678.7298076835714, "core_hours_NVIDIA A100-SXM4-40GB": 29.230168493755524, "core_hours": 29.230168493755524} {"step": 73050, "global_schedule": 0.32400527596473694, "l2_grads": 1.9651882648468018, "l2_params": 271.832763671875, "l2_updates": 0.3397826552391052, "train/loss": 1.900195598602295, "uptime": 13537.051165635, "examples_seen": 74803200.0, "progress": 0.6487393763931689, "epoch": 58.38676768914591, "img/sec/core": 694.6682310308579, "core_hours_NVIDIA A100-SXM4-40GB": 29.250641896146647, "core_hours": 29.250641896146647} {"step": 73100, "global_schedule": 0.3232889771461487, "l2_grads": 1.7638707160949707, "l2_params": 271.7420654296875, "l2_updates": 0.34533825516700745, "train/loss": 2.4962971210479736, "uptime": 13546.620494661, "examples_seen": 74854400.0, "progress": 0.6491834142962444, "epoch": 58.42673125361487, "img/sec/core": 668.8034221220687, "core_hours_NVIDIA A100-SXM4-40GB": 29.271907071759976, "core_hours": 29.271907071759976} {"step": 73150, "global_schedule": 0.32257306575775146, "l2_grads": 1.7564979791641235, "l2_params": 271.6578063964844, "l2_updates": 0.3401978313922882, "train/loss": 3.500993013381958, "uptime": 13555.327153477001, "examples_seen": 74905600.0, "progress": 0.6496274521993197, "epoch": 58.46669481808382, "img/sec/core": 735.0695755113122, "core_hours_NVIDIA A100-SXM4-40GB": 29.291255202462203, "core_hours": 29.291255202462203} {"step": 73200, "global_schedule": 0.3218577206134796, "l2_grads": 1.7982189655303955, "l2_params": 271.5686340332031, "l2_updates": 0.3483448922634125, "train/loss": 2.0042905807495117, "uptime": 13563.805516061, "examples_seen": 74956800.0, "progress": 0.6500714901023952, "epoch": 58.50665838255278, "img/sec/core": 754.8627387177887, "core_hours_NVIDIA A100-SXM4-40GB": 29.31009600820442, "core_hours": 29.31009600820442} {"step": 73250, "global_schedule": 0.32114267349243164, "l2_grads": 1.9570857286453247, "l2_params": 271.4723205566406, "l2_updates": 0.3431132733821869, "train/loss": 1.9008699655532837, "uptime": 13573.60679991, "examples_seen": 75008000.0, "progress": 0.6505155280054705, "epoch": 58.54662194702174, "img/sec/core": 652.9756814106896, "core_hours_NVIDIA A100-SXM4-40GB": 29.331876638979978, "core_hours": 29.331876638979978} {"step": 73300, "global_schedule": 0.3204280734062195, "l2_grads": 1.817707896232605, "l2_params": 271.3975524902344, "l2_updates": 0.3432060182094574, "train/loss": 2.331962823867798, "uptime": 13582.732066039001, "examples_seen": 75059200.0, "progress": 0.650959565908546, "epoch": 58.586585511490696, "img/sec/core": 701.3494082829633, "core_hours_NVIDIA A100-SXM4-40GB": 29.352155008155535, "core_hours": 29.352155008155535} {"step": 73350, "global_schedule": 0.319713830947876, "l2_grads": 1.9397974014282227, "l2_params": 271.3021545410156, "l2_updates": 0.33528420329093933, "train/loss": 1.8199231624603271, "uptime": 13591.305983647, "examples_seen": 75110400.0, "progress": 0.6514036038116213, "epoch": 58.62654907595965, "img/sec/core": 746.4499068698004, "core_hours_NVIDIA A100-SXM4-40GB": 29.371208158395532, "core_hours": 29.371208158395532} {"step": 73400, "global_schedule": 0.3190000653266907, "l2_grads": 2.0216691493988037, "l2_params": 271.2177429199219, "l2_updates": 0.33832111954689026, "train/loss": 1.9259796142578125, "uptime": 13600.546120279001, "examples_seen": 75161600.0, "progress": 0.6518476417146968, "epoch": 58.66651264042861, "img/sec/core": 692.6304507051524, "core_hours_NVIDIA A100-SXM4-40GB": 29.391741795355536, "core_hours": 29.391741795355536} {"step": 73450, "global_schedule": 0.3182867765426636, "l2_grads": 1.8719184398651123, "l2_params": 271.1302490234375, "l2_updates": 0.33129751682281494, "train/loss": 4.31218147277832, "uptime": 13610.062219614001, "examples_seen": 75212800.0, "progress": 0.6522916796177721, "epoch": 58.70647620489757, "img/sec/core": 672.5444717102647, "core_hours_NVIDIA A100-SXM4-40GB": 29.41288868276665, "core_hours": 29.41288868276665} {"step": 73500, "global_schedule": 0.3175738453865051, "l2_grads": 2.076362371444702, "l2_params": 271.0370178222656, "l2_updates": 0.3319213092327118, "train/loss": 1.921319603919983, "uptime": 13619.51579217, "examples_seen": 75264000.0, "progress": 0.6527357175208476, "epoch": 58.746439769366525, "img/sec/core": 676.9927413250057, "core_hours_NVIDIA A100-SXM4-40GB": 29.433896621779976, "core_hours": 29.433896621779976} {"step": 73550, "global_schedule": 0.3168613314628601, "l2_grads": 1.7636030912399292, "l2_params": 270.9443664550781, "l2_updates": 0.3337092101573944, "train/loss": 2.642071008682251, "uptime": 13629.018948726001, "examples_seen": 75315200.0, "progress": 0.653179755423923, "epoch": 58.78640333383548, "img/sec/core": 673.4604404636315, "core_hours_NVIDIA A100-SXM4-40GB": 29.45501474745998, "core_hours": 29.45501474745998} {"step": 73600, "global_schedule": 0.3161492347717285, "l2_grads": 2.024127960205078, "l2_params": 270.8629455566406, "l2_updates": 0.3319995701313019, "train/loss": 1.882056474685669, "uptime": 13637.678150094, "examples_seen": 75366400.0, "progress": 0.6536237933269984, "epoch": 58.826366898304435, "img/sec/core": 739.0981833096506, "core_hours_NVIDIA A100-SXM4-40GB": 29.474257417166644, "core_hours": 29.474257417166644} {"step": 73650, "global_schedule": 0.31543758511543274, "l2_grads": 1.8847886323928833, "l2_params": 270.76873779296875, "l2_updates": 0.33523398637771606, "train/loss": 3.084024429321289, "uptime": 13646.329921711002, "examples_seen": 75417600.0, "progress": 0.6540678312300738, "epoch": 58.86633046277339, "img/sec/core": 739.7328874727929, "core_hours_NVIDIA A100-SXM4-40GB": 29.493483576315537, "core_hours": 29.493483576315537} {"step": 73700, "global_schedule": 0.31472647190093994, "l2_grads": 1.7972710132598877, "l2_params": 270.6856384277344, "l2_updates": 0.33127740025520325, "train/loss": 3.444121837615967, "uptime": 13654.955608633, "examples_seen": 75468800.0, "progress": 0.6545118691331492, "epoch": 58.90629402724235, "img/sec/core": 741.969892702489, "core_hours_NVIDIA A100-SXM4-40GB": 29.512651769475532, "core_hours": 29.512651769475532} {"step": 73750, "global_schedule": 0.3140156865119934, "l2_grads": 1.8176114559173584, "l2_params": 270.5998229980469, "l2_updates": 0.3291793167591095, "train/loss": 2.556070566177368, "uptime": 13663.635369705002, "examples_seen": 75520000.0, "progress": 0.6549559070362246, "epoch": 58.94625759171131, "img/sec/core": 737.3474853638586, "core_hours_NVIDIA A100-SXM4-40GB": 29.531940127413314, "core_hours": 29.531940127413314} {"step": 73800, "global_schedule": 0.3133053183555603, "l2_grads": 2.029741048812866, "l2_params": 270.51080322265625, "l2_updates": 0.3288317322731018, "train/loss": 2.0924232006073, "uptime": 13672.210655996, "examples_seen": 75571200.0, "progress": 0.6553999449393, "epoch": 58.986221156180264, "img/sec/core": 746.3307676058303, "core_hours_NVIDIA A100-SXM4-40GB": 29.550996319171087, "core_hours": 29.550996319171087} {"step": 73850, "global_schedule": 0.3125954568386078, "l2_grads": 1.9303367137908936, "l2_params": 270.4291076660156, "l2_updates": 0.33755192160606384, "train/loss": 2.0331122875213623, "uptime": 13682.208466940001, "examples_seen": 75622400.0, "progress": 0.6558439828423754, "epoch": 59.02618472064922, "img/sec/core": 640.1401302591906, "core_hours_NVIDIA A100-SXM4-40GB": 29.573213676824423, "core_hours": 29.573213676824423} {"step": 73900, "global_schedule": 0.3118859827518463, "l2_grads": 1.8231396675109863, "l2_params": 270.3393859863281, "l2_updates": 0.3263489603996277, "train/loss": 4.168068885803223, "uptime": 13691.21679167, "examples_seen": 75673600.0, "progress": 0.6562880207454508, "epoch": 59.066148285118174, "img/sec/core": 710.4539625094874, "core_hours_NVIDIA A100-SXM4-40GB": 29.593232176224422, "core_hours": 29.593232176224422} {"step": 73950, "global_schedule": 0.31117701530456543, "l2_grads": 1.7016925811767578, "l2_params": 270.25518798828125, "l2_updates": 0.32709014415740967, "train/loss": 2.7707087993621826, "uptime": 13699.882094043, "examples_seen": 75724800.0, "progress": 0.6567320586485262, "epoch": 59.10611184958714, "img/sec/core": 738.5778042716563, "core_hours_NVIDIA A100-SXM4-40GB": 29.612488403719976, "core_hours": 29.612488403719976} {"step": 74000, "global_schedule": 0.3104684352874756, "l2_grads": 1.967508316040039, "l2_params": 270.17333984375, "l2_updates": 0.3317636549472809, "train/loss": 1.8545751571655273, "uptime": 13708.624236552, "examples_seen": 75776000.0, "progress": 0.6571760965516017, "epoch": 59.14607541405609, "img/sec/core": 732.0859838891281, "core_hours_NVIDIA A100-SXM4-40GB": 29.63191538707331, "core_hours": 29.63191538707331} {"step": 74050, "global_schedule": 0.30976030230522156, "l2_grads": 1.7416363954544067, "l2_params": 270.09051513671875, "l2_updates": 0.33595988154411316, "train/loss": 2.3903450965881348, "uptime": 13718.625795967002, "examples_seen": 75827200.0, "progress": 0.657620134454677, "epoch": 59.18603897852505, "img/sec/core": 711.5429882942592, "core_hours_NVIDIA A100-SXM4-40GB": 29.651903247899988, "core_hours": 29.651903247899988} {"step": 74100, "global_schedule": 0.30905258655548096, "l2_grads": 1.8134686946868896, "l2_params": 270.0028076171875, "l2_updates": 0.3227457106113434, "train/loss": 2.973966121673584, "uptime": 13728.287280215, "examples_seen": 75878400.0, "progress": 0.6580641723577525, "epoch": 59.226002542994, "img/sec/core": 662.42409920882, "core_hours_NVIDIA A100-SXM4-40GB": 29.673373212895534, "core_hours": 29.673373212895534} {"step": 74150, "global_schedule": 0.30834531784057617, "l2_grads": 1.915267825126648, "l2_params": 269.9143981933594, "l2_updates": 0.3327023983001709, "train/loss": 1.8695588111877441, "uptime": 13737.757123553, "examples_seen": 75929600.0, "progress": 0.6585082102608278, "epoch": 59.26596610746296, "img/sec/core": 675.8295540453697, "core_hours_NVIDIA A100-SXM4-40GB": 29.6944173092022, "core_hours": 29.6944173092022} {"step": 74200, "global_schedule": 0.30763864517211914, "l2_grads": 1.8700342178344727, "l2_params": 269.828125, "l2_updates": 0.3277988135814667, "train/loss": 1.7996134757995605, "uptime": 13746.378706311001, "examples_seen": 75980800.0, "progress": 0.6589522481639033, "epoch": 59.30592967193192, "img/sec/core": 742.3230953806151, "core_hours_NVIDIA A100-SXM4-40GB": 29.71357638199776, "core_hours": 29.71357638199776} {"step": 74250, "global_schedule": 0.306932270526886, "l2_grads": 1.9447635412216187, "l2_params": 269.7480773925781, "l2_updates": 0.32620930671691895, "train/loss": 3.8041186332702637, "uptime": 13755.429947527, "examples_seen": 76032000.0, "progress": 0.6593962860669786, "epoch": 59.345893236400876, "img/sec/core": 707.0853430231782, "core_hours_NVIDIA A100-SXM4-40GB": 29.733690251366646, "core_hours": 29.733690251366646} {"step": 74300, "global_schedule": 0.30622637271881104, "l2_grads": 1.8666824102401733, "l2_params": 269.66302490234375, "l2_updates": 0.33351126313209534, "train/loss": 1.9819012880325317, "uptime": 13764.10349594, "examples_seen": 76083200.0, "progress": 0.6598403239700541, "epoch": 59.38585680086983, "img/sec/core": 737.8756300486349, "core_hours_NVIDIA A100-SXM4-40GB": 29.752964803395535, "core_hours": 29.752964803395535} {"step": 74350, "global_schedule": 0.3055209219455719, "l2_grads": 1.978349208831787, "l2_params": 269.58544921875, "l2_updates": 0.3301440477371216, "train/loss": 1.9642881155014038, "uptime": 13773.106058571999, "examples_seen": 76134400.0, "progress": 0.6602843618731294, "epoch": 59.42582036533879, "img/sec/core": 710.908689182792, "core_hours_NVIDIA A100-SXM4-40GB": 29.77297049813331, "core_hours": 29.77297049813331} {"step": 74400, "global_schedule": 0.30481603741645813, "l2_grads": 1.9669615030288696, "l2_params": 269.491455078125, "l2_updates": 0.32508552074432373, "train/loss": 1.843604564666748, "uptime": 13781.861041031001, "examples_seen": 76185600.0, "progress": 0.6607283997762049, "epoch": 59.46578392980775, "img/sec/core": 731.0123155551468, "core_hours_NVIDIA A100-SXM4-40GB": 29.792426014708873, "core_hours": 29.792426014708873} {"step": 74450, "global_schedule": 0.304111510515213, "l2_grads": 1.7295595407485962, "l2_params": 269.40191650390625, "l2_updates": 0.3240587115287781, "train/loss": 2.8586106300354004, "uptime": 13790.881879469, "examples_seen": 76236800.0, "progress": 0.6611724376792804, "epoch": 59.505747494276704, "img/sec/core": 709.4684207003742, "core_hours_NVIDIA A100-SXM4-40GB": 29.812472322348867, "core_hours": 29.812472322348867} {"step": 74500, "global_schedule": 0.3034074306488037, "l2_grads": 1.89351487159729, "l2_params": 269.31732177734375, "l2_updates": 0.32798296213150024, "train/loss": 1.9841070175170898, "uptime": 13799.673704851002, "examples_seen": 76288000.0, "progress": 0.6616164755823557, "epoch": 59.54571105874566, "img/sec/core": 727.9489436973133, "core_hours_NVIDIA A100-SXM4-40GB": 29.832009712086652, "core_hours": 29.832009712086652} {"step": 74550, "global_schedule": 0.302703857421875, "l2_grads": 2.002091884613037, "l2_params": 269.2339172363281, "l2_updates": 0.3240903913974762, "train/loss": 1.9197399616241455, "uptime": 13808.287673212, "examples_seen": 76339200.0, "progress": 0.6620605134854312, "epoch": 59.585674623214615, "img/sec/core": 742.9792787465523, "core_hours_NVIDIA A100-SXM4-40GB": 29.85115186399998, "core_hours": 29.85115186399998} {"step": 74600, "global_schedule": 0.3020007014274597, "l2_grads": 1.7388206720352173, "l2_params": 269.15301513671875, "l2_updates": 0.32102689146995544, "train/loss": 2.973062038421631, "uptime": 13816.994439181, "examples_seen": 76390400.0, "progress": 0.6625045513885065, "epoch": 59.62563818768357, "img/sec/core": 735.0605291088323, "core_hours_NVIDIA A100-SXM4-40GB": 29.870500232819982, "core_hours": 29.870500232819982} {"step": 74650, "global_schedule": 0.3012981414794922, "l2_grads": 1.9134228229522705, "l2_params": 269.06927490234375, "l2_updates": 0.3166358768939972, "train/loss": 3.3212037086486816, "uptime": 13825.518486964002, "examples_seen": 76441600.0, "progress": 0.662948589291582, "epoch": 59.66560175215253, "img/sec/core": 750.8170018430709, "core_hours_NVIDIA A100-SXM4-40GB": 29.88944256122665, "core_hours": 29.88944256122665} {"step": 74700, "global_schedule": 0.30059587955474854, "l2_grads": 2.0297398567199707, "l2_params": 268.9828796386719, "l2_updates": 0.32117190957069397, "train/loss": 1.9777748584747314, "uptime": 13834.219503281, "examples_seen": 76492800.0, "progress": 0.6633926271946573, "epoch": 59.70556531662149, "img/sec/core": 735.5462588315332, "core_hours_NVIDIA A100-SXM4-40GB": 29.9087781530422, "core_hours": 29.9087781530422} {"step": 74750, "global_schedule": 0.29989415407180786, "l2_grads": 1.9980770349502563, "l2_params": 268.8955078125, "l2_updates": 0.3212597072124481, "train/loss": 4.404451370239258, "uptime": 13843.894940381002, "examples_seen": 76544000.0, "progress": 0.6638366650977328, "epoch": 59.74552888109044, "img/sec/core": 661.4688239767872, "core_hours_NVIDIA A100-SXM4-40GB": 29.93027912437554, "core_hours": 29.93027912437554} {"step": 74800, "global_schedule": 0.2991928458213806, "l2_grads": 1.9551242589950562, "l2_params": 268.8151550292969, "l2_updates": 0.318185418844223, "train/loss": 1.8714286088943481, "uptime": 13853.359513295001, "examples_seen": 76595200.0, "progress": 0.6642807030008081, "epoch": 59.7854924455594, "img/sec/core": 676.2058952003631, "core_hours_NVIDIA A100-SXM4-40GB": 29.951311508628873, "core_hours": 29.951311508628873} {"step": 74850, "global_schedule": 0.2984920144081116, "l2_grads": 1.9194964170455933, "l2_params": 268.73651123046875, "l2_updates": 0.3113296329975128, "train/loss": 4.357143878936768, "uptime": 13862.950541805001, "examples_seen": 76646400.0, "progress": 0.6647247409038836, "epoch": 59.825456010028354, "img/sec/core": 667.2902695813251, "core_hours_NVIDIA A100-SXM4-40GB": 29.972624905317762, "core_hours": 29.972624905317762} {"step": 74900, "global_schedule": 0.2977917790412903, "l2_grads": 1.8146110773086548, "l2_params": 268.6433410644531, "l2_updates": 0.3180718421936035, "train/loss": 2.9976823329925537, "uptime": 13872.606377170001, "examples_seen": 76697600.0, "progress": 0.665168778806959, "epoch": 59.86541957449732, "img/sec/core": 662.8116323522394, "core_hours_NVIDIA A100-SXM4-40GB": 29.994082317239982, "core_hours": 29.994082317239982} {"step": 74950, "global_schedule": 0.29709193110466003, "l2_grads": 1.9694879055023193, "l2_params": 268.5605773925781, "l2_updates": 0.31263816356658936, "train/loss": 2.5294995307922363, "uptime": 13882.222253760001, "examples_seen": 76748800.0, "progress": 0.6656128167100344, "epoch": 59.90538313896627, "img/sec/core": 665.5659460787672, "core_hours_NVIDIA A100-SXM4-40GB": 30.015450931884427, "core_hours": 30.015450931884427} {"step": 75000, "global_schedule": 0.2963925302028656, "l2_grads": 2.043501377105713, "l2_params": 268.4733581542969, "l2_updates": 0.31430235505104065, "train/loss": 1.8941919803619385, "uptime": 13891.704397246, "examples_seen": 76800000.0, "progress": 0.6660568546131098, "epoch": 59.94534670343523, "img/sec/core": 674.9528742578335, "core_hours_NVIDIA A100-SXM4-40GB": 30.03652236185331, "core_hours": 30.03652236185331, "val/acc@1": 0.71286, "val/loss": 1.1557268017578124, "z/secs/eval/val": 4.720533676001651} {"step": 75050, "global_schedule": 0.29569360613822937, "l2_grads": 1.9842119216918945, "l2_params": 268.384033203125, "l2_updates": 0.3186485469341278, "train/loss": 1.8425272703170776, "uptime": 13906.471657562002, "examples_seen": 76851200.0, "progress": 0.6665008925161852, "epoch": 59.98531026790418, "img/sec/core": 703.1705068310671, "core_hours_NVIDIA A100-SXM4-40GB": 30.05674821331332, "core_hours": 30.05674821331332} {"step": 75100, "global_schedule": 0.2949952185153961, "l2_grads": 1.8523038625717163, "l2_params": 268.2995910644531, "l2_updates": 0.3152737617492676, "train/loss": 1.798951506614685, "uptime": 13915.895979923002, "examples_seen": 76902400.0, "progress": 0.6669449304192606, "epoch": 60.02527383237314, "img/sec/core": 679.0939183580134, "core_hours_NVIDIA A100-SXM4-40GB": 30.077691151893315, "core_hours": 30.077691151893315} {"step": 75150, "global_schedule": 0.29429733753204346, "l2_grads": 1.895513653755188, "l2_params": 268.2070617675781, "l2_updates": 0.317433625459671, "train/loss": 1.7945945262908936, "uptime": 13924.74010464, "examples_seen": 76953600.0, "progress": 0.667388968322336, "epoch": 60.0652373968421, "img/sec/core": 723.6442502557404, "core_hours_NVIDIA A100-SXM4-40GB": 30.097344762375535, "core_hours": 30.097344762375535} {"step": 75200, "global_schedule": 0.2935999035835266, "l2_grads": 1.8158783912658691, "l2_params": 268.1228942871094, "l2_updates": 0.31071844696998596, "train/loss": 2.4132797718048096, "uptime": 13933.431350820001, "examples_seen": 77004800.0, "progress": 0.6678330062254114, "epoch": 60.105200961311056, "img/sec/core": 736.3731123766751, "core_hours_NVIDIA A100-SXM4-40GB": 30.116658642775537, "core_hours": 30.116658642775537} {"step": 75250, "global_schedule": 0.2929028868675232, "l2_grads": 2.0536279678344727, "l2_params": 268.0406799316406, "l2_updates": 0.3077128529548645, "train/loss": 1.8917782306671143, "uptime": 13941.855480790002, "examples_seen": 77056000.0, "progress": 0.6682770441284868, "epoch": 60.14516452578001, "img/sec/core": 759.7223716622581, "core_hours_NVIDIA A100-SXM4-40GB": 30.13537893159776, "core_hours": 30.13537893159776} {"step": 75300, "global_schedule": 0.29220640659332275, "l2_grads": 1.9270905256271362, "l2_params": 267.9537353515625, "l2_updates": 0.3103203773498535, "train/loss": 2.1934139728546143, "uptime": 13950.344796003, "examples_seen": 77107200.0, "progress": 0.6687210820315622, "epoch": 60.185128090248966, "img/sec/core": 753.8888401976476, "core_hours_NVIDIA A100-SXM4-40GB": 30.154244076515536, "core_hours": 30.154244076515536} {"step": 75350, "global_schedule": 0.2915104329586029, "l2_grads": 2.1148414611816406, "l2_params": 267.85833740234375, "l2_updates": 0.3102323114871979, "train/loss": 4.337573051452637, "uptime": 13959.728525338001, "examples_seen": 77158400.0, "progress": 0.6691651199346377, "epoch": 60.22509165471793, "img/sec/core": 682.031607212756, "core_hours_NVIDIA A100-SXM4-40GB": 30.175096808371094, "core_hours": 30.175096808371094} {"step": 75400, "global_schedule": 0.29081493616104126, "l2_grads": 1.6948981285095215, "l2_params": 267.7808532714844, "l2_updates": 0.30330634117126465, "train/loss": 3.1134355068206787, "uptime": 13968.320209835, "examples_seen": 77209600.0, "progress": 0.669609157837713, "epoch": 60.265055219186884, "img/sec/core": 744.9063105420448, "core_hours_NVIDIA A100-SXM4-40GB": 30.194189440586644, "core_hours": 30.194189440586644} {"step": 75450, "global_schedule": 0.29011985659599304, "l2_grads": 1.963577151298523, "l2_params": 267.69952392578125, "l2_updates": 0.30390095710754395, "train/loss": 1.895485758781433, "uptime": 13977.040670274002, "examples_seen": 77260800.0, "progress": 0.6700531957407885, "epoch": 60.30501878365584, "img/sec/core": 733.906201944994, "core_hours_NVIDIA A100-SXM4-40GB": 30.213568241562207, "core_hours": 30.213568241562207} {"step": 75500, "global_schedule": 0.2894253730773926, "l2_grads": 1.8793246746063232, "l2_params": 267.6091613769531, "l2_updates": 0.31015196442604065, "train/loss": 4.155614376068115, "uptime": 13985.741944485, "examples_seen": 77312000.0, "progress": 0.6704972336438638, "epoch": 60.344982348124795, "img/sec/core": 735.5244582351546, "core_hours_NVIDIA A100-SXM4-40GB": 30.232904406475537, "core_hours": 30.232904406475537} {"step": 75550, "global_schedule": 0.28873133659362793, "l2_grads": 2.077272415161133, "l2_params": 267.5312194824219, "l2_updates": 0.300138920545578, "train/loss": 2.02593994140625, "uptime": 13994.435133059002, "examples_seen": 77363200.0, "progress": 0.6709412715469393, "epoch": 60.38494591259375, "img/sec/core": 736.2085781896409, "core_hours_NVIDIA A100-SXM4-40GB": 30.252222603306652, "core_hours": 30.252222603306652} {"step": 75600, "global_schedule": 0.28803783655166626, "l2_grads": 1.9578940868377686, "l2_params": 267.43731689453125, "l2_updates": 0.3079109191894531, "train/loss": 1.8898332118988037, "uptime": 14002.940442572, "examples_seen": 77414400.0, "progress": 0.6713853094500146, "epoch": 60.42490947706271, "img/sec/core": 752.471146431389, "core_hours_NVIDIA A100-SXM4-40GB": 30.271123291113316, "core_hours": 30.271123291113316} {"step": 75650, "global_schedule": 0.2873448133468628, "l2_grads": 2.0107600688934326, "l2_params": 267.354736328125, "l2_updates": 0.3108612298965454, "train/loss": 2.0707080364227295, "uptime": 14011.975573896, "examples_seen": 77465600.0, "progress": 0.6718293473530901, "epoch": 60.46487304153167, "img/sec/core": 708.3460959776472, "core_hours_NVIDIA A100-SXM4-40GB": 30.2912013607222, "core_hours": 30.2912013607222} {"step": 75700, "global_schedule": 0.28665220737457275, "l2_grads": 1.9157886505126953, "l2_params": 267.2765808105469, "l2_updates": 0.30655720829963684, "train/loss": 2.2236475944519043, "uptime": 14021.509410560002, "examples_seen": 77516800.0, "progress": 0.6722733852561654, "epoch": 60.50483660600062, "img/sec/core": 671.2932291115093, "core_hours_NVIDIA A100-SXM4-40GB": 30.312387664419983, "core_hours": 30.312387664419983} {"step": 75750, "global_schedule": 0.28596019744873047, "l2_grads": 1.8985618352890015, "l2_params": 267.189208984375, "l2_updates": 0.30758097767829895, "train/loss": 1.7915148735046387, "uptime": 14031.005186928001, "examples_seen": 77568000.0, "progress": 0.6727174231592409, "epoch": 60.54480017046958, "img/sec/core": 673.9838589257243, "core_hours_NVIDIA A100-SXM4-40GB": 30.333489389682207, "core_hours": 30.333489389682207} {"step": 75800, "global_schedule": 0.2852685749530792, "l2_grads": 1.9289968013763428, "l2_params": 267.11285400390625, "l2_updates": 0.3062276244163513, "train/loss": 2.1779658794403076, "uptime": 14040.573341589, "examples_seen": 77619200.0, "progress": 0.6731614610623162, "epoch": 60.584763734938534, "img/sec/core": 668.8855089358996, "core_hours_NVIDIA A100-SXM4-40GB": 30.35475195559554, "core_hours": 30.35475195559554} {"step": 75850, "global_schedule": 0.2845776677131653, "l2_grads": 1.9657820463180542, "l2_params": 267.0290832519531, "l2_updates": 0.3012230694293976, "train/loss": 1.7896054983139038, "uptime": 14050.078891503, "examples_seen": 77670400.0, "progress": 0.6736054989653917, "epoch": 60.624727299407496, "img/sec/core": 673.2908730060976, "core_hours_NVIDIA A100-SXM4-40GB": 30.375875399848873, "core_hours": 30.375875399848873} {"step": 75900, "global_schedule": 0.2838870882987976, "l2_grads": 1.806996464729309, "l2_params": 266.94573974609375, "l2_updates": 0.29853177070617676, "train/loss": 3.5828099250793457, "uptime": 14058.794521129, "examples_seen": 77721600.0, "progress": 0.6740495368684671, "epoch": 60.66469086387645, "img/sec/core": 734.3129842172109, "core_hours_NVIDIA A100-SXM4-40GB": 30.395243465684427, "core_hours": 30.395243465684427} {"step": 75950, "global_schedule": 0.2831970751285553, "l2_grads": 1.8811205625534058, "l2_params": 266.8624572753906, "l2_updates": 0.2990282475948334, "train/loss": 3.7828195095062256, "uptime": 14068.011319406001, "examples_seen": 77772800.0, "progress": 0.6744935747715425, "epoch": 60.70465442834541, "img/sec/core": 694.384297849981, "core_hours_NVIDIA A100-SXM4-40GB": 30.415725239633318, "core_hours": 30.415725239633318} {"step": 76000, "global_schedule": 0.2825074791908264, "l2_grads": 2.150941848754883, "l2_params": 266.78070068359375, "l2_updates": 0.29902270436286926, "train/loss": 1.948441743850708, "uptime": 14077.804890837999, "examples_seen": 77824000.0, "progress": 0.6749376126746179, "epoch": 60.74461799281436, "img/sec/core": 653.4898983929415, "core_hours_NVIDIA A100-SXM4-40GB": 30.437488731704423, "core_hours": 30.437488731704423} {"step": 76050, "global_schedule": 0.2818185091018677, "l2_grads": 1.9763309955596924, "l2_params": 266.6928405761719, "l2_updates": 0.30088043212890625, "train/loss": 1.9458600282669067, "uptime": 14087.578906695, "examples_seen": 77875200.0, "progress": 0.6753816505776933, "epoch": 60.78458155728332, "img/sec/core": 724.1954670062477, "core_hours_NVIDIA A100-SXM4-40GB": 30.45712738296665, "core_hours": 30.45712738296665} {"step": 76100, "global_schedule": 0.28113001585006714, "l2_grads": 2.0365142822265625, "l2_params": 266.6075134277344, "l2_updates": 0.3002532720565796, "train/loss": 1.8800430297851562, "uptime": 14097.214294562002, "examples_seen": 77926400.0, "progress": 0.6758256884807687, "epoch": 60.82454512175228, "img/sec/core": 664.2182015233832, "core_hours_NVIDIA A100-SXM4-40GB": 30.478539356004433, "core_hours": 30.478539356004433} {"step": 76150, "global_schedule": 0.2804420590400696, "l2_grads": 2.1449625492095947, "l2_params": 266.5282287597656, "l2_updates": 0.30046865344047546, "train/loss": 1.9195293188095093, "uptime": 14106.299168186999, "examples_seen": 77977600.0, "progress": 0.6762697263838441, "epoch": 60.864508686221235, "img/sec/core": 704.4676969848242, "core_hours_NVIDIA A100-SXM4-40GB": 30.49872796405998, "core_hours": 30.49872796405998} {"step": 76200, "global_schedule": 0.279754638671875, "l2_grads": 1.9155592918395996, "l2_params": 266.4515075683594, "l2_updates": 0.2935393154621124, "train/loss": 2.7938156127929688, "uptime": 14115.863399843, "examples_seen": 78028800.0, "progress": 0.6767137642869195, "epoch": 60.90447225069019, "img/sec/core": 669.1598687893156, "core_hours_NVIDIA A100-SXM4-40GB": 30.519981812184426, "core_hours": 30.519981812184426} {"step": 76250, "global_schedule": 0.27906760573387146, "l2_grads": 1.8296847343444824, "l2_params": 266.37017822265625, "l2_updates": 0.2953765392303467, "train/loss": 2.3410632610321045, "uptime": 14125.408062719, "examples_seen": 78080000.0, "progress": 0.6771578021899949, "epoch": 60.944435815159146, "img/sec/core": 670.531802238161, "core_hours_NVIDIA A100-SXM4-40GB": 30.541192174131094, "core_hours": 30.541192174131094} {"step": 76300, "global_schedule": 0.27838119864463806, "l2_grads": 1.808275580406189, "l2_params": 266.2879943847656, "l2_updates": 0.29445722699165344, "train/loss": 3.413729190826416, "uptime": 14134.261712427002, "examples_seen": 78131200.0, "progress": 0.6776018400930703, "epoch": 60.9843993796281, "img/sec/core": 722.8657345925362, "core_hours_NVIDIA A100-SXM4-40GB": 30.560866951259985, "core_hours": 30.560866951259985} {"step": 76350, "global_schedule": 0.27769529819488525, "l2_grads": 1.9695366621017456, "l2_params": 266.2055969238281, "l2_updates": 0.2966623604297638, "train/loss": 1.8430498838424683, "uptime": 14144.076443311, "examples_seen": 78182400.0, "progress": 0.6780458779961458, "epoch": 61.024362944097064, "img/sec/core": 652.0810479311881, "core_hours_NVIDIA A100-SXM4-40GB": 30.582677464335536, "core_hours": 30.582677464335536} {"step": 76400, "global_schedule": 0.2770099639892578, "l2_grads": 2.0784013271331787, "l2_params": 266.1236572265625, "l2_updates": 0.29125553369522095, "train/loss": 1.8768268823623657, "uptime": 14152.86576292, "examples_seen": 78233600.0, "progress": 0.6784899158992211, "epoch": 61.06432650856602, "img/sec/core": 728.1564768046436, "core_hours_NVIDIA A100-SXM4-40GB": 30.602209285688875, "core_hours": 30.602209285688875} {"step": 76450, "global_schedule": 0.276324987411499, "l2_grads": 1.8326932191848755, "l2_params": 266.0309753417969, "l2_updates": 0.29253894090652466, "train/loss": 2.852323532104492, "uptime": 14161.256783665, "examples_seen": 78284800.0, "progress": 0.6789339538022966, "epoch": 61.104290073034974, "img/sec/core": 762.7200783426006, "core_hours_NVIDIA A100-SXM4-40GB": 30.620855998455536, "core_hours": 30.620855998455536} {"step": 76500, "global_schedule": 0.27564066648483276, "l2_grads": 2.0541443824768066, "l2_params": 265.9534912109375, "l2_updates": 0.293351411819458, "train/loss": 1.8523554801940918, "uptime": 14169.740281696, "examples_seen": 78336000.0, "progress": 0.6793779917053719, "epoch": 61.14425363750393, "img/sec/core": 754.4057859874478, "core_hours_NVIDIA A100-SXM4-40GB": 30.639708216302207, "core_hours": 30.639708216302207} {"step": 76550, "global_schedule": 0.27495676279067993, "l2_grads": 2.0626895427703857, "l2_params": 265.8653259277344, "l2_updates": 0.29022127389907837, "train/loss": 1.9081662893295288, "uptime": 14178.501676966001, "examples_seen": 78387200.0, "progress": 0.6798220296084474, "epoch": 61.18421720197289, "img/sec/core": 730.4772587892957, "core_hours_NVIDIA A100-SXM4-40GB": 30.659177983568878, "core_hours": 30.659177983568878} {"step": 76600, "global_schedule": 0.2742736339569092, "l2_grads": 1.9371627569198608, "l2_params": 265.7797546386719, "l2_updates": 0.2880500853061676, "train/loss": 4.33182430267334, "uptime": 14187.109667211002, "examples_seen": 78438400.0, "progress": 0.6802660675115227, "epoch": 61.22418076644185, "img/sec/core": 743.4952663564407, "core_hours_NVIDIA A100-SXM4-40GB": 30.678306850779986, "core_hours": 30.678306850779986} {"step": 76650, "global_schedule": 0.2735908031463623, "l2_grads": 1.9644051790237427, "l2_params": 265.6988525390625, "l2_updates": 0.2934095561504364, "train/loss": 1.9775068759918213, "uptime": 14195.918181031999, "examples_seen": 78489600.0, "progress": 0.6807101054145982, "epoch": 61.2641443309108, "img/sec/core": 726.5697857843039, "core_hours_NVIDIA A100-SXM4-40GB": 30.697881325937757, "core_hours": 30.697881325937757} {"step": 76700, "global_schedule": 0.2729085683822632, "l2_grads": 1.8757832050323486, "l2_params": 265.6160583496094, "l2_updates": 0.2888099253177643, "train/loss": 3.668539524078369, "uptime": 14205.030278601002, "examples_seen": 78540800.0, "progress": 0.6811541433176735, "epoch": 61.30410789537976, "img/sec/core": 702.3629797129572, "core_hours_NVIDIA A100-SXM4-40GB": 30.718130431646653, "core_hours": 30.718130431646653} {"step": 76750, "global_schedule": 0.27222689986228943, "l2_grads": 2.072838068008423, "l2_params": 265.5355224609375, "l2_updates": 0.28446099162101746, "train/loss": 1.8577631711959839, "uptime": 14213.508081076, "examples_seen": 78592000.0, "progress": 0.681598181220749, "epoch": 61.34407145984871, "img/sec/core": 754.9126107708496, "core_hours_NVIDIA A100-SXM4-40GB": 30.736969992702203, "core_hours": 30.736969992702203} {"step": 76800, "global_schedule": 0.2715456485748291, "l2_grads": 1.9254847764968872, "l2_params": 265.4505615234375, "l2_updates": 0.29209810495376587, "train/loss": 1.781820297241211, "uptime": 14222.024332715, "examples_seen": 78643200.0, "progress": 0.6820422191238245, "epoch": 61.384035024317676, "img/sec/core": 751.5043321043488, "core_hours_NVIDIA A100-SXM4-40GB": 30.755894996344427, "core_hours": 30.755894996344427} {"step": 76850, "global_schedule": 0.27086514234542847, "l2_grads": 2.065479278564453, "l2_params": 265.36810302734375, "l2_updates": 0.2883390486240387, "train/loss": 1.9135468006134033, "uptime": 14230.598965919, "examples_seen": 78694400.0, "progress": 0.6824862570268998, "epoch": 61.42399858878663, "img/sec/core": 746.387611893949, "core_hours_NVIDIA A100-SXM4-40GB": 30.77494973679776, "core_hours": 30.77494973679776} {"step": 76900, "global_schedule": 0.2701849937438965, "l2_grads": 1.980388879776001, "l2_params": 265.2743835449219, "l2_updates": 0.28459474444389343, "train/loss": 2.460376739501953, "uptime": 14239.291683537, "examples_seen": 78745600.0, "progress": 0.6829302949299753, "epoch": 61.463962153255586, "img/sec/core": 736.2484646628488, "core_hours_NVIDIA A100-SXM4-40GB": 30.79426688705998, "core_hours": 30.79426688705998} {"step": 76950, "global_schedule": 0.26950544118881226, "l2_grads": 1.9844648838043213, "l2_params": 265.2049255371094, "l2_updates": 0.28297606110572815, "train/loss": 1.8659172058105469, "uptime": 14247.977737923002, "examples_seen": 78796800.0, "progress": 0.6833743328330506, "epoch": 61.50392571772454, "img/sec/core": 736.8132543947527, "core_hours_NVIDIA A100-SXM4-40GB": 30.813569230139986, "core_hours": 30.813569230139986} {"step": 77000, "global_schedule": 0.26882636547088623, "l2_grads": 1.9078720808029175, "l2_params": 265.121337890625, "l2_updates": 0.2858245372772217, "train/loss": 1.7528581619262695, "uptime": 14256.492277872001, "examples_seen": 78848000.0, "progress": 0.6838183707361261, "epoch": 61.5438892821935, "img/sec/core": 751.6554080825215, "core_hours_NVIDIA A100-SXM4-40GB": 30.832490430026652, "core_hours": 30.832490430026652} {"step": 77050, "global_schedule": 0.2681480050086975, "l2_grads": 1.8723540306091309, "l2_params": 265.0311279296875, "l2_updates": 0.28608614206314087, "train/loss": 2.897477865219116, "uptime": 14265.543613381002, "examples_seen": 78899200.0, "progress": 0.6842624086392014, "epoch": 61.58385284666246, "img/sec/core": 764.4087443648435, "core_hours_NVIDIA A100-SXM4-40GB": 30.851095950079984, "core_hours": 30.851095950079984} {"step": 77100, "global_schedule": 0.26747000217437744, "l2_grads": 1.896907091140747, "l2_params": 264.9515686035156, "l2_updates": 0.2857840359210968, "train/loss": 3.8317794799804688, "uptime": 14274.175634586, "examples_seen": 78950400.0, "progress": 0.6847064465422769, "epoch": 61.623816411131415, "img/sec/core": 741.4254260977207, "core_hours_NVIDIA A100-SXM4-40GB": 30.870278219424424, "core_hours": 30.870278219424424} {"step": 77150, "global_schedule": 0.2667926549911499, "l2_grads": 1.8587827682495117, "l2_params": 264.8701477050781, "l2_updates": 0.2832891047000885, "train/loss": 3.1150457859039307, "uptime": 14282.766246531, "examples_seen": 79001600.0, "progress": 0.6851504844453522, "epoch": 61.66377997560037, "img/sec/core": 744.9993133171672, "core_hours_NVIDIA A100-SXM4-40GB": 30.889368468191094, "core_hours": 30.889368468191094} {"step": 77200, "global_schedule": 0.2661157250404358, "l2_grads": 1.8249880075454712, "l2_params": 264.79547119140625, "l2_updates": 0.28031107783317566, "train/loss": 3.9205985069274902, "uptime": 14291.370590539, "examples_seen": 79052800.0, "progress": 0.6855945223484277, "epoch": 61.703743540069325, "img/sec/core": 743.8103351109655, "core_hours_NVIDIA A100-SXM4-40GB": 30.908489232653313, "core_hours": 30.908489232653313} {"step": 77250, "global_schedule": 0.2654394805431366, "l2_grads": 1.9342228174209595, "l2_params": 264.7070617675781, "l2_updates": 0.2812845706939697, "train/loss": 4.169645309448242, "uptime": 14300.026807272001, "examples_seen": 79104000.0, "progress": 0.6860385602515031, "epoch": 61.74370710453828, "img/sec/core": 739.3530219270575, "core_hours_NVIDIA A100-SXM4-40GB": 30.92772526983776, "core_hours": 30.92772526983776} {"step": 77300, "global_schedule": 0.2647637724876404, "l2_grads": 2.181623935699463, "l2_params": 264.62994384765625, "l2_updates": 0.28284314274787903, "train/loss": 1.995495319366455, "uptime": 14308.691178264, "examples_seen": 79155200.0, "progress": 0.6864825981545785, "epoch": 61.78367066900724, "img/sec/core": 738.6571980712714, "core_hours_NVIDIA A100-SXM4-40GB": 30.946979427597757, "core_hours": 30.946979427597757} {"step": 77350, "global_schedule": 0.26408860087394714, "l2_grads": 1.9904752969741821, "l2_params": 264.55303955078125, "l2_updates": 0.281680703163147, "train/loss": 1.9631006717681885, "uptime": 14318.437931359002, "examples_seen": 79206400.0, "progress": 0.6869266360576539, "epoch": 61.8236342334762, "img/sec/core": 656.6289242806488, "core_hours_NVIDIA A100-SXM4-40GB": 30.968638878919982, "core_hours": 30.968638878919982} {"step": 77400, "global_schedule": 0.2634139955043793, "l2_grads": 2.170727014541626, "l2_params": 264.4665222167969, "l2_updates": 0.2801317870616913, "train/loss": 1.8463289737701416, "uptime": 14328.299514838001, "examples_seen": 79257600.0, "progress": 0.6873706739607293, "epoch": 61.863597797945154, "img/sec/core": 648.9829968613824, "core_hours_NVIDIA A100-SXM4-40GB": 30.990553508873315, "core_hours": 30.990553508873315} {"step": 77450, "global_schedule": 0.2627398371696472, "l2_grads": 2.0528934001922607, "l2_params": 264.38958740234375, "l2_updates": 0.27939465641975403, "train/loss": 1.9239022731781006, "uptime": 14337.110214598999, "examples_seen": 79308800.0, "progress": 0.6878147118638047, "epoch": 61.90356136241411, "img/sec/core": 726.3895233759969, "core_hours_NVIDIA A100-SXM4-40GB": 31.010132841675535, "core_hours": 31.010132841675535} {"step": 77500, "global_schedule": 0.2620663344860077, "l2_grads": 2.0067336559295654, "l2_params": 264.3040466308594, "l2_updates": 0.2762266993522644, "train/loss": 4.261497974395752, "uptime": 14345.874629372001, "examples_seen": 79360000.0, "progress": 0.6882587497668801, "epoch": 61.94352492688307, "img/sec/core": 730.2255958622892, "core_hours_NVIDIA A100-SXM4-40GB": 31.02960931894887, "core_hours": 31.02960931894887, "val/acc@1": 0.71896, "val/loss": 1.1172862329101563, "z/secs/eval/val": 4.119351926998206} {"step": 77550, "global_schedule": 0.26139339804649353, "l2_grads": 1.9667812585830688, "l2_params": 264.2240905761719, "l2_updates": 0.27807343006134033, "train/loss": 2.1963703632354736, "uptime": 14358.347082123999, "examples_seen": 79411200.0, "progress": 0.6887027876699555, "epoch": 61.98348849135203, "img/sec/core": 766.2721825717305, "core_hours_NVIDIA A100-SXM4-40GB": 31.048169593673308, "core_hours": 31.048169593673308} {"step": 77600, "global_schedule": 0.26072102785110474, "l2_grads": 2.113900899887085, "l2_params": 264.146728515625, "l2_updates": 0.27842509746551514, "train/loss": 1.8795145750045776, "uptime": 14367.750978819002, "examples_seen": 79462400.0, "progress": 0.6891468255730309, "epoch": 62.02345205582098, "img/sec/core": 680.568939405817, "core_hours_NVIDIA A100-SXM4-40GB": 31.069067141884425, "core_hours": 31.069067141884425} {"step": 77650, "global_schedule": 0.26004910469055176, "l2_grads": 2.0700063705444336, "l2_params": 264.0623779296875, "l2_updates": 0.27648019790649414, "train/loss": 1.8246071338653564, "uptime": 14376.436254556002, "examples_seen": 79513600.0, "progress": 0.6895908634761063, "epoch": 62.06341562028994, "img/sec/core": 736.8793108934522, "core_hours_NVIDIA A100-SXM4-40GB": 31.088367754633314, "core_hours": 31.088367754633314} {"step": 77700, "global_schedule": 0.2593778371810913, "l2_grads": 1.8662885427474976, "l2_params": 263.985107421875, "l2_updates": 0.27545812726020813, "train/loss": 2.9557816982269287, "uptime": 14385.082246708002, "examples_seen": 79564800.0, "progress": 0.6900349013791818, "epoch": 62.10337918475889, "img/sec/core": 740.2273663317602, "core_hours_NVIDIA A100-SXM4-40GB": 31.107581070526646, "core_hours": 31.107581070526646} {"step": 77750, "global_schedule": 0.25870704650878906, "l2_grads": 2.098360776901245, "l2_params": 263.906005859375, "l2_updates": 0.2763466536998749, "train/loss": 1.8895992040634155, "uptime": 14393.748861875001, "examples_seen": 79616000.0, "progress": 0.6904789392822571, "epoch": 62.143342749227855, "img/sec/core": 738.4659266249186, "core_hours_NVIDIA A100-SXM4-40GB": 31.1268402153422, "core_hours": 31.1268402153422} {"step": 77800, "global_schedule": 0.2580370008945465, "l2_grads": 1.9895738363265991, "l2_params": 263.8292236328125, "l2_updates": 0.27430394291877747, "train/loss": 3.8070151805877686, "uptime": 14403.059000688, "examples_seen": 79667200.0, "progress": 0.6909229771853326, "epoch": 62.18330631369681, "img/sec/core": 687.4226183464469, "core_hours_NVIDIA A100-SXM4-40GB": 31.14752941270442, "core_hours": 31.14752941270442} {"step": 77850, "global_schedule": 0.257367342710495, "l2_grads": 2.068690299987793, "l2_params": 263.7516784667969, "l2_updates": 0.2687913775444031, "train/loss": 1.880551815032959, "uptime": 14412.617618967002, "examples_seen": 79718400.0, "progress": 0.6913670150884079, "epoch": 62.223269878165766, "img/sec/core": 669.5528384116574, "core_hours_NVIDIA A100-SXM4-40GB": 31.16877078665776, "core_hours": 31.16877078665776} {"step": 77900, "global_schedule": 0.256698340177536, "l2_grads": 2.001441240310669, "l2_params": 263.6582946777344, "l2_updates": 0.27378150820732117, "train/loss": 1.9922508001327515, "uptime": 14421.130451260002, "examples_seen": 79769600.0, "progress": 0.6918110529914834, "epoch": 62.26323344263472, "img/sec/core": 751.8061885540732, "core_hours_NVIDIA A100-SXM4-40GB": 31.18768819175331, "core_hours": 31.18768819175331} {"step": 77950, "global_schedule": 0.2560299038887024, "l2_grads": 1.9690496921539307, "l2_params": 263.57568359375, "l2_updates": 0.27819839119911194, "train/loss": 1.9896174669265747, "uptime": 14429.782732548001, "examples_seen": 79820800.0, "progress": 0.6922550908945587, "epoch": 62.30319700710368, "img/sec/core": 739.6893127916156, "core_hours_NVIDIA A100-SXM4-40GB": 31.20691548350442, "core_hours": 31.20691548350442} {"step": 78000, "global_schedule": 0.25536197423934937, "l2_grads": 1.9851211309432983, "l2_params": 263.50384521484375, "l2_updates": 0.2747802734375, "train/loss": 1.7883436679840088, "uptime": 14438.590719763999, "examples_seen": 79872000.0, "progress": 0.6926991287976342, "epoch": 62.34316057157264, "img/sec/core": 726.613225366148, "core_hours_NVIDIA A100-SXM4-40GB": 31.22648878842886, "core_hours": 31.22648878842886} {"step": 78050, "global_schedule": 0.25469470024108887, "l2_grads": 2.070124864578247, "l2_params": 263.4237060546875, "l2_updates": 0.2722698152065277, "train/loss": 1.8879821300506592, "uptime": 14448.484044793002, "examples_seen": 79923200.0, "progress": 0.6931431667007095, "epoch": 62.383124136041594, "img/sec/core": 709.523988489959, "core_hours_NVIDIA A100-SXM4-40GB": 31.2465335261022, "core_hours": 31.2465335261022} {"step": 78100, "global_schedule": 0.25402799248695374, "l2_grads": 2.1517138481140137, "l2_params": 263.345703125, "l2_updates": 0.2678561806678772, "train/loss": 1.907570481300354, "uptime": 14457.909550539001, "examples_seen": 79974400.0, "progress": 0.693587204603785, "epoch": 62.42308770051055, "img/sec/core": 679.0086571976623, "core_hours_NVIDIA A100-SXM4-40GB": 31.26747909442664, "core_hours": 31.26747909442664} {"step": 78150, "global_schedule": 0.25336188077926636, "l2_grads": 1.8648213148117065, "l2_params": 263.2578125, "l2_updates": 0.27145516872406006, "train/loss": 4.132597923278809, "uptime": 14467.300094072, "examples_seen": 80025600.0, "progress": 0.6940312425068604, "epoch": 62.463051264979505, "img/sec/core": 681.5366946024652, "core_hours_NVIDIA A100-SXM4-40GB": 31.288346968944417, "core_hours": 31.288346968944417} {"step": 78200, "global_schedule": 0.2526962161064148, "l2_grads": 1.7738457918167114, "l2_params": 263.1802978515625, "l2_updates": 0.26476889848709106, "train/loss": 3.167020082473755, "uptime": 14476.884627964, "examples_seen": 80076800.0, "progress": 0.6944752804099358, "epoch": 62.50301482944846, "img/sec/core": 667.7424350642059, "core_hours_NVIDIA A100-SXM4-40GB": 31.309645933148865, "core_hours": 31.309645933148865} {"step": 78250, "global_schedule": 0.2520313262939453, "l2_grads": 2.0169734954833984, "l2_params": 263.09954833984375, "l2_updates": 0.266150563955307, "train/loss": 4.096877098083496, "uptime": 14486.448540020001, "examples_seen": 80128000.0, "progress": 0.6949193183130112, "epoch": 62.54297839391742, "img/sec/core": 669.1822302971033, "core_hours_NVIDIA A100-SXM4-40GB": 31.330899071051086, "core_hours": 31.330899071051086} {"step": 78300, "global_schedule": 0.25136685371398926, "l2_grads": 1.9770286083221436, "l2_params": 263.0213928222656, "l2_updates": 0.2687534689903259, "train/loss": 1.837888479232788, "uptime": 14495.714542751002, "examples_seen": 80179200.0, "progress": 0.6953633562160866, "epoch": 62.58294195838638, "img/sec/core": 690.6969688868706, "core_hours_NVIDIA A100-SXM4-40GB": 31.35149018823109, "core_hours": 31.35149018823109} {"step": 78350, "global_schedule": 0.25070303678512573, "l2_grads": 1.9959869384765625, "l2_params": 262.9368896484375, "l2_updates": 0.263759046792984, "train/loss": 1.833022117614746, "uptime": 14504.399389823999, "examples_seen": 80230400.0, "progress": 0.695807394119162, "epoch": 62.62290552285533, "img/sec/core": 736.9156815552124, "core_hours_NVIDIA A100-SXM4-40GB": 31.370789848393304, "core_hours": 31.370789848393304} {"step": 78400, "global_schedule": 0.2500397264957428, "l2_grads": 2.0230531692504883, "l2_params": 262.8560791015625, "l2_updates": 0.2629542052745819, "train/loss": 2.384948253631592, "uptime": 14512.977788887, "examples_seen": 80281600.0, "progress": 0.6962514320222374, "epoch": 62.66286908732429, "img/sec/core": 746.0599527951206, "core_hours_NVIDIA A100-SXM4-40GB": 31.389852957422193, "core_hours": 31.389852957422193} {"step": 78450, "global_schedule": 0.24937710165977478, "l2_grads": 1.9191638231277466, "l2_params": 262.7812805175781, "l2_updates": 0.2651387155056, "train/loss": 3.938046932220459, "uptime": 14521.586613443002, "examples_seen": 80332800.0, "progress": 0.6966954699253128, "epoch": 62.70283265179325, "img/sec/core": 743.4232116552789, "core_hours_NVIDIA A100-SXM4-40GB": 31.408983678657755, "core_hours": 31.408983678657755} {"step": 78500, "global_schedule": 0.24871504306793213, "l2_grads": 2.0029873847961426, "l2_params": 262.7041931152344, "l2_updates": 0.26623186469078064, "train/loss": 2.0118696689605713, "uptime": 14530.184824155001, "examples_seen": 80384000.0, "progress": 0.6971395078283882, "epoch": 62.74279621626221, "img/sec/core": 744.3409116582845, "core_hours_NVIDIA A100-SXM4-40GB": 31.42809081357331, "core_hours": 31.42809081357331} {"step": 78550, "global_schedule": 0.24805358052253723, "l2_grads": 1.9623570442199707, "l2_params": 262.624267578125, "l2_updates": 0.2619405686855316, "train/loss": 3.9512736797332764, "uptime": 14538.672767786002, "examples_seen": 80435200.0, "progress": 0.6975835457314636, "epoch": 62.78275978073116, "img/sec/core": 754.0106624442572, "core_hours_NVIDIA A100-SXM4-40GB": 31.44695291053109, "core_hours": 31.44695291053109} {"step": 78600, "global_schedule": 0.24739262461662292, "l2_grads": 1.8060146570205688, "l2_params": 262.5467529296875, "l2_updates": 0.26422038674354553, "train/loss": 3.3530588150024414, "uptime": 14547.902696972002, "examples_seen": 80486400.0, "progress": 0.6980275836345391, "epoch": 62.82272334520012, "img/sec/core": 693.3964357719661, "core_hours_NVIDIA A100-SXM4-40GB": 31.467463864277754, "core_hours": 31.467463864277754} {"step": 78650, "global_schedule": 0.24673232436180115, "l2_grads": 1.9548332691192627, "l2_params": 262.4598693847656, "l2_updates": 0.26106739044189453, "train/loss": 3.698202610015869, "uptime": 14557.247500251002, "examples_seen": 80537600.0, "progress": 0.6984716215376144, "epoch": 62.86268690966907, "img/sec/core": 684.872630158218, "core_hours_NVIDIA A100-SXM4-40GB": 31.488230093786644, "core_hours": 31.488230093786644} {"step": 78700, "global_schedule": 0.2460726499557495, "l2_grads": 2.0011212825775146, "l2_params": 262.3771667480469, "l2_updates": 0.2603578567504883, "train/loss": 1.804089069366455, "uptime": 14566.510374366999, "examples_seen": 80588800.0, "progress": 0.6989156594406899, "epoch": 62.902650474138035, "img/sec/core": 690.9302576990885, "core_hours_NVIDIA A100-SXM4-40GB": 31.50881425848886, "core_hours": 31.50881425848886} {"step": 78750, "global_schedule": 0.24541357159614563, "l2_grads": 1.9653682708740234, "l2_params": 262.3023986816406, "l2_updates": 0.2615630328655243, "train/loss": 2.4337058067321777, "uptime": 14575.021785325001, "examples_seen": 80640000.0, "progress": 0.6993596973437652, "epoch": 62.94261403860699, "img/sec/core": 751.9317339485926, "core_hours_NVIDIA A100-SXM4-40GB": 31.5277285050622, "core_hours": 31.5277285050622} {"step": 78800, "global_schedule": 0.2447550892829895, "l2_grads": 1.9726552963256836, "l2_params": 262.2158203125, "l2_updates": 0.2611292004585266, "train/loss": 3.902773857116699, "uptime": 14583.56491128, "examples_seen": 80691200.0, "progress": 0.6998037352468407, "epoch": 62.982577603075946, "img/sec/core": 749.1403069218806, "core_hours_NVIDIA A100-SXM4-40GB": 31.54671322940664, "core_hours": 31.54671322940664} {"step": 78850, "global_schedule": 0.24409708380699158, "l2_grads": 2.0988752841949463, "l2_params": 262.1377258300781, "l2_updates": 0.25494077801704407, "train/loss": 3.848628044128418, "uptime": 14592.857932472, "examples_seen": 80742400.0, "progress": 0.700247773149916, "epoch": 63.0225411675449, "img/sec/core": 688.6888416341934, "core_hours_NVIDIA A100-SXM4-40GB": 31.567364387611082, "core_hours": 31.567364387611082} {"step": 78900, "global_schedule": 0.24343979358673096, "l2_grads": 2.0356085300445557, "l2_params": 262.0653991699219, "l2_updates": 0.25978365540504456, "train/loss": 4.254117965698242, "uptime": 14601.271660697, "examples_seen": 80793600.0, "progress": 0.7006918110529915, "epoch": 63.062504732013856, "img/sec/core": 760.6616031383696, "core_hours_NVIDIA A100-SXM4-40GB": 31.586061561444417, "core_hours": 31.586061561444417} {"step": 78950, "global_schedule": 0.24278298020362854, "l2_grads": 2.0704193115234375, "l2_params": 261.9845886230469, "l2_updates": 0.26203739643096924, "train/loss": 2.2274351119995117, "uptime": 14609.855533191001, "examples_seen": 80844800.0, "progress": 0.7011358489560668, "epoch": 63.10246829648282, "img/sec/core": 745.5842342105169, "core_hours_NVIDIA A100-SXM4-40GB": 31.605136833653308, "core_hours": 31.605136833653308} {"step": 79000, "global_schedule": 0.24212700128555298, "l2_grads": 2.055938720703125, "l2_params": 261.90771484375, "l2_updates": 0.25779590010643005, "train/loss": 1.8288705348968506, "uptime": 14618.339663164, "examples_seen": 80896000.0, "progress": 0.7015798868591423, "epoch": 63.142431860951774, "img/sec/core": 754.3495939321651, "core_hours_NVIDIA A100-SXM4-40GB": 31.62399045581553, "core_hours": 31.62399045581553} {"step": 79050, "global_schedule": 0.24147140979766846, "l2_grads": 2.242363214492798, "l2_params": 261.820556640625, "l2_updates": 0.25436073541641235, "train/loss": 4.111227989196777, "uptime": 14628.148858211001, "examples_seen": 80947200.0, "progress": 0.7020239247622178, "epoch": 63.18239542542073, "img/sec/core": 733.140661912891, "core_hours_NVIDIA A100-SXM4-40GB": 31.64338949199109, "core_hours": 31.64338949199109} {"step": 79100, "global_schedule": 0.24081653356552124, "l2_grads": 1.8379608392715454, "l2_params": 261.7417297363281, "l2_updates": 0.25793513655662537, "train/loss": 2.4910387992858887, "uptime": 14636.920405548999, "examples_seen": 80998400.0, "progress": 0.7024679626652931, "epoch": 63.222358989889685, "img/sec/core": 729.6318144776725, "core_hours_NVIDIA A100-SXM4-40GB": 31.662881819408863, "core_hours": 31.662881819408863} {"step": 79150, "global_schedule": 0.24016216397285461, "l2_grads": 2.0077245235443115, "l2_params": 261.660400390625, "l2_updates": 0.2571049630641937, "train/loss": 1.7384592294692993, "uptime": 14645.574230653, "examples_seen": 81049600.0, "progress": 0.7029120005683686, "epoch": 63.26232255435864, "img/sec/core": 739.5573544745746, "core_hours_NVIDIA A100-SXM4-40GB": 31.682112541862196, "core_hours": 31.682112541862196} {"step": 79200, "global_schedule": 0.2395085096359253, "l2_grads": 2.0573573112487793, "l2_params": 261.5823669433594, "l2_updates": 0.2532496452331543, "train/loss": 3.8327274322509766, "uptime": 14654.059204751002, "examples_seen": 81100800.0, "progress": 0.7033560384714439, "epoch": 63.3022861188276, "img/sec/core": 754.2745476979844, "core_hours_NVIDIA A100-SXM4-40GB": 31.700968039857756, "core_hours": 31.700968039857756} {"step": 79250, "global_schedule": 0.23885545134544373, "l2_grads": 1.890720248222351, "l2_params": 261.50860595703125, "l2_updates": 0.24937497079372406, "train/loss": 2.608376979827881, "uptime": 14662.813098343, "examples_seen": 81152000.0, "progress": 0.7038000763745194, "epoch": 63.34224968329656, "img/sec/core": 731.1032436869044, "core_hours_NVIDIA A100-SXM4-40GB": 31.720421136728866, "core_hours": 31.720421136728866} {"step": 79300, "global_schedule": 0.2382030189037323, "l2_grads": 1.8882519006729126, "l2_params": 261.43670654296875, "l2_updates": 0.25654202699661255, "train/loss": 3.01411509513855, "uptime": 14672.130970913002, "examples_seen": 81203200.0, "progress": 0.7042441142775947, "epoch": 63.38221324776551, "img/sec/core": 686.8520632707875, "core_hours_NVIDIA A100-SXM4-40GB": 31.741127520217756, "core_hours": 31.741127520217756} {"step": 79350, "global_schedule": 0.23755118250846863, "l2_grads": 2.0150866508483887, "l2_params": 261.35980224609375, "l2_updates": 0.251859575510025, "train/loss": 3.7144765853881836, "uptime": 14681.447889671, "examples_seen": 81254400.0, "progress": 0.7046881521806702, "epoch": 63.42217681223447, "img/sec/core": 686.9223791938135, "core_hours_NVIDIA A100-SXM4-40GB": 31.76183178412442, "core_hours": 31.76183178412442} {"step": 79400, "global_schedule": 0.23689988255500793, "l2_grads": 1.8456169366836548, "l2_params": 261.2840881347656, "l2_updates": 0.25609949231147766, "train/loss": 2.371910572052002, "uptime": 14690.474321709002, "examples_seen": 81305600.0, "progress": 0.7051321900837455, "epoch": 63.46214037670343, "img/sec/core": 709.0287694025883, "core_hours_NVIDIA A100-SXM4-40GB": 31.781890521986647, "core_hours": 31.781890521986647} {"step": 79450, "global_schedule": 0.2362493872642517, "l2_grads": 2.218143939971924, "l2_params": 261.2022399902344, "l2_updates": 0.24456660449504852, "train/loss": 1.8428499698638916, "uptime": 14699.617359185, "examples_seen": 81356800.0, "progress": 0.705576227986821, "epoch": 63.502103941172386, "img/sec/core": 699.9861935161887, "core_hours_NVIDIA A100-SXM4-40GB": 31.802208383044423, "core_hours": 31.802208383044423} {"step": 79500, "global_schedule": 0.2355993092060089, "l2_grads": 2.1312239170074463, "l2_params": 261.1240539550781, "l2_updates": 0.2537388205528259, "train/loss": 1.8344653844833374, "uptime": 14708.343885148, "examples_seen": 81408000.0, "progress": 0.7060202658898964, "epoch": 63.54206750564134, "img/sec/core": 733.39608764535, "core_hours_NVIDIA A100-SXM4-40GB": 31.8216006629622, "core_hours": 31.8216006629622} {"step": 79550, "global_schedule": 0.23494994640350342, "l2_grads": 1.9054251909255981, "l2_params": 261.0447692871094, "l2_updates": 0.24694500863552094, "train/loss": 2.7888615131378174, "uptime": 14716.894401994, "examples_seen": 81459200.0, "progress": 0.7064643037929718, "epoch": 63.5820310701103, "img/sec/core": 748.4927654395159, "core_hours_NVIDIA A100-SXM4-40GB": 31.84060181150887, "core_hours": 31.84060181150887} {"step": 79600, "global_schedule": 0.2343011200428009, "l2_grads": 1.933665156364441, "l2_params": 260.96600341796875, "l2_updates": 0.24659062922000885, "train/loss": 3.749941110610962, "uptime": 14725.256853329001, "examples_seen": 81510400.0, "progress": 0.7069083416960472, "epoch": 63.62199463457925, "img/sec/core": 765.3258289484093, "core_hours_NVIDIA A100-SXM4-40GB": 31.859185036697756, "core_hours": 31.859185036697756} {"step": 79650, "global_schedule": 0.2336530089378357, "l2_grads": 1.921339988708496, "l2_params": 260.8874816894531, "l2_updates": 0.24889548122882843, "train/loss": 1.894317865371704, "uptime": 14733.836096099001, "examples_seen": 81561600.0, "progress": 0.7073523795991226, "epoch": 63.661958199048215, "img/sec/core": 745.98658314924, "core_hours_NVIDIA A100-SXM4-40GB": 31.87825002063109, "core_hours": 31.87825002063109} {"step": 79700, "global_schedule": 0.23300552368164062, "l2_grads": 1.9226877689361572, "l2_params": 260.8174133300781, "l2_updates": 0.24607734382152557, "train/loss": 2.7923378944396973, "uptime": 14742.529557594002, "examples_seen": 81612800.0, "progress": 0.707796417502198, "epoch": 63.70192176351717, "img/sec/core": 736.1854657871947, "core_hours_NVIDIA A100-SXM4-40GB": 31.89756882395331, "core_hours": 31.89756882395331} {"step": 79750, "global_schedule": 0.2323586642742157, "l2_grads": 2.1262896060943604, "l2_params": 260.7362060546875, "l2_updates": 0.2449771910905838, "train/loss": 4.190243721008301, "uptime": 14751.618426965002, "examples_seen": 81664000.0, "progress": 0.7082404554052734, "epoch": 63.741885327986125, "img/sec/core": 704.1579913581277, "core_hours_NVIDIA A100-SXM4-40GB": 31.917766311444428, "core_hours": 31.917766311444428} {"step": 79800, "global_schedule": 0.23171231150627136, "l2_grads": 2.1249189376831055, "l2_params": 260.65252685546875, "l2_updates": 0.2485889345407486, "train/loss": 1.7192847728729248, "uptime": 14760.231298960001, "examples_seen": 81715200.0, "progress": 0.7086844933083488, "epoch": 63.78184889245508, "img/sec/core": 743.0738554707294, "core_hours_NVIDIA A100-SXM4-40GB": 31.93690602698887, "core_hours": 31.93690602698887} {"step": 79850, "global_schedule": 0.23106670379638672, "l2_grads": 1.967066764831543, "l2_params": 260.5743713378906, "l2_updates": 0.24396048486232758, "train/loss": 3.9692769050598145, "uptime": 14769.130021572999, "examples_seen": 81766400.0, "progress": 0.7091285312114242, "epoch": 63.821812456924036, "img/sec/core": 719.2043485715724, "core_hours_NVIDIA A100-SXM4-40GB": 31.956680966128864, "core_hours": 31.956680966128864} {"step": 79900, "global_schedule": 0.2304217517375946, "l2_grads": 2.0071566104888916, "l2_params": 260.4988098144531, "l2_updates": 0.24447107315063477, "train/loss": 2.593663454055786, "uptime": 14778.481739803, "examples_seen": 81817600.0, "progress": 0.7095725691144996, "epoch": 63.861776021393, "img/sec/core": 684.3662140576092, "core_hours_NVIDIA A100-SXM4-40GB": 31.977462562195534, "core_hours": 31.977462562195534} {"step": 79950, "global_schedule": 0.22977739572525024, "l2_grads": 2.1272470951080322, "l2_params": 260.42486572265625, "l2_updates": 0.239968404173851, "train/loss": 3.902496814727783, "uptime": 14787.827333416002, "examples_seen": 81868800.0, "progress": 0.7100166070175751, "epoch": 63.901739585861954, "img/sec/core": 684.8147121544584, "core_hours_NVIDIA A100-SXM4-40GB": 31.9982305480022, "core_hours": 31.9982305480022} {"step": 80000, "global_schedule": 0.2291336953639984, "l2_grads": 2.0872159004211426, "l2_params": 260.3489685058594, "l2_updates": 0.24204634130001068, "train/loss": 2.350252151489258, "uptime": 14797.115965299, "examples_seen": 81920000.0, "progress": 0.7104606449206504, "epoch": 63.94170315033091, "img/sec/core": 689.0142790257529, "core_hours_NVIDIA A100-SXM4-40GB": 32.01887195218664, "core_hours": 32.01887195218664, "val/acc@1": 0.72338, "val/loss": 1.1065173474121093, "z/secs/eval/val": 2.621075799001119} {"step": 80050, "global_schedule": 0.22849050164222717, "l2_grads": 2.0755722522735596, "l2_params": 260.2655334472656, "l2_updates": 0.2421909123659134, "train/loss": 4.112213134765625, "uptime": 14809.096015437002, "examples_seen": 81971200.0, "progress": 0.7109046828237259, "epoch": 63.981666714799864, "img/sec/core": 757.1429218754084, "core_hours_NVIDIA A100-SXM4-40GB": 32.03765601766664, "core_hours": 32.03765601766664} {"step": 80100, "global_schedule": 0.22784805297851562, "l2_grads": 2.0183122158050537, "l2_params": 260.1888732910156, "l2_updates": 0.23959068953990936, "train/loss": 2.8346054553985596, "uptime": 14818.756253348, "examples_seen": 82022400.0, "progress": 0.7113487207268012, "epoch": 64.02163027926882, "img/sec/core": 662.509563321854, "core_hours_NVIDIA A100-SXM4-40GB": 32.059123213024414, "core_hours": 32.059123213024414} {"step": 80150, "global_schedule": 0.22720617055892944, "l2_grads": 2.063920497894287, "l2_params": 260.10687255859375, "l2_updates": 0.24245859682559967, "train/loss": 1.8786720037460327, "uptime": 14827.258440684001, "examples_seen": 82073600.0, "progress": 0.7117927586298767, "epoch": 64.06159384373778, "img/sec/core": 752.747469218847, "core_hours_NVIDIA A100-SXM4-40GB": 32.07801696265997, "core_hours": 32.07801696265997} {"step": 80200, "global_schedule": 0.22656509280204773, "l2_grads": 2.0345780849456787, "l2_params": 260.030517578125, "l2_updates": 0.2413063496351242, "train/loss": 2.0594682693481445, "uptime": 14836.234679365001, "examples_seen": 82124800.0, "progress": 0.712236796532952, "epoch": 64.10155740820673, "img/sec/core": 712.9935184931089, "core_hours_NVIDIA A100-SXM4-40GB": 32.09796415972886, "core_hours": 32.09796415972886} {"step": 80250, "global_schedule": 0.22592449188232422, "l2_grads": 2.1021549701690674, "l2_params": 259.953125, "l2_updates": 0.24097894132137299, "train/loss": 1.7949674129486084, "uptime": 14844.873272089999, "examples_seen": 82176000.0, "progress": 0.7126808344360275, "epoch": 64.14152097267569, "img/sec/core": 740.8614115445283, "core_hours_NVIDIA A100-SXM4-40GB": 32.11716103245108, "core_hours": 32.11716103245108} {"step": 80300, "global_schedule": 0.225284606218338, "l2_grads": 1.9560414552688599, "l2_params": 259.8829040527344, "l2_updates": 0.23882660269737244, "train/loss": 2.856501340866089, "uptime": 14853.685295270001, "examples_seen": 82227200.0, "progress": 0.7131248723391028, "epoch": 64.18148453714466, "img/sec/core": 726.2804317768991, "core_hours_NVIDIA A100-SXM4-40GB": 32.136743306184414, "core_hours": 32.136743306184414} {"step": 80350, "global_schedule": 0.22464525699615479, "l2_grads": 1.9636207818984985, "l2_params": 259.8052978515625, "l2_updates": 0.2401181310415268, "train/loss": 1.7483000755310059, "uptime": 14863.013701594, "examples_seen": 82278400.0, "progress": 0.7135689102421783, "epoch": 64.2214481016136, "img/sec/core": 686.0764612637955, "core_hours_NVIDIA A100-SXM4-40GB": 32.15747309801552, "core_hours": 32.15747309801552} {"step": 80400, "global_schedule": 0.22400668263435364, "l2_grads": 2.273756265640259, "l2_params": 259.7337951660156, "l2_updates": 0.23533190786838531, "train/loss": 3.9888432025909424, "uptime": 14872.228418331999, "examples_seen": 82329600.0, "progress": 0.7140129481452537, "epoch": 64.26141166608257, "img/sec/core": 694.5411543263345, "core_hours_NVIDIA A100-SXM4-40GB": 32.17795024632219, "core_hours": 32.17795024632219} {"step": 80450, "global_schedule": 0.22336873412132263, "l2_grads": 1.992711067199707, "l2_params": 259.65869140625, "l2_updates": 0.23971955478191376, "train/loss": 1.8665276765823364, "uptime": 14881.388902775, "examples_seen": 82380800.0, "progress": 0.7144569860483291, "epoch": 64.30137523055151, "img/sec/core": 698.6530068167248, "core_hours_NVIDIA A100-SXM4-40GB": 32.198306878417746, "core_hours": 32.198306878417746} {"step": 80500, "global_schedule": 0.22273144125938416, "l2_grads": 2.092400074005127, "l2_params": 259.5801696777344, "l2_updates": 0.23858071863651276, "train/loss": 1.7099413871765137, "uptime": 14890.722434546, "examples_seen": 82432000.0, "progress": 0.7149010239514045, "epoch": 64.34133879502048, "img/sec/core": 685.6997069303183, "core_hours_NVIDIA A100-SXM4-40GB": 32.21904806013108, "core_hours": 32.21904806013108} {"step": 80550, "global_schedule": 0.2220948040485382, "l2_grads": 2.2160470485687256, "l2_params": 259.5026550292969, "l2_updates": 0.23703251779079437, "train/loss": 1.9049150943756104, "uptime": 14899.568677831, "examples_seen": 82483200.0, "progress": 0.7153450618544799, "epoch": 64.38130235948944, "img/sec/core": 723.4709462323549, "core_hours_NVIDIA A100-SXM4-40GB": 32.23870637854219, "core_hours": 32.23870637854219} {"step": 80600, "global_schedule": 0.22145870327949524, "l2_grads": 1.923701286315918, "l2_params": 259.4361877441406, "l2_updates": 0.23655317723751068, "train/loss": 2.88120436668396, "uptime": 14908.573646728002, "examples_seen": 82534400.0, "progress": 0.7157890997575553, "epoch": 64.42126592395839, "img/sec/core": 710.7187235405152, "core_hours_NVIDIA A100-SXM4-40GB": 32.258717420535525, "core_hours": 32.258717420535525} {"step": 80650, "global_schedule": 0.2208234667778015, "l2_grads": 2.0361204147338867, "l2_params": 259.3604736328125, "l2_updates": 0.23359185457229614, "train/loss": 3.2681987285614014, "uptime": 14917.193384847002, "examples_seen": 82585600.0, "progress": 0.7162331376606307, "epoch": 64.46122948842735, "img/sec/core": 742.4819538186663, "core_hours_NVIDIA A100-SXM4-40GB": 32.277872394133304, "core_hours": 32.277872394133304} {"step": 80700, "global_schedule": 0.2201886773109436, "l2_grads": 2.0528430938720703, "l2_params": 259.2804260253906, "l2_updates": 0.23681612312793732, "train/loss": 1.8619096279144287, "uptime": 14926.31040547, "examples_seen": 82636800.0, "progress": 0.7166771755637061, "epoch": 64.5011930528963, "img/sec/core": 701.9837142690793, "core_hours_NVIDIA A100-SXM4-40GB": 32.29813243996219, "core_hours": 32.29813243996219} {"step": 80750, "global_schedule": 0.21955463290214539, "l2_grads": 2.094930648803711, "l2_params": 259.2039489746094, "l2_updates": 0.23587720096111298, "train/loss": 1.8859567642211914, "uptime": 14934.88737223, "examples_seen": 82688000.0, "progress": 0.7171212134667815, "epoch": 64.54115661736526, "img/sec/core": 746.1845404190614, "core_hours_NVIDIA A100-SXM4-40GB": 32.31719236609552, "core_hours": 32.31719236609552} {"step": 80800, "global_schedule": 0.21892118453979492, "l2_grads": 1.9778313636779785, "l2_params": 259.1304931640625, "l2_updates": 0.23613549768924713, "train/loss": 3.4537439346313477, "uptime": 14943.599535786, "examples_seen": 82739200.0, "progress": 0.7175652513698569, "epoch": 64.58112018183422, "img/sec/core": 734.6051252208841, "core_hours_NVIDIA A100-SXM4-40GB": 32.3365527295533, "core_hours": 32.3365527295533} {"step": 80850, "global_schedule": 0.21828845143318176, "l2_grads": 1.8957980871200562, "l2_params": 259.05621337890625, "l2_updates": 0.2331525981426239, "train/loss": 2.861703395843506, "uptime": 14952.010569977001, "examples_seen": 82790400.0, "progress": 0.7180092892729323, "epoch": 64.62108374630317, "img/sec/core": 760.9052412183468, "core_hours_NVIDIA A100-SXM4-40GB": 32.35524391664441, "core_hours": 32.35524391664441} {"step": 80900, "global_schedule": 0.21765640377998352, "l2_grads": 1.954092264175415, "l2_params": 258.9743957519531, "l2_updates": 0.23042026162147522, "train/loss": 2.71755313873291, "uptime": 14960.449223116002, "examples_seen": 82841600.0, "progress": 0.7184533271760077, "epoch": 64.66104731077213, "img/sec/core": 758.4148672281706, "core_hours_NVIDIA A100-SXM4-40GB": 32.37399647917553, "core_hours": 32.37399647917553} {"step": 80950, "global_schedule": 0.2170250117778778, "l2_grads": 2.0813148021698, "l2_params": 258.899169921875, "l2_updates": 0.2318401336669922, "train/loss": 1.8073136806488037, "uptime": 14968.793504755, "examples_seen": 82892800.0, "progress": 0.7188973650790832, "epoch": 64.7010108752411, "img/sec/core": 766.9923280260447, "core_hours_NVIDIA A100-SXM4-40GB": 32.39253932726219, "core_hours": 32.39253932726219} {"step": 81000, "global_schedule": 0.21639418601989746, "l2_grads": 2.090543746948242, "l2_params": 258.8151550292969, "l2_updates": 0.22894501686096191, "train/loss": 3.982367992401123, "uptime": 14977.186703087, "examples_seen": 82944000.0, "progress": 0.7193414029821585, "epoch": 64.74097443971004, "img/sec/core": 762.5221931905718, "core_hours_NVIDIA A100-SXM4-40GB": 32.41119087911108, "core_hours": 32.41119087911108} {"step": 81050, "global_schedule": 0.2157641053199768, "l2_grads": 1.9608007669448853, "l2_params": 258.74383544921875, "l2_updates": 0.23233452439308167, "train/loss": 2.7431929111480713, "uptime": 14986.875814792, "examples_seen": 82995200.0, "progress": 0.719785440885234, "epoch": 64.780938004179, "img/sec/core": 708.3078080873598, "core_hours_NVIDIA A100-SXM4-40GB": 32.43127003404886, "core_hours": 32.43127003404886} {"step": 81100, "global_schedule": 0.21513471007347107, "l2_grads": 2.0995852947235107, "l2_params": 258.6761169433594, "l2_updates": 0.22881737351417542, "train/loss": 2.2118494510650635, "uptime": 14996.089385963, "examples_seen": 83046400.0, "progress": 0.7202294787883093, "epoch": 64.82090156864795, "img/sec/core": 694.6275099219233, "core_hours_NVIDIA A100-SXM4-40GB": 32.45174463665108, "core_hours": 32.45174463665108} {"step": 81150, "global_schedule": 0.21450600028038025, "l2_grads": 1.902459740638733, "l2_params": 258.6026916503906, "l2_updates": 0.2274370789527893, "train/loss": 3.3341078758239746, "uptime": 15004.497958712001, "examples_seen": 83097600.0, "progress": 0.7206735166913848, "epoch": 64.86086513311692, "img/sec/core": 761.1279810547727, "core_hours_NVIDIA A100-SXM4-40GB": 32.47043035387108, "core_hours": 32.47043035387108} {"step": 81200, "global_schedule": 0.21387791633605957, "l2_grads": 1.9911279678344727, "l2_params": 258.5281982421875, "l2_updates": 0.228777676820755, "train/loss": 2.3717873096466064, "uptime": 15012.966452597999, "examples_seen": 83148800.0, "progress": 0.7211175545944601, "epoch": 64.90082869758588, "img/sec/core": 755.7424125419079, "core_hours_NVIDIA A100-SXM4-40GB": 32.489249229173296, "core_hours": 32.489249229173296} {"step": 81250, "global_schedule": 0.21325042843818665, "l2_grads": 1.9299007654190063, "l2_params": 258.4499206542969, "l2_updates": 0.2253800928592682, "train/loss": 3.1956777572631836, "uptime": 15021.263436042, "examples_seen": 83200000.0, "progress": 0.7215615924975356, "epoch": 64.94079226205483, "img/sec/core": 771.3646825012602, "core_hours_NVIDIA A100-SXM4-40GB": 32.507686970159966, "core_hours": 32.507686970159966} {"step": 81300, "global_schedule": 0.2126237154006958, "l2_grads": 2.2255842685699463, "l2_params": 258.37860107421875, "l2_updates": 0.22936347126960754, "train/loss": 1.847398042678833, "uptime": 15029.826726436002, "examples_seen": 83251200.0, "progress": 0.7220056304006109, "epoch": 64.98075582652379, "img/sec/core": 747.3762660767145, "core_hours_NVIDIA A100-SXM4-40GB": 32.526716504368856, "core_hours": 32.526716504368856} {"step": 81350, "global_schedule": 0.21199756860733032, "l2_grads": 2.1091396808624268, "l2_params": 258.3111877441406, "l2_updates": 0.22143584489822388, "train/loss": 3.668870687484741, "uptime": 15039.761281778001, "examples_seen": 83302400.0, "progress": 0.7224496683036864, "epoch": 65.02071939099274, "img/sec/core": 644.216049906493, "core_hours_NVIDIA A100-SXM4-40GB": 32.54879329401775, "core_hours": 32.54879329401775} {"step": 81400, "global_schedule": 0.2113722860813141, "l2_grads": 2.1826670169830322, "l2_params": 258.2403564453125, "l2_updates": 0.2219788134098053, "train/loss": 1.76615571975708, "uptime": 15048.819740189001, "examples_seen": 83353600.0, "progress": 0.7228937062067619, "epoch": 65.0606829554617, "img/sec/core": 706.5219830592957, "core_hours_NVIDIA A100-SXM4-40GB": 32.56892320159775, "core_hours": 32.56892320159775} {"step": 81450, "global_schedule": 0.21074751019477844, "l2_grads": 1.9984699487686157, "l2_params": 258.1649475097656, "l2_updates": 0.2221655398607254, "train/loss": 2.1921517848968506, "uptime": 15057.000438140001, "examples_seen": 83404800.0, "progress": 0.7233377441098372, "epoch": 65.10064651993066, "img/sec/core": 782.3293364862012, "core_hours_NVIDIA A100-SXM4-40GB": 32.58710253037775, "core_hours": 32.58710253037775} {"step": 81500, "global_schedule": 0.2101234793663025, "l2_grads": 1.9786627292633057, "l2_params": 258.08984375, "l2_updates": 0.22170484066009521, "train/loss": 3.147709846496582, "uptime": 15065.410649399999, "examples_seen": 83456000.0, "progress": 0.7237817820129127, "epoch": 65.14061008439961, "img/sec/core": 760.9796950572476, "core_hours_NVIDIA A100-SXM4-40GB": 32.6057918887333, "core_hours": 32.6057918887333} {"step": 81550, "global_schedule": 0.2095000445842743, "l2_grads": 1.9812692403793335, "l2_params": 258.01007080078125, "l2_updates": 0.22447802126407623, "train/loss": 2.712017297744751, "uptime": 15074.026646627002, "examples_seen": 83507200.0, "progress": 0.724225819915988, "epoch": 65.18057364886857, "img/sec/core": 742.8043244886111, "core_hours_NVIDIA A100-SXM4-40GB": 32.62493854923775, "core_hours": 32.62493854923775} {"step": 81600, "global_schedule": 0.20887741446495056, "l2_grads": 2.227294445037842, "l2_params": 257.9317321777344, "l2_updates": 0.219906747341156, "train/loss": 4.162457466125488, "uptime": 15082.397527716, "examples_seen": 83558400.0, "progress": 0.7246698578190635, "epoch": 65.22053721333752, "img/sec/core": 764.5551205369894, "core_hours_NVIDIA A100-SXM4-40GB": 32.6435405072133, "core_hours": 32.6435405072133} {"step": 81650, "global_schedule": 0.20825543999671936, "l2_grads": 2.029662847518921, "l2_params": 257.8605041503906, "l2_updates": 0.21887215971946716, "train/loss": 2.9330594539642334, "uptime": 15090.777831244, "examples_seen": 83609600.0, "progress": 0.7251138957221388, "epoch": 65.26050077780648, "img/sec/core": 763.6954889064209, "core_hours_NVIDIA A100-SXM4-40GB": 32.66216340394219, "core_hours": 32.66216340394219} {"step": 81700, "global_schedule": 0.20763415098190308, "l2_grads": 2.091630458831787, "l2_params": 257.7862548828125, "l2_updates": 0.22239191830158234, "train/loss": 1.6699198484420776, "uptime": 15099.105320098, "examples_seen": 83660800.0, "progress": 0.7255579336252143, "epoch": 65.30046434227545, "img/sec/core": 768.5390052399614, "core_hours_NVIDIA A100-SXM4-40GB": 32.68066893472886, "core_hours": 32.68066893472886} {"step": 81750, "global_schedule": 0.2070135474205017, "l2_grads": 2.2052626609802246, "l2_params": 257.7181091308594, "l2_updates": 0.2215188592672348, "train/loss": 1.7723957300186157, "uptime": 15107.667399693999, "examples_seen": 83712000.0, "progress": 0.7260019715282896, "epoch": 65.3404279067444, "img/sec/core": 747.4819555509669, "core_hours_NVIDIA A100-SXM4-40GB": 32.69969577827552, "core_hours": 32.69969577827552} {"step": 81800, "global_schedule": 0.2063935101032257, "l2_grads": 2.1074178218841553, "l2_params": 257.6441955566406, "l2_updates": 0.22018975019454956, "train/loss": 2.113417387008667, "uptime": 15116.395804942002, "examples_seen": 83763200.0, "progress": 0.7264460094313651, "epoch": 65.38039147121336, "img/sec/core": 733.2381824806446, "core_hours_NVIDIA A100-SXM4-40GB": 32.719092234382195, "core_hours": 32.719092234382195} {"step": 81850, "global_schedule": 0.20577427744865417, "l2_grads": 2.078796148300171, "l2_params": 257.56964111328125, "l2_updates": 0.22002547979354858, "train/loss": 3.592968225479126, "uptime": 15125.628323437, "examples_seen": 83814400.0, "progress": 0.7268900473344405, "epoch": 65.4203550356823, "img/sec/core": 693.2019690474425, "core_hours_NVIDIA A100-SXM4-40GB": 32.739608942148855, "core_hours": 32.739608942148855} {"step": 81900, "global_schedule": 0.20515576004981995, "l2_grads": 2.3303112983703613, "l2_params": 257.49676513671875, "l2_updates": 0.21717742085456848, "train/loss": 4.052233695983887, "uptime": 15134.247975156, "examples_seen": 83865600.0, "progress": 0.7273340852375159, "epoch": 65.46031860015127, "img/sec/core": 742.4893961658131, "core_hours_NVIDIA A100-SXM4-40GB": 32.75876372374663, "core_hours": 32.75876372374663} {"step": 81950, "global_schedule": 0.20453789830207825, "l2_grads": 2.164747714996338, "l2_params": 257.4278259277344, "l2_updates": 0.21807904541492462, "train/loss": 3.7595272064208984, "uptime": 15142.510167123002, "examples_seen": 83916800.0, "progress": 0.7277781231405913, "epoch": 65.50028216462023, "img/sec/core": 774.6128419142024, "core_hours_NVIDIA A100-SXM4-40GB": 32.77712415033997, "core_hours": 32.77712415033997} {"step": 82000, "global_schedule": 0.2039206326007843, "l2_grads": 2.1189396381378174, "l2_params": 257.3543701171875, "l2_updates": 0.2186998873949051, "train/loss": 1.7575966119766235, "uptime": 15151.055267009999, "examples_seen": 83968000.0, "progress": 0.7282221610436667, "epoch": 65.54024572908918, "img/sec/core": 748.9672542902886, "core_hours_NVIDIA A100-SXM4-40GB": 32.79611326119996, "core_hours": 32.79611326119996} {"step": 82050, "global_schedule": 0.20330417156219482, "l2_grads": 1.9774010181427002, "l2_params": 257.2804260253906, "l2_updates": 0.2166510820388794, "train/loss": 3.4072344303131104, "uptime": 15160.006492272, "examples_seen": 84019200.0, "progress": 0.7286661989467421, "epoch": 65.58020929355814, "img/sec/core": 770.5632022992662, "core_hours_NVIDIA A100-SXM4-40GB": 32.81457017969774, "core_hours": 32.81457017969774} {"step": 82100, "global_schedule": 0.20268842577934265, "l2_grads": 2.136991024017334, "l2_params": 257.21435546875, "l2_updates": 0.2145930677652359, "train/loss": 3.910109043121338, "uptime": 15169.291268572999, "examples_seen": 84070400.0, "progress": 0.7291102368498175, "epoch": 65.62017285802709, "img/sec/core": 689.3003980409347, "core_hours_NVIDIA A100-SXM4-40GB": 32.83520301592218, "core_hours": 32.83520301592218} {"step": 82150, "global_schedule": 0.202073335647583, "l2_grads": 2.0215446949005127, "l2_params": 257.139404296875, "l2_updates": 0.21488437056541443, "train/loss": 3.077387809753418, "uptime": 15178.558642835002, "examples_seen": 84121600.0, "progress": 0.7295542747528929, "epoch": 65.66013642249605, "img/sec/core": 690.5947487456866, "core_hours_NVIDIA A100-SXM4-40GB": 32.855797180948855, "core_hours": 32.855797180948855} {"step": 82200, "global_schedule": 0.2014588713645935, "l2_grads": 2.2366039752960205, "l2_params": 257.0704650878906, "l2_updates": 0.21402649581432343, "train/loss": 1.837536096572876, "uptime": 15187.271047748001, "examples_seen": 84172800.0, "progress": 0.7299983126559683, "epoch": 65.70009998696501, "img/sec/core": 734.5847746872467, "core_hours_NVIDIA A100-SXM4-40GB": 32.87515808075552, "core_hours": 32.87515808075552} {"step": 82250, "global_schedule": 0.20084521174430847, "l2_grads": 2.1497135162353516, "l2_params": 256.9999084472656, "l2_updates": 0.21409271657466888, "train/loss": 3.9937448501586914, "uptime": 15195.664303463001, "examples_seen": 84224000.0, "progress": 0.7304423505590437, "epoch": 65.74006355143396, "img/sec/core": 762.5169799797892, "core_hours_NVIDIA A100-SXM4-40GB": 32.89380976012219, "core_hours": 32.89380976012219} {"step": 82300, "global_schedule": 0.20023223757743835, "l2_grads": 2.252614974975586, "l2_params": 256.9214782714844, "l2_updates": 0.2145504355430603, "train/loss": 4.182644367218018, "uptime": 15204.232304337, "examples_seen": 84275200.0, "progress": 0.7308863884621192, "epoch": 65.78002711590293, "img/sec/core": 746.9653766519109, "core_hours_NVIDIA A100-SXM4-40GB": 32.912849762064404, "core_hours": 32.912849762064404} {"step": 82350, "global_schedule": 0.19961994886398315, "l2_grads": 2.133863687515259, "l2_params": 256.8513488769531, "l2_updates": 0.21587830781936646, "train/loss": 1.6839476823806763, "uptime": 15212.620937869002, "examples_seen": 84326400.0, "progress": 0.7313304263651945, "epoch": 65.81999068037187, "img/sec/core": 762.9371310100013, "core_hours_NVIDIA A100-SXM4-40GB": 32.9314911699133, "core_hours": 32.9314911699133} {"step": 82400, "global_schedule": 0.19900831580162048, "l2_grads": 1.9874120950698853, "l2_params": 256.7781982421875, "l2_updates": 0.21060062944889069, "train/loss": 3.3365817070007324, "uptime": 15221.027960597, "examples_seen": 84377600.0, "progress": 0.73177446426827, "epoch": 65.85995424484084, "img/sec/core": 761.2683118704145, "core_hours_NVIDIA A100-SXM4-40GB": 32.95017344264219, "core_hours": 32.95017344264219} {"step": 82450, "global_schedule": 0.1983974277973175, "l2_grads": 2.308839797973633, "l2_params": 256.7115173339844, "l2_updates": 0.2118336260318756, "train/loss": 4.17024040222168, "uptime": 15230.336773942001, "examples_seen": 84428800.0, "progress": 0.7322185021713453, "epoch": 65.8999178093098, "img/sec/core": 687.5204994240797, "core_hours_NVIDIA A100-SXM4-40GB": 32.970859694519966, "core_hours": 32.970859694519966} {"step": 82500, "global_schedule": 0.19778728485107422, "l2_grads": 2.0884275436401367, "l2_params": 256.6373596191406, "l2_updates": 0.2131163328886032, "train/loss": 1.862512469291687, "uptime": 15239.645862327, "examples_seen": 84480000.0, "progress": 0.7326625400744208, "epoch": 65.93988137377875, "img/sec/core": 687.5001864107077, "core_hours_NVIDIA A100-SXM4-40GB": 32.99154655759774, "core_hours": 32.99154655759774, "val/acc@1": 0.73086, "val/loss": 1.083975782470703, "z/secs/eval/val": 2.636672645003273} {"step": 82550, "global_schedule": 0.1971777379512787, "l2_grads": 2.034616231918335, "l2_params": 256.56951904296875, "l2_updates": 0.20986509323120117, "train/loss": 3.513052225112915, "uptime": 15251.128929171, "examples_seen": 84531200.0, "progress": 0.7331065779774961, "epoch": 65.97984493824771, "img/sec/core": 723.5203399004635, "core_hours_NVIDIA A100-SXM4-40GB": 33.0112035339644, "core_hours": 33.0112035339644} {"step": 82600, "global_schedule": 0.19656911492347717, "l2_grads": 1.9599123001098633, "l2_params": 256.4977722167969, "l2_updates": 0.2088521271944046, "train/loss": 2.2481391429901123, "uptime": 15260.496191855002, "examples_seen": 84582400.0, "progress": 0.7335506158805716, "epoch": 66.01980850271666, "img/sec/core": 683.230546201142, "core_hours_NVIDIA A100-SXM4-40GB": 33.03201967326218, "core_hours": 33.03201967326218} {"step": 82650, "global_schedule": 0.19596099853515625, "l2_grads": 1.9959125518798828, "l2_params": 256.427978515625, "l2_updates": 0.2094622403383255, "train/loss": 2.3755688667297363, "uptime": 15268.963533703, "examples_seen": 84633600.0, "progress": 0.7339946537836469, "epoch": 66.05977206718562, "img/sec/core": 755.8452363079315, "core_hours_NVIDIA A100-SXM4-40GB": 33.05083598847995, "core_hours": 33.05083598847995} {"step": 82700, "global_schedule": 0.1953536868095398, "l2_grads": 2.1653528213500977, "l2_params": 256.3586730957031, "l2_updates": 0.20864319801330566, "train/loss": 4.06547737121582, "uptime": 15277.526896589, "examples_seen": 84684800.0, "progress": 0.7344386916867224, "epoch": 66.09973563165458, "img/sec/core": 747.3699392632446, "core_hours_NVIDIA A100-SXM4-40GB": 33.069865683782176, "core_hours": 33.069865683782176} {"step": 82750, "global_schedule": 0.19474700093269348, "l2_grads": 2.1388328075408936, "l2_params": 256.2879333496094, "l2_updates": 0.20382435619831085, "train/loss": 3.976620674133301, "uptime": 15286.092743378, "examples_seen": 84736000.0, "progress": 0.7348827295897978, "epoch": 66.13969919612353, "img/sec/core": 747.1532187827022, "core_hours_NVIDIA A100-SXM4-40GB": 33.08890089886884, "core_hours": 33.08890089886884} {"step": 82800, "global_schedule": 0.19414111971855164, "l2_grads": 2.1521270275115967, "l2_params": 256.2146911621094, "l2_updates": 0.20422087609767914, "train/loss": 2.258228302001953, "uptime": 15294.512748447001, "examples_seen": 84787200.0, "progress": 0.7353267674928732, "epoch": 66.17966276059249, "img/sec/core": 760.0945542849847, "core_hours_NVIDIA A100-SXM4-40GB": 33.1076120212444, "core_hours": 33.1076120212444} {"step": 82850, "global_schedule": 0.1935359537601471, "l2_grads": 2.1755778789520264, "l2_params": 256.1382751464844, "l2_updates": 0.2085544615983963, "train/loss": 1.8675075769424438, "uptime": 15303.190944283999, "examples_seen": 84838400.0, "progress": 0.7357708053959486, "epoch": 66.21962632506145, "img/sec/core": 737.4804763814024, "core_hours_NVIDIA A100-SXM4-40GB": 33.12689690088217, "core_hours": 33.12689690088217} {"step": 82900, "global_schedule": 0.19293150305747986, "l2_grads": 2.0016725063323975, "l2_params": 256.0791320800781, "l2_updates": 0.20456920564174652, "train/loss": 2.652169704437256, "uptime": 15312.311320615, "examples_seen": 84889600.0, "progress": 0.736214843299024, "epoch": 66.2595898895304, "img/sec/core": 701.7254297112939, "core_hours_NVIDIA A100-SXM4-40GB": 33.14716440383995, "core_hours": 33.14716440383995} {"step": 82950, "global_schedule": 0.19232767820358276, "l2_grads": 2.172696828842163, "l2_params": 255.99754333496094, "l2_updates": 0.20361225306987762, "train/loss": 4.119892120361328, "uptime": 15321.021680062002, "examples_seen": 84940800.0, "progress": 0.7366588812020994, "epoch": 66.29955345399937, "img/sec/core": 734.7572782662013, "core_hours_NVIDIA A100-SXM4-40GB": 33.16652075816663, "core_hours": 33.16652075816663} {"step": 83000, "global_schedule": 0.19172465801239014, "l2_grads": 2.1548919677734375, "l2_params": 255.93292236328125, "l2_updates": 0.20550447702407837, "train/loss": 1.7179076671600342, "uptime": 15329.716187762, "examples_seen": 84992000.0, "progress": 0.7371029191051748, "epoch": 66.33951701846831, "img/sec/core": 736.0968810230987, "core_hours_NVIDIA A100-SXM4-40GB": 33.18584188638884, "core_hours": 33.18584188638884} {"step": 83050, "global_schedule": 0.1911223828792572, "l2_grads": 1.9534547328948975, "l2_params": 255.85874938964844, "l2_updates": 0.20077602565288544, "train/loss": 3.4035472869873047, "uptime": 15339.349345128, "examples_seen": 85043200.0, "progress": 0.7375469570082502, "epoch": 66.37948058293728, "img/sec/core": 745.4809978882327, "core_hours_NVIDIA A100-SXM4-40GB": 33.20491980019552, "core_hours": 33.20491980019552} {"step": 83100, "global_schedule": 0.19052082300186157, "l2_grads": 2.142289638519287, "l2_params": 255.79107666015625, "l2_updates": 0.20296472311019897, "train/loss": 1.6605578660964966, "uptime": 15348.236301892002, "examples_seen": 85094400.0, "progress": 0.7379909949113256, "epoch": 66.41944414740624, "img/sec/core": 720.1565361410771, "core_hours_NVIDIA A100-SXM4-40GB": 33.22466859300441, "core_hours": 33.22466859300441} {"step": 83150, "global_schedule": 0.18991997838020325, "l2_grads": 2.075385093688965, "l2_params": 255.722412109375, "l2_updates": 0.20107577741146088, "train/loss": 2.4917244911193848, "uptime": 15356.716812481, "examples_seen": 85145600.0, "progress": 0.738435032814401, "epoch": 66.45940771187519, "img/sec/core": 754.6715416290432, "core_hours_NVIDIA A100-SXM4-40GB": 33.243514172091075, "core_hours": 33.243514172091075} {"step": 83200, "global_schedule": 0.18931978940963745, "l2_grads": 2.100965738296509, "l2_params": 255.65225219726562, "l2_updates": 0.20228159427642822, "train/loss": 3.8967134952545166, "uptime": 15365.680706357, "examples_seen": 85196800.0, "progress": 0.7388790707174765, "epoch": 66.49937127634415, "img/sec/core": 713.975431718961, "core_hours_NVIDIA A100-SXM4-40GB": 33.26343393625996, "core_hours": 33.26343393625996} {"step": 83250, "global_schedule": 0.18872040510177612, "l2_grads": 2.1676180362701416, "l2_params": 255.58534240722656, "l2_updates": 0.20070980489253998, "train/loss": 3.647077798843384, "uptime": 15374.809771404, "examples_seen": 85248000.0, "progress": 0.7393231086205518, "epoch": 66.5393348408131, "img/sec/core": 701.0575526683474, "core_hours_NVIDIA A100-SXM4-40GB": 33.28372074747551, "core_hours": 33.28372074747551} {"step": 83300, "global_schedule": 0.1881217658519745, "l2_grads": 2.1121575832366943, "l2_params": 255.51441955566406, "l2_updates": 0.19642944633960724, "train/loss": 2.0588622093200684, "uptime": 15383.451665488, "examples_seen": 85299200.0, "progress": 0.7397671465236273, "epoch": 66.57929840528206, "img/sec/core": 740.5783891575722, "core_hours_NVIDIA A100-SXM4-40GB": 33.302924956551074, "core_hours": 33.302924956551074} {"step": 83350, "global_schedule": 0.18752384185791016, "l2_grads": 2.4286108016967773, "l2_params": 255.4461669921875, "l2_updates": 0.19805553555488586, "train/loss": 1.8634874820709229, "uptime": 15391.967096203001, "examples_seen": 85350400.0, "progress": 0.7402111844267026, "epoch": 66.61926196975102, "img/sec/core": 751.5767803413556, "core_hours_NVIDIA A100-SXM4-40GB": 33.32184813591774, "core_hours": 33.32184813591774} {"step": 83400, "global_schedule": 0.18692657351493835, "l2_grads": 2.3773322105407715, "l2_params": 255.37606811523438, "l2_updates": 0.19939075410366058, "train/loss": 1.7541465759277344, "uptime": 15400.444768973999, "examples_seen": 85401600.0, "progress": 0.7406552223297781, "epoch": 66.65922553421997, "img/sec/core": 754.9241605425613, "core_hours_NVIDIA A100-SXM4-40GB": 33.340687408742184, "core_hours": 33.340687408742184} {"step": 83450, "global_schedule": 0.18633010983467102, "l2_grads": 2.1751222610473633, "l2_params": 255.30477905273438, "l2_updates": 0.2016160488128662, "train/loss": 1.7564024925231934, "uptime": 15408.969101259, "examples_seen": 85452800.0, "progress": 0.7410992602328534, "epoch": 66.69918909868893, "img/sec/core": 750.7919431134545, "core_hours_NVIDIA A100-SXM4-40GB": 33.359630369375516, "core_hours": 33.359630369375516} {"step": 83500, "global_schedule": 0.18573430180549622, "l2_grads": 2.011078357696533, "l2_params": 255.23460388183594, "l2_updates": 0.19804957509040833, "train/loss": 2.329171895980835, "uptime": 15417.424774637, "examples_seen": 85504000.0, "progress": 0.7415432981359289, "epoch": 66.73915266315788, "img/sec/core": 756.8882706196803, "core_hours_NVIDIA A100-SXM4-40GB": 33.37842075465996, "core_hours": 33.37842075465996} {"step": 83550, "global_schedule": 0.18513941764831543, "l2_grads": 2.1604552268981934, "l2_params": 255.17242431640625, "l2_updates": 0.19726116955280304, "train/loss": 3.9177045822143555, "uptime": 15425.957053443, "examples_seen": 85555200.0, "progress": 0.7419873360390042, "epoch": 66.77911622762684, "img/sec/core": 750.0926945213342, "core_hours_NVIDIA A100-SXM4-40GB": 33.39738137422885, "core_hours": 33.39738137422885} {"step": 83600, "global_schedule": 0.18454506993293762, "l2_grads": 2.161759853363037, "l2_params": 255.09996032714844, "l2_updates": 0.19661100208759308, "train/loss": 1.6669350862503052, "uptime": 15434.483825194, "examples_seen": 85606400.0, "progress": 0.7424313739420797, "epoch": 66.8190797920958, "img/sec/core": 750.5771453598147, "core_hours_NVIDIA A100-SXM4-40GB": 33.41632975589774, "core_hours": 33.41632975589774} {"step": 83650, "global_schedule": 0.18395158648490906, "l2_grads": 2.197659730911255, "l2_params": 255.0259246826172, "l2_updates": 0.19720475375652313, "train/loss": 1.7971177101135254, "uptime": 15443.044544620001, "examples_seen": 85657600.0, "progress": 0.7428754118451552, "epoch": 66.85904335656475, "img/sec/core": 747.6007192294637, "core_hours_NVIDIA A100-SXM4-40GB": 33.435353576844406, "core_hours": 33.435353576844406} {"step": 83700, "global_schedule": 0.1833588182926178, "l2_grads": 2.3442811965942383, "l2_params": 254.95758056640625, "l2_updates": 0.19627340137958527, "train/loss": 1.7352526187896729, "uptime": 15451.906256327, "examples_seen": 85708800.0, "progress": 0.7433194497482305, "epoch": 66.89900692103372, "img/sec/core": 722.2081028595564, "core_hours_NVIDIA A100-SXM4-40GB": 33.455046269526626, "core_hours": 33.455046269526626} {"step": 83750, "global_schedule": 0.18276670575141907, "l2_grads": 2.0807816982269287, "l2_params": 254.8844451904297, "l2_updates": 0.19148345291614532, "train/loss": 3.590458393096924, "uptime": 15461.078816952, "examples_seen": 85760000.0, "progress": 0.743763487651306, "epoch": 66.93897048550267, "img/sec/core": 697.7331915971795, "core_hours_NVIDIA A100-SXM4-40GB": 33.47542973758218, "core_hours": 33.47542973758218} {"step": 83800, "global_schedule": 0.18217551708221436, "l2_grads": 2.2227272987365723, "l2_params": 254.81353759765625, "l2_updates": 0.18999344110488892, "train/loss": 3.1273467540740967, "uptime": 15470.392866953001, "examples_seen": 85811200.0, "progress": 0.7442075255543813, "epoch": 66.97893404997163, "img/sec/core": 687.1339534694326, "core_hours_NVIDIA A100-SXM4-40GB": 33.496127626473296, "core_hours": 33.496127626473296} {"step": 83850, "global_schedule": 0.181584894657135, "l2_grads": 2.059793710708618, "l2_params": 254.74362182617188, "l2_updates": 0.19325554370880127, "train/loss": 2.1392717361450195, "uptime": 15480.439846306, "examples_seen": 85862400.0, "progress": 0.7446515634574568, "epoch": 67.01889761444059, "img/sec/core": 637.0073805406493, "core_hours_NVIDIA A100-SXM4-40GB": 33.518454247257736, "core_hours": 33.518454247257736} {"step": 83900, "global_schedule": 0.18099510669708252, "l2_grads": 2.208024263381958, "l2_params": 254.67327880859375, "l2_updates": 0.19121578335762024, "train/loss": 1.8868129253387451, "uptime": 15489.581689285, "examples_seen": 85913600.0, "progress": 0.7450956013605321, "epoch": 67.05886117890954, "img/sec/core": 700.0776555342501, "core_hours_NVIDIA A100-SXM4-40GB": 33.538769453877734, "core_hours": 33.538769453877734} {"step": 83950, "global_schedule": 0.18040597438812256, "l2_grads": 2.1237199306488037, "l2_params": 254.60581970214844, "l2_updates": 0.19111241400241852, "train/loss": 3.67325496673584, "uptime": 15498.072112430002, "examples_seen": 85964800.0, "progress": 0.7455396392636076, "epoch": 67.0988247433785, "img/sec/core": 753.7904637612278, "core_hours_NVIDIA A100-SXM4-40GB": 33.55763706086663, "core_hours": 33.55763706086663} {"step": 84000, "global_schedule": 0.17981767654418945, "l2_grads": 2.1822309494018555, "l2_params": 254.53707885742188, "l2_updates": 0.19145554304122925, "train/loss": 4.129868984222412, "uptime": 15506.487111072, "examples_seen": 86016000.0, "progress": 0.7459836771666829, "epoch": 67.13878830784745, "img/sec/core": 760.5467656356582, "core_hours_NVIDIA A100-SXM4-40GB": 33.576337057848846, "core_hours": 33.576337057848846} {"step": 84050, "global_schedule": 0.17923015356063843, "l2_grads": 2.2286081314086914, "l2_params": 254.47401428222656, "l2_updates": 0.1932808756828308, "train/loss": 1.6114675998687744, "uptime": 15515.509109587, "examples_seen": 86067200.0, "progress": 0.7464277150697584, "epoch": 67.17875187231641, "img/sec/core": 796.8813565998092, "core_hours_NVIDIA A100-SXM4-40GB": 33.59418441003551, "core_hours": 33.59418441003551} {"step": 84100, "global_schedule": 0.1786433458328247, "l2_grads": 2.1793229579925537, "l2_params": 254.40536499023438, "l2_updates": 0.1913755089044571, "train/loss": 1.7879338264465332, "uptime": 15524.099307617, "examples_seen": 86118400.0, "progress": 0.7468717529728338, "epoch": 67.21871543678537, "img/sec/core": 745.0352107889245, "core_hours_NVIDIA A100-SXM4-40GB": 33.61327373899107, "core_hours": 33.61327373899107} {"step": 84150, "global_schedule": 0.1780572235584259, "l2_grads": 1.9865204095840454, "l2_params": 254.3383026123047, "l2_updates": 0.18947625160217285, "train/loss": 1.922853708267212, "uptime": 15533.252788537002, "examples_seen": 86169600.0, "progress": 0.7473157908759092, "epoch": 67.25867900125432, "img/sec/core": 699.1875610965467, "core_hours_NVIDIA A100-SXM4-40GB": 33.63361480770218, "core_hours": 33.63361480770218} {"step": 84200, "global_schedule": 0.17747193574905396, "l2_grads": 2.097302198410034, "l2_params": 254.27035522460938, "l2_updates": 0.18846064805984497, "train/loss": 2.749537944793701, "uptime": 15542.041477313001, "examples_seen": 86220800.0, "progress": 0.7477598287789846, "epoch": 67.29864256572328, "img/sec/core": 728.2087422958119, "core_hours_NVIDIA A100-SXM4-40GB": 33.653145227204405, "core_hours": 33.653145227204405} {"step": 84250, "global_schedule": 0.1768874228000641, "l2_grads": 2.2038090229034424, "l2_params": 254.200927734375, "l2_updates": 0.18845082819461823, "train/loss": 4.064870357513428, "uptime": 15550.509504229, "examples_seen": 86272000.0, "progress": 0.74820386668206, "epoch": 67.33860613019223, "img/sec/core": 755.7840880157013, "core_hours_NVIDIA A100-SXM4-40GB": 33.67196306479551, "core_hours": 33.67196306479551} {"step": 84300, "global_schedule": 0.1763036549091339, "l2_grads": 2.1394588947296143, "l2_params": 254.13311767578125, "l2_updates": 0.18661311268806458, "train/loss": 1.977541208267212, "uptime": 15559.078985926999, "examples_seen": 86323200.0, "progress": 0.7486479045851354, "epoch": 67.3785696946612, "img/sec/core": 746.8362995038655, "core_hours_NVIDIA A100-SXM4-40GB": 33.69100635745773, "core_hours": 33.69100635745773} {"step": 84350, "global_schedule": 0.17572066187858582, "l2_grads": 2.0994865894317627, "l2_params": 254.0691680908203, "l2_updates": 0.18881307542324066, "train/loss": 2.0182576179504395, "uptime": 15567.928446598, "examples_seen": 86374400.0, "progress": 0.7490919424882108, "epoch": 67.41853325913016, "img/sec/core": 723.2079149153471, "core_hours_NVIDIA A100-SXM4-40GB": 33.71067182561551, "core_hours": 33.71067182561551} {"step": 84400, "global_schedule": 0.17513832449913025, "l2_grads": 2.282290458679199, "l2_params": 253.99884033203125, "l2_updates": 0.18603047728538513, "train/loss": 1.7856478691101074, "uptime": 15576.394046091, "examples_seen": 86425600.0, "progress": 0.7495359803912862, "epoch": 67.4584968235991, "img/sec/core": 756.0008012772257, "core_hours_NVIDIA A100-SXM4-40GB": 33.72948426893329, "core_hours": 33.72948426893329} {"step": 84450, "global_schedule": 0.17455682158470154, "l2_grads": 2.3418526649475098, "l2_params": 253.92881774902344, "l2_updates": 0.18338844180107117, "train/loss": 3.786175489425659, "uptime": 15585.835025161, "examples_seen": 86476800.0, "progress": 0.7499800182943616, "epoch": 67.49846038806807, "img/sec/core": 677.8957937038715, "core_hours_NVIDIA A100-SXM4-40GB": 33.75046422242218, "core_hours": 33.75046422242218} {"step": 84500, "global_schedule": 0.1739760935306549, "l2_grads": 2.286447048187256, "l2_params": 253.86166381835938, "l2_updates": 0.18668809533119202, "train/loss": 1.7406768798828125, "uptime": 15594.736263609999, "examples_seen": 86528000.0, "progress": 0.750424056197437, "epoch": 67.53842395253702, "img/sec/core": 719.0010734652896, "core_hours_NVIDIA A100-SXM4-40GB": 33.77024475230884, "core_hours": 33.77024475230884} {"step": 84550, "global_schedule": 0.17339614033699036, "l2_grads": 2.2701222896575928, "l2_params": 253.79554748535156, "l2_updates": 0.1846587210893631, "train/loss": 1.6061347723007202, "uptime": 15603.336363722, "examples_seen": 86579200.0, "progress": 0.7508680941005125, "epoch": 67.57838751700598, "img/sec/core": 744.1773835944423, "core_hours_NVIDIA A100-SXM4-40GB": 33.78935608589107, "core_hours": 33.78935608589107} {"step": 84600, "global_schedule": 0.17281687259674072, "l2_grads": 2.11116886138916, "l2_params": 253.72393798828125, "l2_updates": 0.18630734086036682, "train/loss": 2.4441635608673096, "uptime": 15612.076372897, "examples_seen": 86630400.0, "progress": 0.7513121320035878, "epoch": 67.61835108147494, "img/sec/core": 732.2646775140198, "core_hours_NVIDIA A100-SXM4-40GB": 33.80877832850218, "core_hours": 33.80877832850218} {"step": 84650, "global_schedule": 0.17223843932151794, "l2_grads": 2.311785936355591, "l2_params": 253.65640258789062, "l2_updates": 0.1828705221414566, "train/loss": 4.089112281799316, "uptime": 15621.294900056002, "examples_seen": 86681600.0, "progress": 0.7517561699066633, "epoch": 67.65831464594389, "img/sec/core": 694.2540700495787, "core_hours_NVIDIA A100-SXM4-40GB": 33.82926394441107, "core_hours": 33.82926394441107} {"step": 84700, "global_schedule": 0.17166069149971008, "l2_grads": 2.087998151779175, "l2_params": 253.58642578125, "l2_updates": 0.181162029504776, "train/loss": 3.616637706756592, "uptime": 15630.610179874, "examples_seen": 86732800.0, "progress": 0.7522002078097386, "epoch": 67.69827821041285, "img/sec/core": 687.0432370302537, "core_hours_NVIDIA A100-SXM4-40GB": 33.84996456622885, "core_hours": 33.84996456622885} {"step": 84750, "global_schedule": 0.17108389735221863, "l2_grads": 2.0228946208953857, "l2_params": 253.52125549316406, "l2_updates": 0.18524834513664246, "train/loss": 2.4466233253479004, "uptime": 15638.932105860002, "examples_seen": 86784000.0, "progress": 0.7526442457128141, "epoch": 67.7382417748818, "img/sec/core": 769.0527422096179, "core_hours_NVIDIA A100-SXM4-40GB": 33.86845773508663, "core_hours": 33.86845773508663} {"step": 84800, "global_schedule": 0.17050766944885254, "l2_grads": 2.249898910522461, "l2_params": 253.4552764892578, "l2_updates": 0.18066062033176422, "train/loss": 3.8711605072021484, "uptime": 15647.773897565, "examples_seen": 86835200.0, "progress": 0.7530882836158894, "epoch": 67.77820533935076, "img/sec/core": 723.8351924057888, "core_hours_NVIDIA A100-SXM4-40GB": 33.88810616109774, "core_hours": 33.88810616109774} {"step": 84850, "global_schedule": 0.16993233561515808, "l2_grads": 2.032879590988159, "l2_params": 253.39263916015625, "l2_updates": 0.17893530428409576, "train/loss": 2.415487051010132, "uptime": 15655.90410397, "examples_seen": 86886400.0, "progress": 0.7535323215189649, "epoch": 67.81816890381972, "img/sec/core": 787.1878868984624, "core_hours_NVIDIA A100-SXM4-40GB": 33.90617328644218, "core_hours": 33.90617328644218} {"step": 84900, "global_schedule": 0.16935774683952332, "l2_grads": 2.26422381401062, "l2_params": 253.32077026367188, "l2_updates": 0.17841418087482452, "train/loss": 4.0807342529296875, "uptime": 15664.371479612999, "examples_seen": 86937600.0, "progress": 0.7539763594220402, "epoch": 67.85813246828867, "img/sec/core": 755.8422195774582, "core_hours_NVIDIA A100-SXM4-40GB": 33.92498967675996, "core_hours": 33.92498967675996} {"step": 84950, "global_schedule": 0.16878387331962585, "l2_grads": 2.0177085399627686, "l2_params": 253.2591552734375, "l2_updates": 0.18186408281326294, "train/loss": 2.040383815765381, "uptime": 15673.346509500001, "examples_seen": 86988800.0, "progress": 0.7544203973251157, "epoch": 67.89809603275764, "img/sec/core": 713.0895473973429, "core_hours_NVIDIA A100-SXM4-40GB": 33.94493418761996, "core_hours": 33.94493418761996} {"step": 85000, "global_schedule": 0.1682109236717224, "l2_grads": 1.9527995586395264, "l2_params": 253.19241333007812, "l2_updates": 0.17919841408729553, "train/loss": 2.2878479957580566, "uptime": 15682.611573807999, "examples_seen": 87040000.0, "progress": 0.7548644352281911, "epoch": 67.9380595972266, "img/sec/core": 690.7669269467857, "core_hours_NVIDIA A100-SXM4-40GB": 33.96552321941551, "core_hours": 33.96552321941551, "val/acc@1": 0.73516, "val/loss": 1.072210301513672, "z/secs/eval/val": 2.5476229570012947} {"step": 85050, "global_schedule": 0.1676385998725891, "l2_grads": 2.355137348175049, "l2_params": 253.12510681152344, "l2_updates": 0.17699074745178223, "train/loss": 1.7360475063323975, "uptime": 15693.985993057, "examples_seen": 87091200.0, "progress": 0.7553084731312665, "epoch": 67.97802316169555, "img/sec/core": 783.0260362947398, "core_hours_NVIDIA A100-SXM4-40GB": 33.98368637308218, "core_hours": 33.98368637308218} {"step": 85100, "global_schedule": 0.16706714034080505, "l2_grads": 2.2942917346954346, "l2_params": 253.0614471435547, "l2_updates": 0.17606650292873383, "train/loss": 3.9732308387756348, "uptime": 15703.335830089001, "examples_seen": 87142400.0, "progress": 0.7557525110343419, "epoch": 68.01798672616451, "img/sec/core": 684.5039093296526, "core_hours_NVIDIA A100-SXM4-40GB": 34.00446378870885, "core_hours": 34.00446378870885} {"step": 85150, "global_schedule": 0.1664963662624359, "l2_grads": 2.1418113708496094, "l2_params": 252.99571228027344, "l2_updates": 0.1793563812971115, "train/loss": 3.8834519386291504, "uptime": 15711.855947205002, "examples_seen": 87193600.0, "progress": 0.7561965489374173, "epoch": 68.05795029063346, "img/sec/core": 751.1633834212115, "core_hours_NVIDIA A100-SXM4-40GB": 34.02339738229996, "core_hours": 34.02339738229996} {"step": 85200, "global_schedule": 0.16592645645141602, "l2_grads": 2.258849620819092, "l2_params": 252.9356231689453, "l2_updates": 0.17555303871631622, "train/loss": 4.0659661293029785, "uptime": 15720.300163432, "examples_seen": 87244800.0, "progress": 0.7566405868404927, "epoch": 68.09791385510242, "img/sec/core": 757.9152200694688, "core_hours_NVIDIA A100-SXM4-40GB": 34.042162307248844, "core_hours": 34.042162307248844} {"step": 85250, "global_schedule": 0.16535735130310059, "l2_grads": 2.3112194538116455, "l2_params": 252.86279296875, "l2_updates": 0.17534294724464417, "train/loss": 1.6906187534332275, "uptime": 15728.735481464, "examples_seen": 87296000.0, "progress": 0.7570846247435681, "epoch": 68.13787741957138, "img/sec/core": 758.7147248890343, "core_hours_NVIDIA A100-SXM4-40GB": 34.06090745843107, "core_hours": 34.06090745843107} {"step": 85300, "global_schedule": 0.16478899121284485, "l2_grads": 2.104485511779785, "l2_params": 252.79843139648438, "l2_updates": 0.17521460354328156, "train/loss": 2.8447654247283936, "uptime": 15737.59858334, "examples_seen": 87347200.0, "progress": 0.7575286626466435, "epoch": 68.17784098404033, "img/sec/core": 722.0948252136327, "core_hours_NVIDIA A100-SXM4-40GB": 34.08060324037773, "core_hours": 34.08060324037773} {"step": 85350, "global_schedule": 0.1642213761806488, "l2_grads": 2.267545461654663, "l2_params": 252.7330780029297, "l2_updates": 0.1718512773513794, "train/loss": 2.1559290885925293, "uptime": 15745.930857531, "examples_seen": 87398400.0, "progress": 0.7579727005497189, "epoch": 68.21780454850929, "img/sec/core": 768.0976229648966, "core_hours_NVIDIA A100-SXM4-40GB": 34.099119405246626, "core_hours": 34.099119405246626} {"step": 85400, "global_schedule": 0.16365459561347961, "l2_grads": 2.1997623443603516, "l2_params": 252.6611785888672, "l2_updates": 0.1726759523153305, "train/loss": 1.825182318687439, "uptime": 15755.043620725, "examples_seen": 87449600.0, "progress": 0.7584167384527943, "epoch": 68.25776811297824, "img/sec/core": 702.3116769032222, "core_hours_NVIDIA A100-SXM4-40GB": 34.11936999012218, "core_hours": 34.11936999012218} {"step": 85450, "global_schedule": 0.1630886197090149, "l2_grads": 2.0265424251556396, "l2_params": 252.60198974609375, "l2_updates": 0.1729053258895874, "train/loss": 2.767892360687256, "uptime": 15763.835524498, "examples_seen": 87500800.0, "progress": 0.7588607763558697, "epoch": 68.2977316774472, "img/sec/core": 727.9424531072816, "core_hours_NVIDIA A100-SXM4-40GB": 34.13890755406217, "core_hours": 34.13890755406217} {"step": 85500, "global_schedule": 0.16252344846725464, "l2_grads": 2.2857789993286133, "l2_params": 252.53651428222656, "l2_updates": 0.1739245057106018, "train/loss": 1.904533863067627, "uptime": 15772.213487521001, "examples_seen": 87552000.0, "progress": 0.7593048142589451, "epoch": 68.33769524191617, "img/sec/core": 763.9088382735297, "core_hours_NVIDIA A100-SXM4-40GB": 34.15752524966885, "core_hours": 34.15752524966885} {"step": 85550, "global_schedule": 0.16195905208587646, "l2_grads": 2.2167932987213135, "l2_params": 252.46937561035156, "l2_updates": 0.17269739508628845, "train/loss": 3.619671583175659, "uptime": 15780.660899954002, "examples_seen": 87603200.0, "progress": 0.7597488521620206, "epoch": 68.37765880638511, "img/sec/core": 757.6284514057354, "core_hours_NVIDIA A100-SXM4-40GB": 34.176297277297735, "core_hours": 34.176297277297735} {"step": 85600, "global_schedule": 0.1613953709602356, "l2_grads": 2.1113803386688232, "l2_params": 252.40496826171875, "l2_updates": 0.17166009545326233, "train/loss": 2.1690518856048584, "uptime": 15789.043956979001, "examples_seen": 87654400.0, "progress": 0.7601928900650959, "epoch": 68.41762237085408, "img/sec/core": 763.44464566022, "core_hours_NVIDIA A100-SXM4-40GB": 34.194926292908846, "core_hours": 34.194926292908846} {"step": 85650, "global_schedule": 0.16083255410194397, "l2_grads": 2.3194468021392822, "l2_params": 252.3383026123047, "l2_updates": 0.17292320728302002, "train/loss": 1.8440438508987427, "uptime": 15797.846166169, "examples_seen": 87705600.0, "progress": 0.7606369279681714, "epoch": 68.45758593532302, "img/sec/core": 727.0901954104964, "core_hours_NVIDIA A100-SXM4-40GB": 34.21448675777551, "core_hours": 34.21448675777551} {"step": 85700, "global_schedule": 0.1602705419063568, "l2_grads": 2.1497819423675537, "l2_params": 252.27728271484375, "l2_updates": 0.17313523590564728, "train/loss": 2.036966323852539, "uptime": 15806.815708258999, "examples_seen": 87756800.0, "progress": 0.7610809658712467, "epoch": 68.49754949979199, "img/sec/core": 713.5258339593574, "core_hours_NVIDIA A100-SXM4-40GB": 34.234419073531065, "core_hours": 34.234419073531065} {"step": 85750, "global_schedule": 0.15970930457115173, "l2_grads": 2.299396514892578, "l2_params": 252.21217346191406, "l2_updates": 0.17387673258781433, "train/loss": 1.6338564157485962, "uptime": 15815.941572323, "examples_seen": 87808000.0, "progress": 0.7615250037743222, "epoch": 68.53751306426095, "img/sec/core": 701.3034552252841, "core_hours_NVIDIA A100-SXM4-40GB": 34.25469877145107, "core_hours": 34.25469877145107} {"step": 85800, "global_schedule": 0.15914881229400635, "l2_grads": 2.4148919582366943, "l2_params": 252.14706420898438, "l2_updates": 0.1692522019147873, "train/loss": 1.7169251441955566, "uptime": 15824.887735360002, "examples_seen": 87859200.0, "progress": 0.7619690416773975, "epoch": 68.5774766287299, "img/sec/core": 715.3904946208593, "core_hours_NVIDIA A100-SXM4-40GB": 34.274579133755516, "core_hours": 34.274579133755516} {"step": 85850, "global_schedule": 0.1585891842842102, "l2_grads": 2.266728162765503, "l2_params": 252.0869140625, "l2_updates": 0.17042207717895508, "train/loss": 1.5316132307052612, "uptime": 15833.332008848001, "examples_seen": 87910400.0, "progress": 0.762413079580473, "epoch": 68.61744019319886, "img/sec/core": 757.9100806120663, "core_hours_NVIDIA A100-SXM4-40GB": 34.293344185951064, "core_hours": 34.293344185951064} {"step": 85900, "global_schedule": 0.15803027153015137, "l2_grads": 2.3618972301483154, "l2_params": 252.028076171875, "l2_updates": 0.16583068668842316, "train/loss": 4.064367294311523, "uptime": 15841.76029094, "examples_seen": 87961600.0, "progress": 0.7628571174835483, "epoch": 68.65740375766781, "img/sec/core": 759.3481008515752, "core_hours_NVIDIA A100-SXM4-40GB": 34.312073701711064, "core_hours": 34.312073701711064} {"step": 85950, "global_schedule": 0.15747234225273132, "l2_grads": 2.067064046859741, "l2_params": 251.96360778808594, "l2_updates": 0.16699713468551636, "train/loss": 2.3982856273651123, "uptime": 15850.058332454, "examples_seen": 88012800.0, "progress": 0.7633011553866238, "epoch": 68.69736732213677, "img/sec/core": 771.2663270244605, "core_hours_NVIDIA A100-SXM4-40GB": 34.3305137939644, "core_hours": 34.3305137939644} {"step": 86000, "global_schedule": 0.15691503882408142, "l2_grads": 2.13908314704895, "l2_params": 251.8968505859375, "l2_updates": 0.16652633249759674, "train/loss": 3.8972373008728027, "uptime": 15858.482583697, "examples_seen": 88064000.0, "progress": 0.7637451932896993, "epoch": 68.73733088660573, "img/sec/core": 759.7114349264709, "core_hours_NVIDIA A100-SXM4-40GB": 34.34923435228218, "core_hours": 34.34923435228218} {"step": 86050, "global_schedule": 0.15635862946510315, "l2_grads": 2.2342159748077393, "l2_params": 251.83792114257812, "l2_updates": 0.16657589375972748, "train/loss": 3.4500932693481445, "uptime": 15867.251159626, "examples_seen": 88115200.0, "progress": 0.7641892311927746, "epoch": 68.77729445107468, "img/sec/core": 796.3367636880095, "core_hours_NVIDIA A100-SXM4-40GB": 34.3670939097844, "core_hours": 34.3670939097844} {"step": 86100, "global_schedule": 0.15580302476882935, "l2_grads": 2.2442543506622314, "l2_params": 251.77235412597656, "l2_updates": 0.16725698113441467, "train/loss": 2.0798394680023193, "uptime": 15875.576035129, "examples_seen": 88166400.0, "progress": 0.76463326909585, "epoch": 68.81725801554364, "img/sec/core": 768.7802655659791, "core_hours_NVIDIA A100-SXM4-40GB": 34.3855936331244, "core_hours": 34.3855936331244} {"step": 86150, "global_schedule": 0.15524813532829285, "l2_grads": 2.3785533905029297, "l2_params": 251.705078125, "l2_updates": 0.16502994298934937, "train/loss": 1.7720705270767212, "uptime": 15884.669581785, "examples_seen": 88217600.0, "progress": 0.7650773069989254, "epoch": 68.85722158001259, "img/sec/core": 703.7958062025167, "core_hours_NVIDIA A100-SXM4-40GB": 34.40580151458218, "core_hours": 34.40580151458218} {"step": 86200, "global_schedule": 0.15469413995742798, "l2_grads": 2.0540783405303955, "l2_params": 251.63897705078125, "l2_updates": 0.16505204141139984, "train/loss": 2.7739973068237305, "uptime": 15893.180438936999, "examples_seen": 88268800.0, "progress": 0.7655213449020009, "epoch": 68.89718514448155, "img/sec/core": 751.9806625465923, "core_hours_NVIDIA A100-SXM4-40GB": 34.42471453047551, "core_hours": 34.42471453047551} {"step": 86250, "global_schedule": 0.15414097905158997, "l2_grads": 2.1841776371002197, "l2_params": 251.57501220703125, "l2_updates": 0.16591902077198029, "train/loss": 1.7252733707427979, "uptime": 15901.69251548, "examples_seen": 88320000.0, "progress": 0.7659653828050762, "epoch": 68.93714870895052, "img/sec/core": 751.8729381331749, "core_hours_NVIDIA A100-SXM4-40GB": 34.443630256126625, "core_hours": 34.443630256126625} {"step": 86300, "global_schedule": 0.15358859300613403, "l2_grads": 2.3092470169067383, "l2_params": 251.5105743408203, "l2_updates": 0.16387875378131866, "train/loss": 1.6696686744689941, "uptime": 15910.496200836, "examples_seen": 88371200.0, "progress": 0.7664094207081517, "epoch": 68.97711227341946, "img/sec/core": 726.9682798962963, "core_hours_NVIDIA A100-SXM4-40GB": 34.463194001362176, "core_hours": 34.463194001362176} {"step": 86350, "global_schedule": 0.1530369520187378, "l2_grads": 2.233856678009033, "l2_params": 251.44894409179688, "l2_updates": 0.1621888279914856, "train/loss": 2.291199207305908, "uptime": 15920.03284758, "examples_seen": 88422400.0, "progress": 0.766853458611227, "epoch": 69.01707583788843, "img/sec/core": 671.0954250273192, "core_hours_NVIDIA A100-SXM4-40GB": 34.48438654968218, "core_hours": 34.48438654968218} {"step": 86400, "global_schedule": 0.15248620510101318, "l2_grads": 2.356282949447632, "l2_params": 251.386962890625, "l2_updates": 0.15958279371261597, "train/loss": 4.015611171722412, "uptime": 15928.547139784, "examples_seen": 88473600.0, "progress": 0.7672974965143025, "epoch": 69.05703940235738, "img/sec/core": 751.6772794095162, "core_hours_NVIDIA A100-SXM4-40GB": 34.503307199024405, "core_hours": 34.503307199024405} {"step": 86450, "global_schedule": 0.15193626284599304, "l2_grads": 2.2178547382354736, "l2_params": 251.3253631591797, "l2_updates": 0.15965518355369568, "train/loss": 2.6199727058410645, "uptime": 15937.348624312, "examples_seen": 88524800.0, "progress": 0.7677415344173779, "epoch": 69.09700296682634, "img/sec/core": 727.1500597017293, "core_hours_NVIDIA A100-SXM4-40GB": 34.52286605353107, "core_hours": 34.52286605353107} {"step": 86500, "global_schedule": 0.15138715505599976, "l2_grads": 2.023953676223755, "l2_params": 251.26556396484375, "l2_updates": 0.1593758910894394, "train/loss": 2.640695571899414, "uptime": 15945.829935362, "examples_seen": 88576000.0, "progress": 0.7681855723204533, "epoch": 69.1369665312953, "img/sec/core": 754.600316185792, "core_hours_NVIDIA A100-SXM4-40GB": 34.54171341141996, "core_hours": 34.54171341141996} {"step": 86550, "global_schedule": 0.15083876252174377, "l2_grads": 2.3581509590148926, "l2_params": 251.2023162841797, "l2_updates": 0.1606076955795288, "train/loss": 1.7735594511032104, "uptime": 15954.87210659, "examples_seen": 88627200.0, "progress": 0.7686296102235287, "epoch": 69.17693009576425, "img/sec/core": 707.7946035993533, "core_hours_NVIDIA A100-SXM4-40GB": 34.56180712525996, "core_hours": 34.56180712525996} {"step": 86600, "global_schedule": 0.1502912938594818, "l2_grads": 2.397794246673584, "l2_params": 251.14013671875, "l2_updates": 0.15759357810020447, "train/loss": 4.046946048736572, "uptime": 15963.458470745, "examples_seen": 88678400.0, "progress": 0.7690736481266041, "epoch": 69.21689366023321, "img/sec/core": 745.3678745123116, "core_hours_NVIDIA A100-SXM4-40GB": 34.58088793449329, "core_hours": 34.58088793449329} {"step": 86650, "global_schedule": 0.14974462985992432, "l2_grads": 2.261512279510498, "l2_params": 251.07615661621094, "l2_updates": 0.16231022775173187, "train/loss": 1.590517282485962, "uptime": 15972.636174791, "examples_seen": 88729600.0, "progress": 0.7695176860296795, "epoch": 69.25685722470216, "img/sec/core": 697.3421640011662, "core_hours_NVIDIA A100-SXM4-40GB": 34.601282832373286, "core_hours": 34.601282832373286} {"step": 86700, "global_schedule": 0.1491987705230713, "l2_grads": 2.1547234058380127, "l2_params": 251.02040100097656, "l2_updates": 0.1593804657459259, "train/loss": 3.552238941192627, "uptime": 15981.917151503001, "examples_seen": 88780800.0, "progress": 0.7699617239327549, "epoch": 69.29682078917112, "img/sec/core": 689.582594440079, "core_hours_NVIDIA A100-SXM4-40GB": 34.62190722506662, "core_hours": 34.62190722506662} {"step": 86750, "global_schedule": 0.14865368604660034, "l2_grads": 2.413935422897339, "l2_params": 250.95938110351562, "l2_updates": 0.1560775190591812, "train/loss": 3.866565227508545, "uptime": 15990.866611327, "examples_seen": 88832000.0, "progress": 0.7704057618358303, "epoch": 69.33678435364008, "img/sec/core": 715.1269602706471, "core_hours_NVIDIA A100-SXM4-40GB": 34.6417949135644, "core_hours": 34.6417949135644} {"step": 86800, "global_schedule": 0.14810946583747864, "l2_grads": 2.4124879837036133, "l2_params": 250.8961639404297, "l2_updates": 0.15732787549495697, "train/loss": 4.122668743133545, "uptime": 15999.491482047999, "examples_seen": 88883200.0, "progress": 0.7708497997389057, "epoch": 69.37674791810903, "img/sec/core": 742.0401078496565, "core_hours_NVIDIA A100-SXM4-40GB": 34.6609612929444, "core_hours": 34.6609612929444} {"step": 86850, "global_schedule": 0.14756610989570618, "l2_grads": 2.2259879112243652, "l2_params": 250.8372344970703, "l2_updates": 0.15735003352165222, "train/loss": 1.709049105644226, "uptime": 16007.930180495, "examples_seen": 88934400.0, "progress": 0.7712938376419811, "epoch": 69.416711482578, "img/sec/core": 758.4107952423725, "core_hours_NVIDIA A100-SXM4-40GB": 34.67971395615996, "core_hours": 34.67971395615996} {"step": 86900, "global_schedule": 0.14702355861663818, "l2_grads": 2.2915258407592773, "l2_params": 250.77320861816406, "l2_updates": 0.15556266903877258, "train/loss": 3.8723104000091553, "uptime": 16016.407740427001, "examples_seen": 88985600.0, "progress": 0.7717378755450566, "epoch": 69.45667504704696, "img/sec/core": 754.9342088211815, "core_hours_NVIDIA A100-SXM4-40GB": 34.69855297823107, "core_hours": 34.69855297823107} {"step": 86950, "global_schedule": 0.14648184180259705, "l2_grads": 2.3403165340423584, "l2_params": 250.7152557373047, "l2_updates": 0.15639284253120422, "train/loss": 1.8112373352050781, "uptime": 16025.350597163002, "examples_seen": 89036800.0, "progress": 0.7721819134481319, "epoch": 69.4966386115159, "img/sec/core": 715.6549846354714, "core_hours_NVIDIA A100-SXM4-40GB": 34.718425993199965, "core_hours": 34.718425993199965} {"step": 87000, "global_schedule": 0.1459408700466156, "l2_grads": 2.252797842025757, "l2_params": 250.65118408203125, "l2_updates": 0.15599054098129272, "train/loss": 1.7500399351119995, "uptime": 16034.5388621, "examples_seen": 89088000.0, "progress": 0.7726259513512074, "epoch": 69.53660217598487, "img/sec/core": 696.5406465620373, "core_hours_NVIDIA A100-SXM4-40GB": 34.73884435972663, "core_hours": 34.73884435972663} {"step": 87050, "global_schedule": 0.14540082216262817, "l2_grads": 2.3052332401275635, "l2_params": 250.59034729003906, "l2_updates": 0.15292812883853912, "train/loss": 2.1546876430511475, "uptime": 16043.824737879002, "examples_seen": 89139200.0, "progress": 0.7730699892542827, "epoch": 69.57656574045382, "img/sec/core": 767.6559347982553, "core_hours_NVIDIA A100-SXM4-40GB": 34.75737117828885, "core_hours": 34.75737117828885} {"step": 87100, "global_schedule": 0.14486148953437805, "l2_grads": 2.2800984382629395, "l2_params": 250.52789306640625, "l2_updates": 0.15407401323318481, "train/loss": 1.949615240097046, "uptime": 16052.290722300002, "examples_seen": 89190400.0, "progress": 0.7735140271573582, "epoch": 69.61652930492278, "img/sec/core": 755.9664277345801, "core_hours_NVIDIA A100-SXM4-40GB": 34.77618447700218, "core_hours": 34.77618447700218} {"step": 87150, "global_schedule": 0.1443231999874115, "l2_grads": 2.222395181655884, "l2_params": 250.46804809570312, "l2_updates": 0.1560666412115097, "train/loss": 1.757170557975769, "uptime": 16061.210719457, "examples_seen": 89241600.0, "progress": 0.7739580650604335, "epoch": 69.65649286939174, "img/sec/core": 717.4890179173565, "core_hours_NVIDIA A100-SXM4-40GB": 34.79600669290662, "core_hours": 34.79600669290662} {"step": 87200, "global_schedule": 0.1437855362892151, "l2_grads": 2.259192943572998, "l2_params": 250.41238403320312, "l2_updates": 0.1543309986591339, "train/loss": 2.070828676223755, "uptime": 16069.73524611, "examples_seen": 89292800.0, "progress": 0.774402102963509, "epoch": 69.69645643386069, "img/sec/core": 750.7748242827801, "core_hours_NVIDIA A100-SXM4-40GB": 34.814950085468844, "core_hours": 34.814950085468844} {"step": 87250, "global_schedule": 0.14324882626533508, "l2_grads": 2.4042062759399414, "l2_params": 250.35450744628906, "l2_updates": 0.1519625335931778, "train/loss": 1.667283296585083, "uptime": 16078.211395655, "examples_seen": 89344000.0, "progress": 0.7748461408665843, "epoch": 69.73641999832965, "img/sec/core": 755.0598259294668, "core_hours_NVIDIA A100-SXM4-40GB": 34.83378597334662, "core_hours": 34.83378597334662} {"step": 87300, "global_schedule": 0.14271283149719238, "l2_grads": 2.1528804302215576, "l2_params": 250.28662109375, "l2_updates": 0.15272830426692963, "train/loss": 2.642775774002075, "uptime": 16086.681592173, "examples_seen": 89395200.0, "progress": 0.7752901787696598, "epoch": 69.7763835627986, "img/sec/core": 755.5904973869157, "core_hours_NVIDIA A100-SXM4-40GB": 34.85260863227551, "core_hours": 34.85260863227551} {"step": 87350, "global_schedule": 0.1421777904033661, "l2_grads": 2.091722011566162, "l2_params": 250.2298583984375, "l2_updates": 0.15024393796920776, "train/loss": 2.4103078842163086, "uptime": 16095.652483404001, "examples_seen": 89446400.0, "progress": 0.7757342166727352, "epoch": 69.81634712726756, "img/sec/core": 713.4185261195557, "core_hours_NVIDIA A100-SXM4-40GB": 34.87254394612218, "core_hours": 34.87254394612218} {"step": 87400, "global_schedule": 0.14164355397224426, "l2_grads": 2.253443479537964, "l2_params": 250.1703643798828, "l2_updates": 0.15303954482078552, "train/loss": 1.974982738494873, "uptime": 16103.994357960999, "examples_seen": 89497600.0, "progress": 0.7761782545758106, "epoch": 69.85631069173652, "img/sec/core": 767.2136467973002, "core_hours_NVIDIA A100-SXM4-40GB": 34.89108144513773, "core_hours": 34.89108144513773} {"step": 87450, "global_schedule": 0.14111018180847168, "l2_grads": 2.34836483001709, "l2_params": 250.11219787597656, "l2_updates": 0.147905632853508, "train/loss": 3.1437249183654785, "uptime": 16112.32096747, "examples_seen": 89548800.0, "progress": 0.776622292478886, "epoch": 69.89627425620547, "img/sec/core": 768.6201680386496, "core_hours_NVIDIA A100-SXM4-40GB": 34.909585021824405, "core_hours": 34.909585021824405} {"step": 87500, "global_schedule": 0.14057764410972595, "l2_grads": 2.2498161792755127, "l2_params": 250.05271911621094, "l2_updates": 0.1518746018409729, "train/loss": 2.0960421562194824, "uptime": 16120.750335244002, "examples_seen": 89600000.0, "progress": 0.7770663303819614, "epoch": 69.93623782067444, "img/sec/core": 759.2502986687379, "core_hours_NVIDIA A100-SXM4-40GB": 34.92831695021107, "core_hours": 34.92831695021107, "val/acc@1": 0.74108, "val/loss": 1.0298700146484374, "z/secs/eval/val": 2.6187502869979653} {"step": 87550, "global_schedule": 0.1400458812713623, "l2_grads": 2.0738685131073, "l2_params": 249.99273681640625, "l2_updates": 0.150785893201828, "train/loss": 2.25579833984375, "uptime": 16131.585756976, "examples_seen": 89651200.0, "progress": 0.7775103682850368, "epoch": 69.97620138514338, "img/sec/core": 779.0090808159055, "core_hours_NVIDIA A100-SXM4-40GB": 34.94657376206662, "core_hours": 34.94657376206662} {"step": 87600, "global_schedule": 0.13951504230499268, "l2_grads": 2.3261184692382812, "l2_params": 249.93385314941406, "l2_updates": 0.1488313227891922, "train/loss": 1.6426899433135986, "uptime": 16140.990246029001, "examples_seen": 89702400.0, "progress": 0.7779544061881122, "epoch": 70.01616494961235, "img/sec/core": 680.5260725947613, "core_hours_NVIDIA A100-SXM4-40GB": 34.96747262662885, "core_hours": 34.96747262662885} {"step": 87650, "global_schedule": 0.1389850378036499, "l2_grads": 2.1684980392456055, "l2_params": 249.8775634765625, "l2_updates": 0.14956985414028168, "train/loss": 1.9234272241592407, "uptime": 16149.385770192, "examples_seen": 89753600.0, "progress": 0.7783984440911876, "epoch": 70.05612851408131, "img/sec/core": 762.3109499471287, "core_hours_NVIDIA A100-SXM4-40GB": 34.98612934699107, "core_hours": 34.98612934699107} {"step": 87700, "global_schedule": 0.13845586776733398, "l2_grads": 2.3901431560516357, "l2_params": 249.81838989257812, "l2_updates": 0.14520220458507538, "train/loss": 4.011021614074707, "uptime": 16157.843873756, "examples_seen": 89804800.0, "progress": 0.778842481994263, "epoch": 70.09609207855026, "img/sec/core": 756.670801152151, "core_hours_NVIDIA A100-SXM4-40GB": 35.00492513268885, "core_hours": 35.00492513268885} {"step": 87750, "global_schedule": 0.13792747259140015, "l2_grads": 2.3283793926239014, "l2_params": 249.76123046875, "l2_updates": 0.14768856763839722, "train/loss": 1.639061689376831, "uptime": 16166.187157131002, "examples_seen": 89856000.0, "progress": 0.7792865198973384, "epoch": 70.13605564301922, "img/sec/core": 767.0840977517541, "core_hours_NVIDIA A100-SXM4-40GB": 35.02346576241108, "core_hours": 35.02346576241108} {"step": 87800, "global_schedule": 0.13740003108978271, "l2_grads": 2.395209789276123, "l2_params": 249.70144653320312, "l2_updates": 0.14584262669086456, "train/loss": 1.6931291818618774, "uptime": 16174.623238537, "examples_seen": 89907200.0, "progress": 0.7797305578004139, "epoch": 70.17601920748817, "img/sec/core": 758.646069423825, "core_hours_NVIDIA A100-SXM4-40GB": 35.04221260997996, "core_hours": 35.04221260997996} {"step": 87850, "global_schedule": 0.13687333464622498, "l2_grads": 2.3247265815734863, "l2_params": 249.6392059326172, "l2_updates": 0.14616064727306366, "train/loss": 1.6694574356079102, "uptime": 16183.010052176001, "examples_seen": 89958400.0, "progress": 0.7801745957034892, "epoch": 70.21598277195713, "img/sec/core": 763.102684223028, "core_hours_NVIDIA A100-SXM4-40GB": 35.06084997362218, "core_hours": 35.06084997362218} {"step": 87900, "global_schedule": 0.13634765148162842, "l2_grads": 2.3407857418060303, "l2_params": 249.57656860351562, "l2_updates": 0.14702577888965607, "train/loss": 1.8421353101730347, "uptime": 16191.449495152001, "examples_seen": 90009600.0, "progress": 0.7806186336065647, "epoch": 70.25594633642609, "img/sec/core": 758.3438881215966, "core_hours_NVIDIA A100-SXM4-40GB": 35.07960429134663, "core_hours": 35.07960429134663} {"step": 87950, "global_schedule": 0.13582265377044678, "l2_grads": 2.1876559257507324, "l2_params": 249.5266876220703, "l2_updates": 0.14551453292369843, "train/loss": 3.1201114654541016, "uptime": 16199.892735651001, "examples_seen": 90060800.0, "progress": 0.78106267150964, "epoch": 70.29590990089504, "img/sec/core": 758.0028071873378, "core_hours_NVIDIA A100-SXM4-40GB": 35.09836704801107, "core_hours": 35.09836704801107} {"step": 88000, "global_schedule": 0.13529860973358154, "l2_grads": 2.4440765380859375, "l2_params": 249.46856689453125, "l2_updates": 0.1431865394115448, "train/loss": 4.049307346343994, "uptime": 16208.404857119001, "examples_seen": 90112000.0, "progress": 0.7815067094127155, "epoch": 70.335873465364, "img/sec/core": 751.868969922435, "core_hours_NVIDIA A100-SXM4-40GB": 35.11728287349551, "core_hours": 35.11728287349551} {"step": 88050, "global_schedule": 0.13477540016174316, "l2_grads": 2.3419885635375977, "l2_params": 249.40956115722656, "l2_updates": 0.14244776964187622, "train/loss": 1.7242231369018555, "uptime": 16217.657686189, "examples_seen": 90163200.0, "progress": 0.7819507473157908, "epoch": 70.37583702983295, "img/sec/core": 771.4886197871344, "core_hours_NVIDIA A100-SXM4-40GB": 35.13571765251552, "core_hours": 35.13571765251552} {"step": 88100, "global_schedule": 0.13425305485725403, "l2_grads": 2.1580111980438232, "l2_params": 249.3513641357422, "l2_updates": 0.14174306392669678, "train/loss": 2.4526526927948, "uptime": 16226.706360618, "examples_seen": 90214400.0, "progress": 0.7823947852188663, "epoch": 70.41580059430191, "img/sec/core": 707.2859179781361, "core_hours_NVIDIA A100-SXM4-40GB": 35.155825817913296, "core_hours": 35.155825817913296} {"step": 88150, "global_schedule": 0.13373157382011414, "l2_grads": 2.2769174575805664, "l2_params": 249.29373168945312, "l2_updates": 0.14454025030136108, "train/loss": 1.7992154359817505, "uptime": 16235.146466016, "examples_seen": 90265600.0, "progress": 0.7828388231219416, "epoch": 70.45576415877088, "img/sec/core": 758.2843694720398, "core_hours_NVIDIA A100-SXM4-40GB": 35.174581607686626, "core_hours": 35.174581607686626} {"step": 88200, "global_schedule": 0.13321086764335632, "l2_grads": 2.373474597930908, "l2_params": 249.2355194091797, "l2_updates": 0.14085660874843597, "train/loss": 3.857510566711426, "uptime": 16243.894757777, "examples_seen": 90316800.0, "progress": 0.7832828610250171, "epoch": 70.49572772323982, "img/sec/core": 731.5713941470955, "core_hours_NVIDIA A100-SXM4-40GB": 35.194022256044406, "core_hours": 35.194022256044406} {"step": 88250, "global_schedule": 0.13269108533859253, "l2_grads": 2.2591159343719482, "l2_params": 249.17745971679688, "l2_updates": 0.14197929203510284, "train/loss": 2.1129696369171143, "uptime": 16252.907484244, "examples_seen": 90368000.0, "progress": 0.7837268989280926, "epoch": 70.53569128770879, "img/sec/core": 710.1069829904291, "core_hours_NVIDIA A100-SXM4-40GB": 35.21405053708218, "core_hours": 35.21405053708218} {"step": 88300, "global_schedule": 0.1321721076965332, "l2_grads": 2.453946352005005, "l2_params": 249.11988830566406, "l2_updates": 0.13925839960575104, "train/loss": 3.922086000442505, "uptime": 16261.431463374001, "examples_seen": 90419200.0, "progress": 0.7841709368311679, "epoch": 70.57565485217773, "img/sec/core": 750.8230490000373, "core_hours_NVIDIA A100-SXM4-40GB": 35.23299271292663, "core_hours": 35.23299271292663} {"step": 88350, "global_schedule": 0.13165414333343506, "l2_grads": 2.3893826007843018, "l2_params": 249.0625, "l2_updates": 0.14071820676326752, "train/loss": 1.7361615896224976, "uptime": 16269.883151121, "examples_seen": 90470400.0, "progress": 0.7846149747342434, "epoch": 70.6156184166467, "img/sec/core": 757.2452025660104, "core_hours_NVIDIA A100-SXM4-40GB": 35.251774241253294, "core_hours": 35.251774241253294} {"step": 88400, "global_schedule": 0.13113686442375183, "l2_grads": 2.3990089893341064, "l2_params": 249.0056610107422, "l2_updates": 0.1398242712020874, "train/loss": 1.8995264768600464, "uptime": 16278.587042215002, "examples_seen": 90521600.0, "progress": 0.7850590126373187, "epoch": 70.65558198111566, "img/sec/core": 735.3033178930506, "core_hours_NVIDIA A100-SXM4-40GB": 35.27111622146219, "core_hours": 35.27111622146219} {"step": 88450, "global_schedule": 0.1306205689907074, "l2_grads": 2.429960250854492, "l2_params": 248.94912719726562, "l2_updates": 0.1390843540430069, "train/loss": 3.9973387718200684, "uptime": 16287.924090456001, "examples_seen": 90572800.0, "progress": 0.7855030505403942, "epoch": 70.69554554558461, "img/sec/core": 685.4414623132706, "core_hours_NVIDIA A100-SXM4-40GB": 35.2918652175533, "core_hours": 35.2918652175533} {"step": 88500, "global_schedule": 0.13010501861572266, "l2_grads": 2.317612648010254, "l2_params": 248.89291381835938, "l2_updates": 0.13701629638671875, "train/loss": 1.630165696144104, "uptime": 16297.169308613002, "examples_seen": 90624000.0, "progress": 0.7859470884434695, "epoch": 70.73550911005357, "img/sec/core": 692.2497545559605, "core_hours_NVIDIA A100-SXM4-40GB": 35.31241014679107, "core_hours": 35.31241014679107} {"step": 88550, "global_schedule": 0.1295904517173767, "l2_grads": 2.2256855964660645, "l2_params": 248.84181213378906, "l2_updates": 0.14019393920898438, "train/loss": 3.7295498847961426, "uptime": 16306.363763283001, "examples_seen": 90675200.0, "progress": 0.786391126346545, "epoch": 70.77547267452252, "img/sec/core": 696.0717334201854, "core_hours_NVIDIA A100-SXM4-40GB": 35.33284226827996, "core_hours": 35.33284226827996} {"step": 88600, "global_schedule": 0.12907671928405762, "l2_grads": 2.3674726486206055, "l2_params": 248.78439331054688, "l2_updates": 0.13692381978034973, "train/loss": 1.8844984769821167, "uptime": 16315.0859387, "examples_seen": 90726400.0, "progress": 0.7868351642496203, "epoch": 70.81543623899148, "img/sec/core": 733.7618992994611, "core_hours_NVIDIA A100-SXM4-40GB": 35.35222488031774, "core_hours": 35.35222488031774} {"step": 88650, "global_schedule": 0.12856388092041016, "l2_grads": 2.2220661640167236, "l2_params": 248.72824096679688, "l2_updates": 0.13630899786949158, "train/loss": 1.7192140817642212, "uptime": 16323.870161470002, "examples_seen": 90777600.0, "progress": 0.7872792021526958, "epoch": 70.85539980346044, "img/sec/core": 728.578972502365, "core_hours_NVIDIA A100-SXM4-40GB": 35.37174537536219, "core_hours": 35.37174537536219} {"step": 88700, "global_schedule": 0.12805190682411194, "l2_grads": 2.2908475399017334, "l2_params": 248.67103576660156, "l2_updates": 0.13653801381587982, "train/loss": 1.715866208076477, "uptime": 16332.784105531, "examples_seen": 90828800.0, "progress": 0.7877232400557712, "epoch": 70.89536336792939, "img/sec/core": 717.9762354581724, "core_hours_NVIDIA A100-SXM4-40GB": 35.39155413994218, "core_hours": 35.39155413994218} {"step": 88750, "global_schedule": 0.1275407075881958, "l2_grads": 2.473921537399292, "l2_params": 248.61386108398438, "l2_updates": 0.13500644266605377, "train/loss": 3.9733307361602783, "uptime": 16341.499864911, "examples_seen": 90880000.0, "progress": 0.7881672779588466, "epoch": 70.93532693239835, "img/sec/core": 734.302052290001, "core_hours_NVIDIA A100-SXM4-40GB": 35.410922494119966, "core_hours": 35.410922494119966} {"step": 88800, "global_schedule": 0.12703049182891846, "l2_grads": 2.4692416191101074, "l2_params": 248.5574188232422, "l2_updates": 0.1334095448255539, "train/loss": 4.047794818878174, "uptime": 16350.069657401002, "examples_seen": 90931200.0, "progress": 0.788611315861922, "epoch": 70.9752904968673, "img/sec/core": 746.8092147466853, "core_hours_NVIDIA A100-SXM4-40GB": 35.42996647743108, "core_hours": 35.42996647743108} {"step": 88850, "global_schedule": 0.12652111053466797, "l2_grads": 2.391335964202881, "l2_params": 248.50411987304688, "l2_updates": 0.1356796771287918, "train/loss": 1.5595238208770752, "uptime": 16359.360135998, "examples_seen": 90982400.0, "progress": 0.7890553537649974, "epoch": 71.01525406133626, "img/sec/core": 688.8773202779465, "core_hours_NVIDIA A100-SXM4-40GB": 35.45061198542441, "core_hours": 35.45061198542441} {"step": 88900, "global_schedule": 0.1260126531124115, "l2_grads": 2.223928451538086, "l2_params": 248.44387817382812, "l2_updates": 0.13453978300094604, "train/loss": 2.255359411239624, "uptime": 16368.049720714002, "examples_seen": 91033600.0, "progress": 0.7894993916680728, "epoch": 71.05521762580523, "img/sec/core": 736.5139082210508, "core_hours_NVIDIA A100-SXM4-40GB": 35.46992217368219, "core_hours": 35.46992217368219} {"step": 88950, "global_schedule": 0.12550494074821472, "l2_grads": 2.320315361022949, "l2_params": 248.38662719726562, "l2_updates": 0.13225559890270233, "train/loss": 1.9155274629592896, "uptime": 16376.673919241, "examples_seen": 91084800.0, "progress": 0.7899434295711482, "epoch": 71.09518119027418, "img/sec/core": 742.0979445178741, "core_hours_NVIDIA A100-SXM4-40GB": 35.48908705929774, "core_hours": 35.48908705929774} {"step": 89000, "global_schedule": 0.12499821186065674, "l2_grads": 2.477222442626953, "l2_params": 248.33154296875, "l2_updates": 0.13285478949546814, "train/loss": 4.021133899688721, "uptime": 16385.60398387, "examples_seen": 91136000.0, "progress": 0.7903874674742236, "epoch": 71.13514475474314, "img/sec/core": 716.6801435251334, "core_hours_NVIDIA A100-SXM4-40GB": 35.50893164736218, "core_hours": 35.50893164736218} {"step": 89050, "global_schedule": 0.12449228763580322, "l2_grads": 2.171626329421997, "l2_params": 248.27838134765625, "l2_updates": 0.13132546842098236, "train/loss": 3.0767297744750977, "uptime": 16394.814095324, "examples_seen": 91187200.0, "progress": 0.790831505377299, "epoch": 71.1751083192121, "img/sec/core": 750.541509131561, "core_hours_NVIDIA A100-SXM4-40GB": 35.527880928713294, "core_hours": 35.527880928713294} {"step": 89100, "global_schedule": 0.12398740649223328, "l2_grads": 2.3733510971069336, "l2_params": 248.2232666015625, "l2_updates": 0.132469043135643, "train/loss": 1.554516315460205, "uptime": 16403.820832589, "examples_seen": 91238400.0, "progress": 0.7912755432803744, "epoch": 71.21507188368105, "img/sec/core": 710.5791821942171, "core_hours_NVIDIA A100-SXM4-40GB": 35.547895900413295, "core_hours": 35.547895900413295} {"step": 89150, "global_schedule": 0.12348324060440063, "l2_grads": 2.37580943107605, "l2_params": 248.1685028076172, "l2_updates": 0.1324198842048645, "train/loss": 1.6618531942367554, "uptime": 16412.832265222998, "examples_seen": 91289600.0, "progress": 0.7917195811834499, "epoch": 71.25503544815001, "img/sec/core": 710.2089379054247, "core_hours_NVIDIA A100-SXM4-40GB": 35.567921306266626, "core_hours": 35.567921306266626} {"step": 89200, "global_schedule": 0.1229800283908844, "l2_grads": 2.1538498401641846, "l2_params": 248.1156005859375, "l2_updates": 0.13078434765338898, "train/loss": 3.0713071823120117, "uptime": 16421.288408583998, "examples_seen": 91340800.0, "progress": 0.7921636190865252, "epoch": 71.29499901261896, "img/sec/core": 756.846203615377, "core_hours_NVIDIA A100-SXM4-40GB": 35.58671273595773, "core_hours": 35.58671273595773} {"step": 89250, "global_schedule": 0.1224777102470398, "l2_grads": 2.419577121734619, "l2_params": 248.0619354248047, "l2_updates": 0.13069678843021393, "train/loss": 1.5804004669189453, "uptime": 16430.191611873, "examples_seen": 91392000.0, "progress": 0.7926076569896007, "epoch": 71.33496257708792, "img/sec/core": 718.8423977587171, "core_hours_NVIDIA A100-SXM4-40GB": 35.60649763215552, "core_hours": 35.60649763215552} {"step": 89300, "global_schedule": 0.12197625637054443, "l2_grads": 2.4054856300354004, "l2_params": 248.00669860839844, "l2_updates": 0.129476398229599, "train/loss": 1.6566280126571655, "uptime": 16439.528372095003, "examples_seen": 91443200.0, "progress": 0.793051694892676, "epoch": 71.37492614155688, "img/sec/core": 685.4626067102711, "core_hours_NVIDIA A100-SXM4-40GB": 35.62724598820441, "core_hours": 35.62724598820441} {"step": 89350, "global_schedule": 0.12147563695907593, "l2_grads": 2.261725425720215, "l2_params": 247.95411682128906, "l2_updates": 0.1275402158498764, "train/loss": 2.505121946334839, "uptime": 16448.757713161, "examples_seen": 91494400.0, "progress": 0.7934957327957515, "epoch": 71.41488970602583, "img/sec/core": 693.4406209754187, "core_hours_NVIDIA A100-SXM4-40GB": 35.64775563501773, "core_hours": 35.64775563501773} {"step": 89400, "global_schedule": 0.12097597122192383, "l2_grads": 2.474186658859253, "l2_params": 247.89956665039062, "l2_updates": 0.12685583531856537, "train/loss": 1.6976675987243652, "uptime": 16457.259323457, "examples_seen": 91545600.0, "progress": 0.7939397706988268, "epoch": 71.4548532704948, "img/sec/core": 752.7985613515248, "core_hours_NVIDIA A100-SXM4-40GB": 35.66664810234218, "core_hours": 35.66664810234218} {"step": 89450, "global_schedule": 0.12047719955444336, "l2_grads": 2.418856382369995, "l2_params": 247.84390258789062, "l2_updates": 0.1275988072156906, "train/loss": 1.530436635017395, "uptime": 16465.691708792, "examples_seen": 91596800.0, "progress": 0.7943838086019023, "epoch": 71.49481683496374, "img/sec/core": 758.9785980766285, "core_hours_NVIDIA A100-SXM4-40GB": 35.68538673641995, "core_hours": 35.68538673641995} {"step": 89500, "global_schedule": 0.11997923254966736, "l2_grads": 2.3794937133789062, "l2_params": 247.7908935546875, "l2_updates": 0.12922121584415436, "train/loss": 1.6386909484863281, "uptime": 16474.322835228, "examples_seen": 91648000.0, "progress": 0.7948278465049776, "epoch": 71.5347803994327, "img/sec/core": 741.5022879638427, "core_hours_NVIDIA A100-SXM4-40GB": 35.70456701738885, "core_hours": 35.70456701738885} {"step": 89550, "global_schedule": 0.11948230862617493, "l2_grads": 2.362593412399292, "l2_params": 247.7374267578125, "l2_updates": 0.12750941514968872, "train/loss": 3.7090907096862793, "uptime": 16483.05904657, "examples_seen": 91699200.0, "progress": 0.7952718844080531, "epoch": 71.57474396390167, "img/sec/core": 732.583009894983, "core_hours_NVIDIA A100-SXM4-40GB": 35.72398082037106, "core_hours": 35.72398082037106} {"step": 89600, "global_schedule": 0.11898612976074219, "l2_grads": 2.2559432983398438, "l2_params": 247.68524169921875, "l2_updates": 0.12745212018489838, "train/loss": 1.3898801803588867, "uptime": 16491.244871711002, "examples_seen": 91750400.0, "progress": 0.7957159223111285, "epoch": 71.61470752837062, "img/sec/core": 781.8393246569125, "core_hours_NVIDIA A100-SXM4-40GB": 35.742171542906625, "core_hours": 35.742171542906625} {"step": 89650, "global_schedule": 0.11849093437194824, "l2_grads": 2.298790216445923, "l2_params": 247.62982177734375, "l2_updates": 0.12537163496017456, "train/loss": 2.8813538551330566, "uptime": 16500.035355023, "examples_seen": 91801600.0, "progress": 0.7961599602142039, "epoch": 71.65467109283958, "img/sec/core": 728.0600818913495, "core_hours_NVIDIA A100-SXM4-40GB": 35.76170595026663, "core_hours": 35.76170595026663} {"step": 89700, "global_schedule": 0.11799651384353638, "l2_grads": 2.489556074142456, "l2_params": 247.57838439941406, "l2_updates": 0.12326446175575256, "train/loss": 1.7975218296051025, "uptime": 16509.303595888, "examples_seen": 91852800.0, "progress": 0.7966039981172793, "epoch": 71.69463465730853, "img/sec/core": 690.53017646193, "core_hours_NVIDIA A100-SXM4-40GB": 35.78230204107774, "core_hours": 35.78230204107774} {"step": 89750, "global_schedule": 0.1175031065940857, "l2_grads": 2.4879982471466064, "l2_params": 247.5260467529297, "l2_updates": 0.12529762089252472, "train/loss": 1.6887141466140747, "uptime": 16518.036035570003, "examples_seen": 91904000.0, "progress": 0.7970480360203547, "epoch": 71.73459822177749, "img/sec/core": 732.8994225052471, "core_hours_NVIDIA A100-SXM4-40GB": 35.80170746259329, "core_hours": 35.80170746259329} {"step": 89800, "global_schedule": 0.11701059341430664, "l2_grads": 2.307891845703125, "l2_params": 247.47134399414062, "l2_updates": 0.12386492639780045, "train/loss": 3.0692384243011475, "uptime": 16526.660437156002, "examples_seen": 91955200.0, "progress": 0.7974920739234301, "epoch": 71.77456178624645, "img/sec/core": 742.0804720398978, "core_hours_NVIDIA A100-SXM4-40GB": 35.820872799451074, "core_hours": 35.820872799451074} {"step": 89850, "global_schedule": 0.11651894450187683, "l2_grads": 2.2518551349639893, "l2_params": 247.4190673828125, "l2_updates": 0.12535671889781952, "train/loss": 2.0832183361053467, "uptime": 16535.093343119, "examples_seen": 92006400.0, "progress": 0.7979361118265055, "epoch": 71.8145253507154, "img/sec/core": 758.9317405032762, "core_hours_NVIDIA A100-SXM4-40GB": 35.83961259047996, "core_hours": 35.83961259047996} {"step": 89900, "global_schedule": 0.11602815985679626, "l2_grads": 2.441244602203369, "l2_params": 247.36570739746094, "l2_updates": 0.12258270382881165, "train/loss": 1.7154027223587036, "uptime": 16544.16902858, "examples_seen": 92057600.0, "progress": 0.7983801497295809, "epoch": 71.85448891518436, "img/sec/core": 705.1808954267387, "core_hours_NVIDIA A100-SXM4-40GB": 35.859780780393294, "core_hours": 35.859780780393294} {"step": 89950, "global_schedule": 0.1155383288860321, "l2_grads": 2.512528657913208, "l2_params": 247.3116912841797, "l2_updates": 0.12169557809829712, "train/loss": 3.9588918685913086, "uptime": 16553.035312157997, "examples_seen": 92108800.0, "progress": 0.7988241876326563, "epoch": 71.89445247965331, "img/sec/core": 721.8356985425054, "core_hours_NVIDIA A100-SXM4-40GB": 35.87948363278885, "core_hours": 35.87948363278885} {"step": 90000, "global_schedule": 0.11504939198493958, "l2_grads": 2.4326059818267822, "l2_params": 247.25741577148438, "l2_updates": 0.12142833322286606, "train/loss": 1.6137664318084717, "uptime": 16561.574194859, "examples_seen": 92160000.0, "progress": 0.7992682255357317, "epoch": 71.93441604412227, "img/sec/core": 749.5125795847191, "core_hours_NVIDIA A100-SXM4-40GB": 35.89845892767996, "core_hours": 35.89845892767996, "val/acc@1": 0.74454, "val/loss": 1.0246201013183593, "z/secs/eval/val": 5.9087017249985365} {"step": 90050, "global_schedule": 0.11456134915351868, "l2_grads": 2.185931444168091, "l2_params": 247.2086944580078, "l2_updates": 0.12268241494894028, "train/loss": 2.831557273864746, "uptime": 16576.750720785, "examples_seen": 92211200.0, "progress": 0.7997122634388072, "epoch": 71.97437960859124, "img/sec/core": 743.0791016198958, "core_hours_NVIDIA A100-SXM4-40GB": 35.91759850809774, "core_hours": 35.91759850809774} {"step": 90100, "global_schedule": 0.1140742301940918, "l2_grads": 2.5902957916259766, "l2_params": 247.15670776367188, "l2_updates": 0.11913681030273438, "train/loss": 3.9980525970458984, "uptime": 16586.932468168, "examples_seen": 92262400.0, "progress": 0.8001563013418825, "epoch": 72.01434317306018, "img/sec/core": 628.5757993453203, "core_hours_NVIDIA A100-SXM4-40GB": 35.94022461339329, "core_hours": 35.94022461339329} {"step": 90150, "global_schedule": 0.11358794569969177, "l2_grads": 2.5479183197021484, "l2_params": 247.10711669921875, "l2_updates": 0.12044331431388855, "train/loss": 1.5420032739639282, "uptime": 16596.149386807003, "examples_seen": 92313600.0, "progress": 0.800600339244958, "epoch": 72.05430673752915, "img/sec/core": 694.3752300164617, "core_hours_NVIDIA A100-SXM4-40GB": 35.96070665481329, "core_hours": 35.96070665481329} {"step": 90200, "global_schedule": 0.11310264468193054, "l2_grads": 2.514979362487793, "l2_params": 247.05517578125, "l2_updates": 0.12151488661766052, "train/loss": 1.6146330833435059, "uptime": 16604.626377952998, "examples_seen": 92364800.0, "progress": 0.8010443771480333, "epoch": 72.0942703019981, "img/sec/core": 754.9848631162913, "core_hours_NVIDIA A100-SXM4-40GB": 35.979544412915516, "core_hours": 35.979544412915516} {"step": 90250, "global_schedule": 0.11261814832687378, "l2_grads": 2.3822555541992188, "l2_params": 247.00340270996094, "l2_updates": 0.12262389063835144, "train/loss": 1.7080271244049072, "uptime": 16613.163044394, "examples_seen": 92416000.0, "progress": 0.8014884150511088, "epoch": 72.13423386646706, "img/sec/core": 749.7071654647835, "core_hours_NVIDIA A100-SXM4-40GB": 35.9985147827844, "core_hours": 35.9985147827844} {"step": 90300, "global_schedule": 0.11213472485542297, "l2_grads": 2.4992291927337646, "l2_params": 246.95240783691406, "l2_updates": 0.12030305713415146, "train/loss": 1.7306549549102783, "uptime": 16621.829203583, "examples_seen": 92467200.0, "progress": 0.8019324529541841, "epoch": 72.17419743093602, "img/sec/core": 738.5047816941907, "core_hours_NVIDIA A100-SXM4-40GB": 36.017772914315515, "core_hours": 36.017772914315515} {"step": 90350, "global_schedule": 0.11165207624435425, "l2_grads": 2.481097459793091, "l2_params": 246.9031524658203, "l2_updates": 0.11762033402919769, "train/loss": 3.7235138416290283, "uptime": 16631.300480418002, "examples_seen": 92518400.0, "progress": 0.8023764908572596, "epoch": 72.21416099540497, "img/sec/core": 675.7272658686871, "core_hours_NVIDIA A100-SXM4-40GB": 36.038820196171066, "core_hours": 36.038820196171066} {"step": 90400, "global_schedule": 0.11117038130760193, "l2_grads": 2.482228994369507, "l2_params": 246.85372924804688, "l2_updates": 0.11744660884141922, "train/loss": 1.7025229930877686, "uptime": 16640.854198350004, "examples_seen": 92569600.0, "progress": 0.8028205287603349, "epoch": 72.25412455987393, "img/sec/core": 669.8962692379843, "core_hours_NVIDIA A100-SXM4-40GB": 36.06005068046441, "core_hours": 36.06005068046441} {"step": 90450, "global_schedule": 0.11068955063819885, "l2_grads": 2.1247527599334717, "l2_params": 246.80291748046875, "l2_updates": 0.11838717758655548, "train/loss": 2.620372772216797, "uptime": 16650.342487643, "examples_seen": 92620800.0, "progress": 0.8032645666634104, "epoch": 72.29408812434288, "img/sec/core": 674.515690064554, "core_hours_NVIDIA A100-SXM4-40GB": 36.08113576778218, "core_hours": 36.08113576778218} {"step": 90500, "global_schedule": 0.11020976305007935, "l2_grads": 2.249781847000122, "l2_params": 246.75753784179688, "l2_updates": 0.11779525130987167, "train/loss": 1.7138885259628296, "uptime": 16659.830118644997, "examples_seen": 92672000.0, "progress": 0.8037086045664857, "epoch": 72.33405168881184, "img/sec/core": 674.5624907474536, "core_hours_NVIDIA A100-SXM4-40GB": 36.10221939223106, "core_hours": 36.10221939223106} {"step": 90550, "global_schedule": 0.10973075032234192, "l2_grads": 2.386775016784668, "l2_params": 246.70631408691406, "l2_updates": 0.11699708551168442, "train/loss": 1.7135926485061646, "uptime": 16668.928158359, "examples_seen": 92723200.0, "progress": 0.8041526424695612, "epoch": 72.3740152532808, "img/sec/core": 703.4482373330354, "core_hours_NVIDIA A100-SXM4-40GB": 36.12243725826218, "core_hours": 36.12243725826218} {"step": 90600, "global_schedule": 0.10925272107124329, "l2_grads": 2.246089220046997, "l2_params": 246.65919494628906, "l2_updates": 0.11642130464315414, "train/loss": 2.5328030586242676, "uptime": 16677.793227262002, "examples_seen": 92774400.0, "progress": 0.8045966803726367, "epoch": 72.41397881774975, "img/sec/core": 721.9346031065985, "core_hours_NVIDIA A100-SXM4-40GB": 36.142137411379956, "core_hours": 36.142137411379956} {"step": 90650, "global_schedule": 0.10877561569213867, "l2_grads": 2.617741107940674, "l2_params": 246.60670471191406, "l2_updates": 0.11379580944776535, "train/loss": 3.9700875282287598, "uptime": 16686.326525705, "examples_seen": 92825600.0, "progress": 0.805040718275712, "epoch": 72.45394238221871, "img/sec/core": 750.0030665458481, "core_hours_NVIDIA A100-SXM4-40GB": 36.16110029680885, "core_hours": 36.16110029680885} {"step": 90700, "global_schedule": 0.10829934477806091, "l2_grads": 2.2566463947296143, "l2_params": 246.55535888671875, "l2_updates": 0.11566433310508728, "train/loss": 1.6646366119384766, "uptime": 16694.897582409, "examples_seen": 92876800.0, "progress": 0.8054847561787875, "epoch": 72.49390594668766, "img/sec/core": 746.6990618569612, "core_hours_NVIDIA A100-SXM4-40GB": 36.1801470894844, "core_hours": 36.1801470894844} {"step": 90750, "global_schedule": 0.10782414674758911, "l2_grads": 2.5172948837280273, "l2_params": 246.50344848632812, "l2_updates": 0.11372049152851105, "train/loss": 1.5394147634506226, "uptime": 16704.211092106998, "examples_seen": 92928000.0, "progress": 0.8059287940818628, "epoch": 72.53386951115662, "img/sec/core": 687.1738160506841, "core_hours_NVIDIA A100-SXM4-40GB": 36.20084377770218, "core_hours": 36.20084377770218} {"step": 90800, "global_schedule": 0.10734972357749939, "l2_grads": 2.2748281955718994, "l2_params": 246.45115661621094, "l2_updates": 0.11468406021595001, "train/loss": 2.0143890380859375, "uptime": 16712.895224747, "examples_seen": 92979200.0, "progress": 0.8063728319849383, "epoch": 72.57383307562559, "img/sec/core": 736.9763067092827, "core_hours_NVIDIA A100-SXM4-40GB": 36.220141850235514, "core_hours": 36.220141850235514} {"step": 90850, "global_schedule": 0.10687628388404846, "l2_grads": 2.232466220855713, "l2_params": 246.3987579345703, "l2_updates": 0.11476340144872665, "train/loss": 2.070209264755249, "uptime": 16721.514468858004, "examples_seen": 93030400.0, "progress": 0.8068168698880136, "epoch": 72.61379664009453, "img/sec/core": 742.5245088289981, "core_hours_NVIDIA A100-SXM4-40GB": 36.23929572603774, "core_hours": 36.23929572603774} {"step": 90900, "global_schedule": 0.10640367865562439, "l2_grads": 2.173201084136963, "l2_params": 246.34756469726562, "l2_updates": 0.11399044096469879, "train/loss": 2.9039342403411865, "uptime": 16730.174307850997, "examples_seen": 93081600.0, "progress": 0.807260907791089, "epoch": 72.6537602045635, "img/sec/core": 739.0437634205051, "core_hours_NVIDIA A100-SXM4-40GB": 36.258539812688845, "core_hours": 36.258539812688845} {"step": 90950, "global_schedule": 0.1059320867061615, "l2_grads": 2.293255090713501, "l2_params": 246.29896545410156, "l2_updates": 0.11487658321857452, "train/loss": 1.673622488975525, "uptime": 16738.572096496, "examples_seen": 93132800.0, "progress": 0.8077049456941644, "epoch": 72.69372376903246, "img/sec/core": 762.1053911388526, "core_hours_NVIDIA A100-SXM4-40GB": 36.27720156523329, "core_hours": 36.27720156523329} {"step": 91000, "global_schedule": 0.10546141862869263, "l2_grads": 2.5525896549224854, "l2_params": 246.25247192382812, "l2_updates": 0.11265803873538971, "train/loss": 1.6272481679916382, "uptime": 16747.269153082, "examples_seen": 93184000.0, "progress": 0.8081489835972399, "epoch": 72.73368733350141, "img/sec/core": 735.8811497562174, "core_hours_NVIDIA A100-SXM4-40GB": 36.29652835764662, "core_hours": 36.29652835764662} {"step": 91050, "global_schedule": 0.10499167442321777, "l2_grads": 2.5862009525299072, "l2_params": 246.2035369873047, "l2_updates": 0.110916368663311, "train/loss": 1.5371967554092407, "uptime": 16756.438891368, "examples_seen": 93235200.0, "progress": 0.8085930215003153, "epoch": 72.77365089797037, "img/sec/core": 781.8031640079619, "core_hours_NVIDIA A100-SXM4-40GB": 36.31471992155551, "core_hours": 36.31471992155551} {"step": 91100, "global_schedule": 0.10452279448509216, "l2_grads": 2.5394716262817383, "l2_params": 246.15309143066406, "l2_updates": 0.11118563264608383, "train/loss": 1.7657732963562012, "uptime": 16765.897245359003, "examples_seen": 93286400.0, "progress": 0.8090370594033907, "epoch": 72.81361446243932, "img/sec/core": 676.6505045263315, "core_hours_NVIDIA A100-SXM4-40GB": 36.33573848597996, "core_hours": 36.33573848597996} {"step": 91150, "global_schedule": 0.10405489802360535, "l2_grads": 2.480292797088623, "l2_params": 246.1043701171875, "l2_updates": 0.11349547654390335, "train/loss": 1.617598533630371, "uptime": 16774.632002397004, "examples_seen": 93337600.0, "progress": 0.8094810973064661, "epoch": 72.85357802690828, "img/sec/core": 732.70498219432, "core_hours_NVIDIA A100-SXM4-40GB": 36.35514905717552, "core_hours": 36.35514905717552} {"step": 91200, "global_schedule": 0.10358792543411255, "l2_grads": 2.4754388332366943, "l2_params": 246.05455017089844, "l2_updates": 0.10967330634593964, "train/loss": 1.672536015510559, "uptime": 16783.603575690002, "examples_seen": 93388800.0, "progress": 0.8099251352095415, "epoch": 72.89354159137724, "img/sec/core": 713.3642886242623, "core_hours_NVIDIA A100-SXM4-40GB": 36.37508588671551, "core_hours": 36.37508588671551} {"step": 91250, "global_schedule": 0.10312190651893616, "l2_grads": 2.471407890319824, "l2_params": 246.00245666503906, "l2_updates": 0.10974129289388657, "train/loss": 1.525846242904663, "uptime": 16793.037030146, "examples_seen": 93440000.0, "progress": 0.8103691731126169, "epoch": 72.93350515584619, "img/sec/core": 678.4365186529269, "core_hours_NVIDIA A100-SXM4-40GB": 36.39604911883996, "core_hours": 36.39604911883996} {"step": 91300, "global_schedule": 0.1026567816734314, "l2_grads": 2.240370273590088, "l2_params": 245.9570770263672, "l2_updates": 0.11148197203874588, "train/loss": 2.436889171600342, "uptime": 16802.294852191997, "examples_seen": 93491200.0, "progress": 0.8108132110156923, "epoch": 72.97346872031515, "img/sec/core": 691.307304050685, "core_hours_NVIDIA A100-SXM4-40GB": 36.41662205671995, "core_hours": 36.41662205671995} {"step": 91350, "global_schedule": 0.10219255089759827, "l2_grads": 2.222341775894165, "l2_params": 245.90866088867188, "l2_updates": 0.10899277776479721, "train/loss": 2.1068484783172607, "uptime": 16811.854466295998, "examples_seen": 93542400.0, "progress": 0.8112572489187677, "epoch": 73.0134322847841, "img/sec/core": 669.483091092739, "core_hours_NVIDIA A100-SXM4-40GB": 36.437865643617734, "core_hours": 36.437865643617734} {"step": 91400, "global_schedule": 0.10172930359840393, "l2_grads": 2.308473587036133, "l2_params": 245.8611297607422, "l2_updates": 0.10781458020210266, "train/loss": 2.7599592208862305, "uptime": 16821.300767715, "examples_seen": 93593600.0, "progress": 0.8117012868218431, "epoch": 73.05339584925306, "img/sec/core": 677.5138454852695, "core_hours_NVIDIA A100-SXM4-40GB": 36.45885742454884, "core_hours": 36.45885742454884} {"step": 91450, "global_schedule": 0.10126692056655884, "l2_grads": 2.1778082847595215, "l2_params": 245.8126678466797, "l2_updates": 0.10879312455654144, "train/loss": 2.586796283721924, "uptime": 16830.410857937997, "examples_seen": 93644800.0, "progress": 0.8121453247249185, "epoch": 73.09335941372203, "img/sec/core": 702.5177405864434, "core_hours_NVIDIA A100-SXM4-40GB": 36.47910206948884, "core_hours": 36.47910206948884} {"step": 91500, "global_schedule": 0.1008056104183197, "l2_grads": 2.3184025287628174, "l2_params": 245.7638702392578, "l2_updates": 0.1048094853758812, "train/loss": 2.6842620372772217, "uptime": 16839.890132119, "examples_seen": 93696000.0, "progress": 0.812589362627994, "epoch": 73.13332297819098, "img/sec/core": 675.1571774162788, "core_hours_NVIDIA A100-SXM4-40GB": 36.5001671232244, "core_hours": 36.5001671232244} {"step": 91550, "global_schedule": 0.10034510493278503, "l2_grads": 2.2921090126037598, "l2_params": 245.7184295654297, "l2_updates": 0.10628648102283478, "train/loss": 3.1852118968963623, "uptime": 16849.246385303, "examples_seen": 93747200.0, "progress": 0.8130334005310693, "epoch": 73.17328654265994, "img/sec/core": 684.0345033570372, "core_hours_NVIDIA A100-SXM4-40GB": 36.52095879696662, "core_hours": 36.52095879696662} {"step": 91600, "global_schedule": 0.09988561272621155, "l2_grads": 2.5006659030914307, "l2_params": 245.67149353027344, "l2_updates": 0.10644591599702835, "train/loss": 3.7130537033081055, "uptime": 16857.909005837, "examples_seen": 93798400.0, "progress": 0.8134774384341448, "epoch": 73.21325010712889, "img/sec/core": 738.8064587246638, "core_hours_NVIDIA A100-SXM4-40GB": 36.540209064819955, "core_hours": 36.540209064819955} {"step": 91650, "global_schedule": 0.0994269847869873, "l2_grads": 2.487670660018921, "l2_params": 245.6234893798828, "l2_updates": 0.10629861056804657, "train/loss": 1.6243149042129517, "uptime": 16867.113715629, "examples_seen": 93849600.0, "progress": 0.8139214763372201, "epoch": 73.25321367159785, "img/sec/core": 695.2962281941926, "core_hours_NVIDIA A100-SXM4-40GB": 36.56066397546884, "core_hours": 36.56066397546884} {"step": 91700, "global_schedule": 0.09896942973136902, "l2_grads": 2.4722402095794678, "l2_params": 245.5781707763672, "l2_updates": 0.1071227416396141, "train/loss": 1.6244975328445435, "uptime": 16876.369187090997, "examples_seen": 93900800.0, "progress": 0.8143655142402956, "epoch": 73.29317723606681, "img/sec/core": 691.4828732688081, "core_hours_NVIDIA A100-SXM4-40GB": 36.58123168982884, "core_hours": 36.58123168982884} {"step": 91750, "global_schedule": 0.0985126793384552, "l2_grads": 2.3672897815704346, "l2_params": 245.5314483642578, "l2_updates": 0.10553296655416489, "train/loss": 1.6611531972885132, "uptime": 16885.092041183998, "examples_seen": 93952000.0, "progress": 0.8148095521433709, "epoch": 73.33314080053576, "img/sec/core": 733.704809431038, "core_hours_NVIDIA A100-SXM4-40GB": 36.60061581003551, "core_hours": 36.60061581003551} {"step": 91800, "global_schedule": 0.09805694222450256, "l2_grads": 2.465367078781128, "l2_params": 245.4855499267578, "l2_updates": 0.10491595417261124, "train/loss": 2.9551002979278564, "uptime": 16894.292278766, "examples_seen": 94003200.0, "progress": 0.8152535900464464, "epoch": 73.37310436500472, "img/sec/core": 695.6342097643897, "core_hours_NVIDIA A100-SXM4-40GB": 36.621060782439955, "core_hours": 36.621060782439955} {"step": 91850, "global_schedule": 0.09760212898254395, "l2_grads": 2.3916444778442383, "l2_params": 245.43869018554688, "l2_updates": 0.10357032716274261, "train/loss": 2.8807857036590576, "uptime": 16902.659920044003, "examples_seen": 94054400.0, "progress": 0.8156976279495217, "epoch": 73.41306792947367, "img/sec/core": 764.8511435147594, "core_hours_NVIDIA A100-SXM4-40GB": 36.63965554083551, "core_hours": 36.63965554083551} {"step": 91900, "global_schedule": 0.09714820981025696, "l2_grads": 2.3673558235168457, "l2_params": 245.3907928466797, "l2_updates": 0.10406212508678436, "train/loss": 1.6336909532546997, "uptime": 16911.159780431, "examples_seen": 94105600.0, "progress": 0.8161416658525972, "epoch": 73.45303149394263, "img/sec/core": 752.9535437767646, "core_hours_NVIDIA A100-SXM4-40GB": 36.65854411947329, "core_hours": 36.65854411947329} {"step": 91950, "global_schedule": 0.09669536352157593, "l2_grads": 2.276313066482544, "l2_params": 245.3433074951172, "l2_updates": 0.10353925079107285, "train/loss": 2.5199692249298096, "uptime": 16919.669474172, "examples_seen": 94156800.0, "progress": 0.8165857037556726, "epoch": 73.4929950584116, "img/sec/core": 752.0834703094012, "core_hours_NVIDIA A100-SXM4-40GB": 36.67745455000885, "core_hours": 36.67745455000885} {"step": 92000, "global_schedule": 0.09624332189559937, "l2_grads": 2.389901876449585, "l2_params": 245.2966766357422, "l2_updates": 0.1022576093673706, "train/loss": 2.9512481689453125, "uptime": 16928.179197404002, "examples_seen": 94208000.0, "progress": 0.817029741658748, "epoch": 73.53295862288054, "img/sec/core": 752.0808639149525, "core_hours_NVIDIA A100-SXM4-40GB": 36.696365046079954, "core_hours": 36.696365046079954} {"step": 92050, "global_schedule": 0.09579229354858398, "l2_grads": 2.4308230876922607, "l2_params": 245.24957275390625, "l2_updates": 0.10409116744995117, "train/loss": 1.6283375024795532, "uptime": 16937.685758843, "examples_seen": 94259200.0, "progress": 0.8174737795618234, "epoch": 73.5729221873495, "img/sec/core": 746.3364130275568, "core_hours_NVIDIA A100-SXM4-40GB": 36.715421093693294, "core_hours": 36.715421093693294} {"step": 92100, "global_schedule": 0.09534215927124023, "l2_grads": 2.3531947135925293, "l2_params": 245.20257568359375, "l2_updates": 0.10054271668195724, "train/loss": 3.429654836654663, "uptime": 16947.241219768002, "examples_seen": 94310400.0, "progress": 0.8179178174648988, "epoch": 73.61288575181845, "img/sec/core": 669.7740747655702, "core_hours_NVIDIA A100-SXM4-40GB": 36.7366554513044, "core_hours": 36.7366554513044} {"step": 92150, "global_schedule": 0.09489300847053528, "l2_grads": 2.2365975379943848, "l2_params": 245.15745544433594, "l2_updates": 0.10106737911701202, "train/loss": 3.1490941047668457, "uptime": 16956.601580383, "examples_seen": 94361600.0, "progress": 0.8183618553679742, "epoch": 73.65284931628742, "img/sec/core": 683.7343413612306, "core_hours_NVIDIA A100-SXM4-40GB": 36.75745625267107, "core_hours": 36.75745625267107} {"step": 92200, "global_schedule": 0.09444484114646912, "l2_grads": 2.4537017345428467, "l2_params": 245.10858154296875, "l2_updates": 0.10174848884344101, "train/loss": 1.6121805906295776, "uptime": 16965.33659557, "examples_seen": 94412800.0, "progress": 0.8188058932710496, "epoch": 73.69281288075638, "img/sec/core": 732.6833283042084, "core_hours_NVIDIA A100-SXM4-40GB": 36.77686739753107, "core_hours": 36.77686739753107} {"step": 92250, "global_schedule": 0.09399762749671936, "l2_grads": 2.3009212017059326, "l2_params": 245.0641326904297, "l2_updates": 0.10007758438587189, "train/loss": 1.7409117221832275, "uptime": 16974.350722536, "examples_seen": 94464000.0, "progress": 0.819249931174125, "epoch": 73.73277644522533, "img/sec/core": 709.9966557095662, "core_hours_NVIDIA A100-SXM4-40GB": 36.796898790788845, "core_hours": 36.796898790788845} {"step": 92300, "global_schedule": 0.09355127811431885, "l2_grads": 2.3524560928344727, "l2_params": 245.01731872558594, "l2_updates": 0.09997714310884476, "train/loss": 1.5799630880355835, "uptime": 16982.837635212003, "examples_seen": 94515200.0, "progress": 0.8196939690772004, "epoch": 73.77274000969429, "img/sec/core": 754.1022565363207, "core_hours_NVIDIA A100-SXM4-40GB": 36.81575859673551, "core_hours": 36.81575859673551} {"step": 92350, "global_schedule": 0.09310594201087952, "l2_grads": 2.250988483428955, "l2_params": 244.97373962402344, "l2_updates": 0.09879890084266663, "train/loss": 2.47944712638855, "uptime": 16991.159738217, "examples_seen": 94566400.0, "progress": 0.8201380069802758, "epoch": 73.81270357416324, "img/sec/core": 769.0363837306727, "core_hours_NVIDIA A100-SXM4-40GB": 36.83425215896885, "core_hours": 36.83425215896885} {"step": 92400, "global_schedule": 0.09266158938407898, "l2_grads": 2.4051761627197266, "l2_params": 244.9264373779297, "l2_updates": 0.09973477572202682, "train/loss": 1.7437576055526733, "uptime": 17000.391035296998, "examples_seen": 94617600.0, "progress": 0.8205820448833513, "epoch": 73.8526671386322, "img/sec/core": 693.293688258342, "core_hours_NVIDIA A100-SXM4-40GB": 36.85476615247996, "core_hours": 36.85476615247996} {"step": 92450, "global_schedule": 0.09221816062927246, "l2_grads": 2.421105146408081, "l2_params": 244.8828125, "l2_updates": 0.0969834178686142, "train/loss": 3.4813549518585205, "uptime": 17009.568071256, "examples_seen": 94668800.0, "progress": 0.8210260827864266, "epoch": 73.89263070310116, "img/sec/core": 697.3929304181067, "core_hours_NVIDIA A100-SXM4-40GB": 36.87515956572218, "core_hours": 36.87515956572218} {"step": 92500, "global_schedule": 0.09177571535110474, "l2_grads": 2.384312629699707, "l2_params": 244.83526611328125, "l2_updates": 0.09833041578531265, "train/loss": 1.612502932548523, "uptime": 17018.779980740997, "examples_seen": 94720000.0, "progress": 0.8214701206895021, "epoch": 73.93259426757011, "img/sec/core": 694.752809981715, "core_hours_NVIDIA A100-SXM4-40GB": 36.89563047568884, "core_hours": 36.89563047568884, "val/acc@1": 0.75138, "val/loss": 0.994913837890625, "z/secs/eval/val": 3.55312373599736} {"step": 92550, "global_schedule": 0.09133413434028625, "l2_grads": 2.463043451309204, "l2_params": 244.7908935546875, "l2_updates": 0.09811152517795563, "train/loss": 1.6995915174484253, "uptime": 17031.261381099997, "examples_seen": 94771200.0, "progress": 0.8219141585925774, "epoch": 73.97255783203907, "img/sec/core": 716.9716126157236, "core_hours_NVIDIA A100-SXM4-40GB": 36.91546699637107, "core_hours": 36.91546699637107} {"step": 92600, "global_schedule": 0.09089359641075134, "l2_grads": 2.6080050468444824, "l2_params": 244.74378967285156, "l2_updates": 0.09720872342586517, "train/loss": 1.5636509656906128, "uptime": 17040.479844526002, "examples_seen": 94822400.0, "progress": 0.8223581964956529, "epoch": 74.01252139650802, "img/sec/core": 694.2588698620315, "core_hours_NVIDIA A100-SXM4-40GB": 36.935952470651074, "core_hours": 36.935952470651074} {"step": 92650, "global_schedule": 0.09045392274856567, "l2_grads": 2.5452721118927, "l2_params": 244.7015380859375, "l2_updates": 0.09651830792427063, "train/loss": 1.5387616157531738, "uptime": 17049.003742643, "examples_seen": 94873600.0, "progress": 0.8228022343987282, "epoch": 74.05248496097698, "img/sec/core": 750.830184987255, "core_hours_NVIDIA A100-SXM4-40GB": 36.954894466466634, "core_hours": 36.954894466466634} {"step": 92700, "global_schedule": 0.09001538157463074, "l2_grads": 2.5869462490081787, "l2_params": 244.6553497314453, "l2_updates": 0.0954032614827156, "train/loss": 1.7489137649536133, "uptime": 17057.633960869003, "examples_seen": 94924800.0, "progress": 0.8232462723018037, "epoch": 74.09244852544595, "img/sec/core": 741.5803207291424, "core_hours_NVIDIA A100-SXM4-40GB": 36.97407272919108, "core_hours": 36.97407272919108} {"step": 92750, "global_schedule": 0.08957764506340027, "l2_grads": 2.509046792984009, "l2_params": 244.6082000732422, "l2_updates": 0.09679347276687622, "train/loss": 1.6247906684875488, "uptime": 17067.001246614003, "examples_seen": 94976000.0, "progress": 0.823690310204879, "epoch": 74.1324120899149, "img/sec/core": 683.2288641793664, "core_hours_NVIDIA A100-SXM4-40GB": 36.99488891973552, "core_hours": 36.99488891973552} {"step": 92800, "global_schedule": 0.08914095163345337, "l2_grads": 2.667522430419922, "l2_params": 244.5654754638672, "l2_updates": 0.09426168352365494, "train/loss": 1.6922820806503296, "uptime": 17076.035442241002, "examples_seen": 95027200.0, "progress": 0.8241343481079545, "epoch": 74.17237565438386, "img/sec/core": 708.4194613711595, "core_hours_NVIDIA A100-SXM4-40GB": 37.01496491001774, "core_hours": 37.01496491001774} {"step": 92850, "global_schedule": 0.08870512247085571, "l2_grads": 2.640186309814453, "l2_params": 244.52488708496094, "l2_updates": 0.09402498602867126, "train/loss": 1.5948785543441772, "uptime": 17085.23594379, "examples_seen": 95078400.0, "progress": 0.82457838601103, "epoch": 74.21233921885282, "img/sec/core": 695.6142516704422, "core_hours_NVIDIA A100-SXM4-40GB": 37.035410469015524, "core_hours": 37.035410469015524} {"step": 92900, "global_schedule": 0.08827036619186401, "l2_grads": 2.301151752471924, "l2_params": 244.480224609375, "l2_updates": 0.09295184910297394, "train/loss": 2.877965211868286, "uptime": 17094.037789496004, "examples_seen": 95129600.0, "progress": 0.8250224239141053, "epoch": 74.25230278332177, "img/sec/core": 727.1202215730121, "core_hours_NVIDIA A100-SXM4-40GB": 37.05497012613997, "core_hours": 37.05497012613997} {"step": 92950, "global_schedule": 0.08783656358718872, "l2_grads": 2.5292246341705322, "l2_params": 244.4390869140625, "l2_updates": 0.09365926682949066, "train/loss": 1.6402828693389893, "uptime": 17103.363900361997, "examples_seen": 95180800.0, "progress": 0.8254664618171808, "epoch": 74.29226634779073, "img/sec/core": 686.2453269062323, "core_hours_NVIDIA A100-SXM4-40GB": 37.075694816953295, "core_hours": 37.075694816953295} {"step": 93000, "global_schedule": 0.08740371465682983, "l2_grads": 2.4690072536468506, "l2_params": 244.39381408691406, "l2_updates": 0.09339363127946854, "train/loss": 1.49106764793396, "uptime": 17112.816321917002, "examples_seen": 95232000.0, "progress": 0.8259104997202561, "epoch": 74.33222991225968, "img/sec/core": 677.0751772717974, "core_hours_NVIDIA A100-SXM4-40GB": 37.09670019818663, "core_hours": 37.09670019818663} {"step": 93050, "global_schedule": 0.08697181940078735, "l2_grads": 2.465553045272827, "l2_params": 244.35568237304688, "l2_updates": 0.09239266812801361, "train/loss": 1.7146412134170532, "uptime": 17122.624256295, "examples_seen": 95283200.0, "progress": 0.8263545376233316, "epoch": 74.37219347672864, "img/sec/core": 703.2993566674468, "core_hours_NVIDIA A100-SXM4-40GB": 37.11692234411552, "core_hours": 37.11692234411552} {"step": 93100, "global_schedule": 0.08654084801673889, "l2_grads": 2.5032477378845215, "l2_params": 244.31419372558594, "l2_updates": 0.0921870693564415, "train/loss": 1.5754215717315674, "uptime": 17131.386991771004, "examples_seen": 95334400.0, "progress": 0.8267985755264069, "epoch": 74.4121570411976, "img/sec/core": 730.3655368267458, "core_hours_NVIDIA A100-SXM4-40GB": 37.13639508961774, "core_hours": 37.13639508961774} {"step": 93150, "global_schedule": 0.086110919713974, "l2_grads": 2.292546272277832, "l2_params": 244.26724243164062, "l2_updates": 0.09163866192102432, "train/loss": 2.206996202468872, "uptime": 17139.89008566, "examples_seen": 95385600.0, "progress": 0.8272426134294824, "epoch": 74.45212060566655, "img/sec/core": 752.667215433324, "core_hours_NVIDIA A100-SXM4-40GB": 37.155290853815515, "core_hours": 37.155290853815515} {"step": 93200, "global_schedule": 0.08568194508552551, "l2_grads": 2.438019275665283, "l2_params": 244.22360229492188, "l2_updates": 0.0925421193242073, "train/loss": 1.499851942062378, "uptime": 17148.459717832004, "examples_seen": 95436800.0, "progress": 0.8276866513325577, "epoch": 74.49208417013551, "img/sec/core": 746.8231858199485, "core_hours_NVIDIA A100-SXM4-40GB": 37.17433448086441, "core_hours": 37.17433448086441} {"step": 93250, "global_schedule": 0.08525395393371582, "l2_grads": 2.540304660797119, "l2_params": 244.1818389892578, "l2_updates": 0.091066375374794, "train/loss": 2.211088180541992, "uptime": 17156.911896689002, "examples_seen": 95488000.0, "progress": 0.8281306892356332, "epoch": 74.53204773460446, "img/sec/core": 757.2012031786268, "core_hours_NVIDIA A100-SXM4-40GB": 37.19311710054663, "core_hours": 37.19311710054663} {"step": 93300, "global_schedule": 0.08482685685157776, "l2_grads": 2.470001459121704, "l2_params": 244.1365203857422, "l2_updates": 0.09169424325227737, "train/loss": 1.8456732034683228, "uptime": 17165.638559411003, "examples_seen": 95539200.0, "progress": 0.8285747271387086, "epoch": 74.57201129907342, "img/sec/core": 733.3845943036671, "core_hours_NVIDIA A100-SXM4-40GB": 37.2125096843733, "core_hours": 37.2125096843733} {"step": 93350, "global_schedule": 0.08440080285072327, "l2_grads": 2.480319023132324, "l2_params": 244.09715270996094, "l2_updates": 0.09067334979772568, "train/loss": 1.5941675901412964, "uptime": 17174.542044055, "examples_seen": 95590400.0, "progress": 0.829018765041784, "epoch": 74.61197486354239, "img/sec/core": 718.8196819449696, "core_hours_NVIDIA A100-SXM4-40GB": 37.2322952058044, "core_hours": 37.2322952058044} {"step": 93400, "global_schedule": 0.08397570252418518, "l2_grads": 2.6064348220825195, "l2_params": 244.05470275878906, "l2_updates": 0.08915911614894867, "train/loss": 1.6675033569335938, "uptime": 17183.305593601, "examples_seen": 95641600.0, "progress": 0.8294628029448594, "epoch": 74.65193842801133, "img/sec/core": 730.2976911815281, "core_hours_NVIDIA A100-SXM4-40GB": 37.251769760351074, "core_hours": 37.251769760351074} {"step": 93450, "global_schedule": 0.08355161547660828, "l2_grads": 2.3693113327026367, "l2_params": 244.01065063476562, "l2_updates": 0.08946095407009125, "train/loss": 2.2849974632263184, "uptime": 17191.775655721, "examples_seen": 95692800.0, "progress": 0.8299068408479348, "epoch": 74.6919019924803, "img/sec/core": 755.6024866557547, "core_hours_NVIDIA A100-SXM4-40GB": 37.270592120617735, "core_hours": 37.270592120617735} {"step": 93500, "global_schedule": 0.083128422498703, "l2_grads": 2.646125316619873, "l2_params": 243.97052001953125, "l2_updates": 0.0882020965218544, "train/loss": 1.6828365325927734, "uptime": 17200.271409189, "examples_seen": 95744000.0, "progress": 0.8303508787510102, "epoch": 74.73186555694924, "img/sec/core": 753.3175278809997, "core_hours_NVIDIA A100-SXM4-40GB": 37.28947157276885, "core_hours": 37.28947157276885} {"step": 93550, "global_schedule": 0.08270624279975891, "l2_grads": 2.4581689834594727, "l2_params": 243.93289184570312, "l2_updates": 0.08774574100971222, "train/loss": 1.5721346139907837, "uptime": 17208.654098853003, "examples_seen": 95795200.0, "progress": 0.8307949166540856, "epoch": 74.77182912141821, "img/sec/core": 763.478102676711, "core_hours_NVIDIA A100-SXM4-40GB": 37.30809977202218, "core_hours": 37.30809977202218} {"step": 93600, "global_schedule": 0.082285076379776, "l2_grads": 2.5151705741882324, "l2_params": 243.894287109375, "l2_updates": 0.08760888129472733, "train/loss": 1.7047268152236938, "uptime": 17217.190245529004, "examples_seen": 95846400.0, "progress": 0.831238954557161, "epoch": 74.81179268588717, "img/sec/core": 749.7528150487027, "core_hours_NVIDIA A100-SXM4-40GB": 37.327068986857746, "core_hours": 37.327068986857746} {"step": 93650, "global_schedule": 0.08186489343643188, "l2_grads": 2.524643898010254, "l2_params": 243.85047912597656, "l2_updates": 0.08713249117136002, "train/loss": 1.6482725143432617, "uptime": 17226.176706305, "examples_seen": 95897600.0, "progress": 0.8316829924602364, "epoch": 74.85175625035612, "img/sec/core": 712.1824886937676, "core_hours_NVIDIA A100-SXM4-40GB": 37.347038899693295, "core_hours": 37.347038899693295} {"step": 93700, "global_schedule": 0.0814456045627594, "l2_grads": 2.5912013053894043, "l2_params": 243.81101989746094, "l2_updates": 0.0874861478805542, "train/loss": 1.6411606073379517, "uptime": 17234.310562524, "examples_seen": 95948800.0, "progress": 0.8321270303633118, "epoch": 74.89171981482508, "img/sec/core": 786.8346609140438, "core_hours_NVIDIA A100-SXM4-40GB": 37.36511413573552, "core_hours": 37.36511413573552} {"step": 93750, "global_schedule": 0.08102735877037048, "l2_grads": 2.3489797115325928, "l2_params": 243.7689971923828, "l2_updates": 0.08638399094343185, "train/loss": 2.305307149887085, "uptime": 17242.86059079, "examples_seen": 96000000.0, "progress": 0.8325710682663873, "epoch": 74.93168337929403, "img/sec/core": 748.5355370637228, "core_hours_NVIDIA A100-SXM4-40GB": 37.38411419854885, "core_hours": 37.38411419854885} {"step": 93800, "global_schedule": 0.08061012625694275, "l2_grads": 2.2692031860351562, "l2_params": 243.7279815673828, "l2_updates": 0.08644068241119385, "train/loss": 3.0410654544830322, "uptime": 17251.46216412, "examples_seen": 96051200.0, "progress": 0.8330151061694626, "epoch": 74.97164694376299, "img/sec/core": 744.0499260382722, "core_hours_NVIDIA A100-SXM4-40GB": 37.40322880594885, "core_hours": 37.40322880594885} {"step": 93850, "global_schedule": 0.08019378781318665, "l2_grads": 2.5849945545196533, "l2_params": 243.68109130859375, "l2_updates": 0.08588490635156631, "train/loss": 1.5324842929840088, "uptime": 17260.977661824, "examples_seen": 96102400.0, "progress": 0.8334591440725381, "epoch": 75.01161050823195, "img/sec/core": 672.5869942997882, "core_hours_NVIDIA A100-SXM4-40GB": 37.42437435640218, "core_hours": 37.42437435640218} {"step": 93900, "global_schedule": 0.07977855205535889, "l2_grads": 2.486041784286499, "l2_params": 243.64178466796875, "l2_updates": 0.08453471213579178, "train/loss": 1.9039562940597534, "uptime": 17269.496406362, "examples_seen": 96153600.0, "progress": 0.8339031819756134, "epoch": 75.0515740727009, "img/sec/core": 751.2844142058011, "core_hours_NVIDIA A100-SXM4-40GB": 37.443304899819964, "core_hours": 37.443304899819964} {"step": 93950, "global_schedule": 0.07936421036720276, "l2_grads": 2.3229994773864746, "l2_params": 243.60089111328125, "l2_updates": 0.08468276262283325, "train/loss": 2.9870779514312744, "uptime": 17278.194608683, "examples_seen": 96204800.0, "progress": 0.8343472198786889, "epoch": 75.09153763716986, "img/sec/core": 735.7842188320137, "core_hours_NVIDIA A100-SXM4-40GB": 37.462634238311075, "core_hours": 37.462634238311075} {"step": 94000, "global_schedule": 0.07895088195800781, "l2_grads": 2.502512216567993, "l2_params": 243.5635528564453, "l2_updates": 0.08343768864870071, "train/loss": 3.6596455574035645, "uptime": 17286.818920166, "examples_seen": 96256000.0, "progress": 0.8347912577817642, "epoch": 75.13150120163881, "img/sec/core": 742.0882249691341, "core_hours_NVIDIA A100-SXM4-40GB": 37.48179937493997, "core_hours": 37.48179937493997} {"step": 94050, "global_schedule": 0.07853847742080688, "l2_grads": 2.399972438812256, "l2_params": 243.5264129638672, "l2_updates": 0.08287351578474045, "train/loss": 2.2840118408203125, "uptime": 17296.213443303, "examples_seen": 96307200.0, "progress": 0.8352352956848397, "epoch": 75.17146476610777, "img/sec/core": 734.1365431395943, "core_hours_NVIDIA A100-SXM4-40GB": 37.50117209566219, "core_hours": 37.50117209566219} {"step": 94100, "global_schedule": 0.07812714576721191, "l2_grads": 2.460327625274658, "l2_params": 243.48794555664062, "l2_updates": 0.0834403708577156, "train/loss": 1.9664311408996582, "uptime": 17304.705682301, "examples_seen": 96358400.0, "progress": 0.835679333587915, "epoch": 75.21142833057674, "img/sec/core": 753.6292845156331, "core_hours_NVIDIA A100-SXM4-40GB": 37.520043737879966, "core_hours": 37.520043737879966} {"step": 94150, "global_schedule": 0.07771679759025574, "l2_grads": 2.5420384407043457, "l2_params": 243.4475860595703, "l2_updates": 0.08396319299936295, "train/loss": 1.5971347093582153, "uptime": 17313.211745815002, "examples_seen": 96409600.0, "progress": 0.8361233714909905, "epoch": 75.25139189504569, "img/sec/core": 752.4044453073343, "core_hours_NVIDIA A100-SXM4-40GB": 37.53894610124441, "core_hours": 37.53894610124441} {"step": 94200, "global_schedule": 0.07730743288993835, "l2_grads": 2.53171968460083, "l2_params": 243.4081573486328, "l2_updates": 0.08313128352165222, "train/loss": 1.5598121881484985, "uptime": 17321.851370764, "examples_seen": 96460800.0, "progress": 0.8365674093940659, "epoch": 75.29135545951465, "img/sec/core": 740.7728967148666, "core_hours_NVIDIA A100-SXM4-40GB": 37.55814526779774, "core_hours": 37.55814526779774} {"step": 94250, "global_schedule": 0.07689899206161499, "l2_grads": 2.5206351280212402, "l2_params": 243.37042236328125, "l2_updates": 0.0826534777879715, "train/loss": 1.6226279735565186, "uptime": 17330.915467764004, "examples_seen": 96512000.0, "progress": 0.8370114472971413, "epoch": 75.3313190239836, "img/sec/core": 706.082470211697, "core_hours_NVIDIA A100-SXM4-40GB": 37.578287705575526, "core_hours": 37.578287705575526} {"step": 94300, "global_schedule": 0.07649162411689758, "l2_grads": 2.4505553245544434, "l2_params": 243.33181762695312, "l2_updates": 0.08204136043787003, "train/loss": 2.048027753829956, "uptime": 17339.921865764998, "examples_seen": 96563200.0, "progress": 0.8374554852002167, "epoch": 75.37128258845256, "img/sec/core": 710.6059491586649, "core_hours_NVIDIA A100-SXM4-40GB": 37.59830192335552, "core_hours": 37.59830192335552} {"step": 94350, "global_schedule": 0.07608523964881897, "l2_grads": 2.6092488765716553, "l2_params": 243.2904510498047, "l2_updates": 0.08266197144985199, "train/loss": 1.5570456981658936, "uptime": 17348.541808461, "examples_seen": 96614400.0, "progress": 0.8378995231032921, "epoch": 75.41124615292152, "img/sec/core": 742.4643325029351, "core_hours_NVIDIA A100-SXM4-40GB": 37.61745735156886, "core_hours": 37.61745735156886} {"step": 94400, "global_schedule": 0.07567983865737915, "l2_grads": 2.3648247718811035, "l2_params": 243.25393676757812, "l2_updates": 0.08126980811357498, "train/loss": 2.497617244720459, "uptime": 17358.132438752, "examples_seen": 96665600.0, "progress": 0.8383435610063675, "epoch": 75.45120971739047, "img/sec/core": 667.3179765886075, "core_hours_NVIDIA A100-SXM4-40GB": 37.63876986332664, "core_hours": 37.63876986332664} {"step": 94450, "global_schedule": 0.07527545094490051, "l2_grads": 2.352963924407959, "l2_params": 243.21568298339844, "l2_updates": 0.07949239760637283, "train/loss": 2.687241554260254, "uptime": 17367.771969300004, "examples_seen": 96716800.0, "progress": 0.8387875989094429, "epoch": 75.49117328185943, "img/sec/core": 663.93274736059, "core_hours_NVIDIA A100-SXM4-40GB": 37.66019104232219, "core_hours": 37.66019104232219} {"step": 94500, "global_schedule": 0.0748719871044159, "l2_grads": 2.342111110687256, "l2_params": 243.17849731445312, "l2_updates": 0.08049360662698746, "train/loss": 3.1253397464752197, "uptime": 17377.212748217004, "examples_seen": 96768000.0, "progress": 0.8392316368125183, "epoch": 75.53113684632838, "img/sec/core": 677.9101657041809, "core_hours_NVIDIA A100-SXM4-40GB": 37.68117055102664, "core_hours": 37.68117055102664} {"step": 94550, "global_schedule": 0.07446956634521484, "l2_grads": 2.490800619125366, "l2_params": 243.14173889160156, "l2_updates": 0.08045714348554611, "train/loss": 1.4649507999420166, "uptime": 17386.077021579003, "examples_seen": 96819200.0, "progress": 0.8396756747155937, "epoch": 75.57110041079734, "img/sec/core": 721.9993944947607, "core_hours_NVIDIA A100-SXM4-40GB": 37.70086893627553, "core_hours": 37.70086893627553} {"step": 94600, "global_schedule": 0.07406815886497498, "l2_grads": 2.608426809310913, "l2_params": 243.10084533691406, "l2_updates": 0.07988032698631287, "train/loss": 1.577786922454834, "uptime": 17394.758782191, "examples_seen": 96870400.0, "progress": 0.8401197126186691, "epoch": 75.6110639752663, "img/sec/core": 737.1776631522177, "core_hours_NVIDIA A100-SXM4-40GB": 37.72016173763552, "core_hours": 37.72016173763552} {"step": 94650, "global_schedule": 0.0736677348613739, "l2_grads": 2.4266903400421143, "l2_params": 243.06265258789062, "l2_updates": 0.07833892852067947, "train/loss": 2.1211342811584473, "uptime": 17403.411095789997, "examples_seen": 96921600.0, "progress": 0.8405637505217446, "epoch": 75.65102753973525, "img/sec/core": 739.6865505129517, "core_hours_NVIDIA A100-SXM4-40GB": 37.739389101188856, "core_hours": 37.739389101188856} {"step": 94700, "global_schedule": 0.07326826453208923, "l2_grads": 2.5593760013580322, "l2_params": 243.0237274169922, "l2_updates": 0.07755203545093536, "train/loss": 1.721083402633667, "uptime": 17412.001907599, "examples_seen": 96972800.0, "progress": 0.8410077884248199, "epoch": 75.69099110420422, "img/sec/core": 744.9819810153912, "core_hours_NVIDIA A100-SXM4-40GB": 37.758479794097745, "core_hours": 37.758479794097745} {"step": 94750, "global_schedule": 0.07286986708641052, "l2_grads": 2.5172886848449707, "l2_params": 242.98805236816406, "l2_updates": 0.07787493616342545, "train/loss": 1.3849692344665527, "uptime": 17420.607181866, "examples_seen": 97024000.0, "progress": 0.8414518263278954, "epoch": 75.73095466867316, "img/sec/core": 743.7299267198434, "core_hours_NVIDIA A100-SXM4-40GB": 37.77760262580219, "core_hours": 37.77760262580219} {"step": 94800, "global_schedule": 0.07247239351272583, "l2_grads": 2.626498222351074, "l2_params": 242.94873046875, "l2_updates": 0.07786766439676285, "train/loss": 1.5447553396224976, "uptime": 17429.218431455003, "examples_seen": 97075200.0, "progress": 0.8418958642309707, "epoch": 75.77091823314213, "img/sec/core": 743.2138546041613, "core_hours_NVIDIA A100-SXM4-40GB": 37.796738735999966, "core_hours": 37.796738735999966} {"step": 94850, "global_schedule": 0.07207605242729187, "l2_grads": 2.445159673690796, "l2_params": 242.91452026367188, "l2_updates": 0.0759730190038681, "train/loss": 2.519770622253418, "uptime": 17438.262975147, "examples_seen": 97126400.0, "progress": 0.8423399021340462, "epoch": 75.81088179761109, "img/sec/core": 707.6089427996468, "core_hours_NVIDIA A100-SXM4-40GB": 37.81683772198219, "core_hours": 37.81683772198219} {"step": 94900, "global_schedule": 0.07168057560920715, "l2_grads": 2.489657402038574, "l2_params": 242.8751678466797, "l2_updates": 0.07691098004579544, "train/loss": 1.4831593036651611, "uptime": 17447.952908572, "examples_seen": 97177600.0, "progress": 0.8427839400371215, "epoch": 75.85084536208004, "img/sec/core": 660.4792540150287, "core_hours_NVIDIA A100-SXM4-40GB": 37.83837090737108, "core_hours": 37.83837090737108} {"step": 94950, "global_schedule": 0.0712861716747284, "l2_grads": 2.594482183456421, "l2_params": 242.83859252929688, "l2_updates": 0.07639233022928238, "train/loss": 1.605122447013855, "uptime": 17457.363923924997, "examples_seen": 97228800.0, "progress": 0.843227977940197, "epoch": 75.890808926549, "img/sec/core": 680.0541450568401, "core_hours_NVIDIA A100-SXM4-40GB": 37.85928427482218, "core_hours": 37.85928427482218} {"step": 95000, "global_schedule": 0.07089278101921082, "l2_grads": 2.374174118041992, "l2_params": 242.80084228515625, "l2_updates": 0.07545223832130432, "train/loss": 1.9480420351028442, "uptime": 17466.159896906, "examples_seen": 97280000.0, "progress": 0.8436720158432723, "epoch": 75.93077249101796, "img/sec/core": 727.6056911296271, "core_hours_NVIDIA A100-SXM4-40GB": 37.87883088144664, "core_hours": 37.87883088144664, "val/acc@1": 0.7543, "val/loss": 0.9844632897949219, "z/secs/eval/val": 2.5618762640006025} {"step": 95050, "global_schedule": 0.07050031423568726, "l2_grads": 2.4287500381469727, "l2_params": 242.76048278808594, "l2_updates": 0.07483506947755814, "train/loss": 1.3780514001846313, "uptime": 17478.676452788997, "examples_seen": 97331200.0, "progress": 0.8441160537463478, "epoch": 75.97073605548691, "img/sec/core": 717.2693131104069, "core_hours_NVIDIA A100-SXM4-40GB": 37.898659169039966, "core_hours": 37.898659169039966} {"step": 95100, "global_schedule": 0.07010897994041443, "l2_grads": 2.6749918460845947, "l2_params": 242.72354125976562, "l2_updates": 0.07433785498142242, "train/loss": 1.5769734382629395, "uptime": 17488.850324571, "examples_seen": 97382400.0, "progress": 0.8445600916494233, "epoch": 76.01069961995587, "img/sec/core": 629.0623802948478, "core_hours_NVIDIA A100-SXM4-40GB": 37.92126777299997, "core_hours": 37.92126777299997} {"step": 95150, "global_schedule": 0.06971853971481323, "l2_grads": 2.5571653842926025, "l2_params": 242.68768310546875, "l2_updates": 0.07468225061893463, "train/loss": 1.53322172164917, "uptime": 17497.673152034004, "examples_seen": 97433600.0, "progress": 0.8450041295524986, "epoch": 76.05066318442482, "img/sec/core": 725.3910412323147, "core_hours_NVIDIA A100-SXM4-40GB": 37.94087405625108, "core_hours": 37.94087405625108} {"step": 95200, "global_schedule": 0.069329172372818, "l2_grads": 2.6612322330474854, "l2_params": 242.65087890625, "l2_updates": 0.07416853308677673, "train/loss": 3.664583683013916, "uptime": 17507.295404086, "examples_seen": 97484800.0, "progress": 0.845448167455574, "epoch": 76.09062674889378, "img/sec/core": 665.1249588364964, "core_hours_NVIDIA A100-SXM4-40GB": 37.96225683858886, "core_hours": 37.96225683858886} {"step": 95250, "global_schedule": 0.06894075870513916, "l2_grads": 2.484476327896118, "l2_params": 242.61553955078125, "l2_updates": 0.07440667599439621, "train/loss": 1.8946620225906372, "uptime": 17516.737787361002, "examples_seen": 97536000.0, "progress": 0.8458922053586494, "epoch": 76.13059031336275, "img/sec/core": 677.7949817971224, "core_hours_NVIDIA A100-SXM4-40GB": 37.98323991253331, "core_hours": 37.98323991253331} {"step": 95300, "global_schedule": 0.06855341792106628, "l2_grads": 2.372303009033203, "l2_params": 242.5806884765625, "l2_updates": 0.0724954828619957, "train/loss": 2.3574209213256836, "uptime": 17525.402413105003, "examples_seen": 97587200.0, "progress": 0.8463362432617249, "epoch": 76.1705538778317, "img/sec/core": 738.635480526245, "core_hours_NVIDIA A100-SXM4-40GB": 38.00249463640886, "core_hours": 38.00249463640886} {"step": 95350, "global_schedule": 0.0681670606136322, "l2_grads": 2.448540210723877, "l2_params": 242.54483032226562, "l2_updates": 0.0730249434709549, "train/loss": 1.7293732166290283, "uptime": 17533.962674087, "examples_seen": 97638400.0, "progress": 0.8467802811648002, "epoch": 76.21051744230066, "img/sec/core": 747.6407569183965, "core_hours_NVIDIA A100-SXM4-40GB": 38.021517438591076, "core_hours": 38.021517438591076} {"step": 95400, "global_schedule": 0.06778174638748169, "l2_grads": 2.756514072418213, "l2_params": 242.5083770751953, "l2_updates": 0.07254133373498917, "train/loss": 3.8320300579071045, "uptime": 17542.657818557003, "examples_seen": 97689600.0, "progress": 0.8472243190678757, "epoch": 76.2504810067696, "img/sec/core": 736.0429745680942, "core_hours_NVIDIA A100-SXM4-40GB": 38.04083998185775, "core_hours": 38.04083998185775} {"step": 95450, "global_schedule": 0.06739738583564758, "l2_grads": 2.527301073074341, "l2_params": 242.47496032714844, "l2_updates": 0.07103903591632843, "train/loss": 2.281034231185913, "uptime": 17551.672500578003, "examples_seen": 97740800.0, "progress": 0.847668356970951, "epoch": 76.29044457123857, "img/sec/core": 709.9529395592073, "core_hours_NVIDIA A100-SXM4-40GB": 38.06087260857108, "core_hours": 38.06087260857108} {"step": 95500, "global_schedule": 0.06701406836509705, "l2_grads": 2.4592161178588867, "l2_params": 242.44027709960938, "l2_updates": 0.0713619515299797, "train/loss": 3.4870641231536865, "uptime": 17561.337574108, "examples_seen": 97792000.0, "progress": 0.8481123948740265, "epoch": 76.33040813570753, "img/sec/core": 662.1780972628172, "core_hours_NVIDIA A100-SXM4-40GB": 38.08235054974886, "core_hours": 38.08235054974886} {"step": 95550, "global_schedule": 0.06663179397583008, "l2_grads": 2.526015043258667, "l2_params": 242.40371704101562, "l2_updates": 0.0721343532204628, "train/loss": 1.5164514780044556, "uptime": 17570.007084203004, "examples_seen": 97843200.0, "progress": 0.8485564327771018, "epoch": 76.37037170017648, "img/sec/core": 738.2193376405082, "core_hours_NVIDIA A100-SXM4-40GB": 38.10161612773775, "core_hours": 38.10161612773775} {"step": 95600, "global_schedule": 0.06625053286552429, "l2_grads": 2.521150827407837, "l2_params": 242.36741638183594, "l2_updates": 0.07203762233257294, "train/loss": 1.4565908908843994, "uptime": 17578.814860341, "examples_seen": 97894400.0, "progress": 0.8490004706801773, "epoch": 76.41033526464544, "img/sec/core": 726.6306386228429, "core_hours_NVIDIA A100-SXM4-40GB": 38.12118896359996, "core_hours": 38.12118896359996} {"step": 95650, "global_schedule": 0.0658702552318573, "l2_grads": 2.5286974906921387, "l2_params": 242.32965087890625, "l2_updates": 0.07038750499486923, "train/loss": 1.6381587982177734, "uptime": 17588.106804663003, "examples_seen": 97945600.0, "progress": 0.8494445085832527, "epoch": 76.45029882911439, "img/sec/core": 688.7686557533443, "core_hours_NVIDIA A100-SXM4-40GB": 38.14183772875997, "core_hours": 38.14183772875997} {"step": 95700, "global_schedule": 0.0654909610748291, "l2_grads": 2.581576108932495, "l2_params": 242.2945556640625, "l2_updates": 0.0701119527220726, "train/loss": 1.5628153085708618, "uptime": 17596.675046729004, "examples_seen": 97996800.0, "progress": 0.8498885464863281, "epoch": 76.49026239358335, "img/sec/core": 746.9443499262304, "core_hours_NVIDIA A100-SXM4-40GB": 38.16087826668442, "core_hours": 38.16087826668442} {"step": 95750, "global_schedule": 0.06511276960372925, "l2_grads": 2.897129774093628, "l2_params": 242.2601318359375, "l2_updates": 0.06892070919275284, "train/loss": 1.5026230812072754, "uptime": 17605.242252596, "examples_seen": 98048000.0, "progress": 0.8503325843894035, "epoch": 76.53022595805231, "img/sec/core": 747.0346924489122, "core_hours_NVIDIA A100-SXM4-40GB": 38.17991650194441, "core_hours": 38.17991650194441} {"step": 95800, "global_schedule": 0.06473556160926819, "l2_grads": 2.437344789505005, "l2_params": 242.22479248046875, "l2_updates": 0.06892517954111099, "train/loss": 2.2939445972442627, "uptime": 17613.971055094, "examples_seen": 98099200.0, "progress": 0.8507766222924789, "epoch": 76.57018952252126, "img/sec/core": 733.2048126264597, "core_hours_NVIDIA A100-SXM4-40GB": 38.19931384082886, "core_hours": 38.19931384082886} {"step": 95850, "global_schedule": 0.06435936689376831, "l2_grads": 2.4478859901428223, "l2_params": 242.19168090820312, "l2_updates": 0.06832708418369293, "train/loss": 1.6351908445358276, "uptime": 17622.594636932, "examples_seen": 98150400.0, "progress": 0.8512206601955543, "epoch": 76.61015308699022, "img/sec/core": 742.1510133759315, "core_hours_NVIDIA A100-SXM4-40GB": 38.21847735602441, "core_hours": 38.21847735602441} {"step": 95900, "global_schedule": 0.06398415565490723, "l2_grads": 2.4504780769348145, "l2_params": 242.15887451171875, "l2_updates": 0.0692165270447731, "train/loss": 1.6644502878189087, "uptime": 17631.269885324, "examples_seen": 98201600.0, "progress": 0.8516646980986297, "epoch": 76.65011665145917, "img/sec/core": 737.7310378685949, "core_hours_NVIDIA A100-SXM4-40GB": 38.23775568578442, "core_hours": 38.23775568578442} {"step": 95950, "global_schedule": 0.06361004710197449, "l2_grads": 2.7211978435516357, "l2_params": 242.12423706054688, "l2_updates": 0.06786271929740906, "train/loss": 1.5946838855743408, "uptime": 17639.969320372, "examples_seen": 98252800.0, "progress": 0.8521087360017051, "epoch": 76.69008021592813, "img/sec/core": 735.6799567660133, "core_hours_NVIDIA A100-SXM4-40GB": 38.257087763668856, "core_hours": 38.257087763668856} {"step": 96000, "global_schedule": 0.06323686242103577, "l2_grads": 2.691667079925537, "l2_params": 242.09239196777344, "l2_updates": 0.06708884984254837, "train/loss": 3.9037892818450928, "uptime": 17649.414286298, "examples_seen": 98304000.0, "progress": 0.8525527739047805, "epoch": 76.7300437803971, "img/sec/core": 677.6096441367604, "core_hours_NVIDIA A100-SXM4-40GB": 38.27807657683774, "core_hours": 38.27807657683774} {"step": 96050, "global_schedule": 0.06286484003067017, "l2_grads": 2.643176555633545, "l2_params": 242.05978393554688, "l2_updates": 0.06719701737165451, "train/loss": 1.6556222438812256, "uptime": 17659.502398267003, "examples_seen": 98355200.0, "progress": 0.8529968118078559, "epoch": 76.77000734486604, "img/sec/core": 698.8829977343214, "core_hours_NVIDIA A100-SXM4-40GB": 38.29842650989997, "core_hours": 38.29842650989997} {"step": 96100, "global_schedule": 0.062493711709976196, "l2_grads": 2.438234806060791, "l2_params": 242.0244903564453, "l2_updates": 0.06759316474199295, "train/loss": 1.6396300792694092, "uptime": 17668.147009077, "examples_seen": 98406400.0, "progress": 0.8534408497109314, "epoch": 76.80997090933501, "img/sec/core": 740.3456489443444, "core_hours_NVIDIA A100-SXM4-40GB": 38.31763675614442, "core_hours": 38.31763675614442} {"step": 96150, "global_schedule": 0.06212368607521057, "l2_grads": 2.6864771842956543, "l2_params": 241.990966796875, "l2_updates": 0.06715275347232819, "train/loss": 1.6014271974563599, "uptime": 17677.034868101, "examples_seen": 98457600.0, "progress": 0.8538848876140067, "epoch": 76.84993447380396, "img/sec/core": 720.0834287218767, "core_hours_NVIDIA A100-SXM4-40GB": 38.337387553975525, "core_hours": 38.337387553975525} {"step": 96200, "global_schedule": 0.06175467371940613, "l2_grads": 2.8994274139404297, "l2_params": 241.95794677734375, "l2_updates": 0.06523100286722183, "train/loss": 1.551838755607605, "uptime": 17685.706817435, "examples_seen": 98508800.0, "progress": 0.8543289255170822, "epoch": 76.88989803827292, "img/sec/core": 738.0116918935978, "core_hours_NVIDIA A100-SXM4-40GB": 38.356658552495524, "core_hours": 38.356658552495524} {"step": 96250, "global_schedule": 0.06138661503791809, "l2_grads": 2.398988723754883, "l2_params": 241.92596435546875, "l2_updates": 0.06640509516000748, "train/loss": 1.9542385339736938, "uptime": 17695.215813359, "examples_seen": 98560000.0, "progress": 0.8547729634201575, "epoch": 76.92986160274188, "img/sec/core": 673.0468759427308, "core_hours_NVIDIA A100-SXM4-40GB": 38.37778965454886, "core_hours": 38.37778965454886} {"step": 96300, "global_schedule": 0.061019718647003174, "l2_grads": 2.6883344650268555, "l2_params": 241.8933563232422, "l2_updates": 0.06538187712430954, "train/loss": 1.638024091720581, "uptime": 17704.050978582003, "examples_seen": 98611200.0, "progress": 0.855217001323233, "epoch": 76.96982516721083, "img/sec/core": 724.3780776547795, "core_hours_NVIDIA A100-SXM4-40GB": 38.39742335504442, "core_hours": 38.39742335504442} {"step": 96350, "global_schedule": 0.060653746128082275, "l2_grads": 2.658850908279419, "l2_params": 241.86196899414062, "l2_updates": 0.06410183757543564, "train/loss": 3.6488516330718994, "uptime": 17713.5931844, "examples_seen": 98662400.0, "progress": 0.8556610392263083, "epoch": 77.00978873167979, "img/sec/core": 670.7044599613463, "core_hours_NVIDIA A100-SXM4-40GB": 38.41862825686219, "core_hours": 38.41862825686219} {"step": 96400, "global_schedule": 0.060288846492767334, "l2_grads": 2.6356308460235596, "l2_params": 241.8304901123047, "l2_updates": 0.06396882236003876, "train/loss": 1.5517255067825317, "uptime": 17722.148363287997, "examples_seen": 98713600.0, "progress": 0.8561050771293838, "epoch": 77.04975229614874, "img/sec/core": 748.0848832952925, "core_hours_NVIDIA A100-SXM4-40GB": 38.43763976550219, "core_hours": 38.43763976550219} {"step": 96450, "global_schedule": 0.0599249005317688, "l2_grads": 2.437120199203491, "l2_params": 241.79983520507812, "l2_updates": 0.06333060562610626, "train/loss": 2.144663095474243, "uptime": 17730.837996975002, "examples_seen": 98764800.0, "progress": 0.8565491150324591, "epoch": 77.0897158606177, "img/sec/core": 736.5097575486577, "core_hours_NVIDIA A100-SXM4-40GB": 38.45695006258441, "core_hours": 38.45695006258441} {"step": 96500, "global_schedule": 0.059562087059020996, "l2_grads": 2.601541519165039, "l2_params": 241.76748657226562, "l2_updates": 0.0627938061952591, "train/loss": 1.678092360496521, "uptime": 17739.433906131002, "examples_seen": 98816000.0, "progress": 0.8569931529355346, "epoch": 77.12967942508666, "img/sec/core": 744.5402090519864, "core_hours_NVIDIA A100-SXM4-40GB": 38.47605208293108, "core_hours": 38.47605208293108} {"step": 96550, "global_schedule": 0.05920025706291199, "l2_grads": 2.562910556793213, "l2_params": 241.73626708984375, "l2_updates": 0.0633862167596817, "train/loss": 1.5032707452774048, "uptime": 17748.151182524998, "examples_seen": 98867200.0, "progress": 0.85743719083861, "epoch": 77.16964298955561, "img/sec/core": 734.1742662198029, "core_hours_NVIDIA A100-SXM4-40GB": 38.495423808251076, "core_hours": 38.495423808251076} {"step": 96600, "global_schedule": 0.058839499950408936, "l2_grads": 2.6129748821258545, "l2_params": 241.70269775390625, "l2_updates": 0.06358885765075684, "train/loss": 1.5950214862823486, "uptime": 17756.679421749002, "examples_seen": 98918400.0, "progress": 0.8578812287416854, "epoch": 77.20960655402457, "img/sec/core": 750.4479918889726, "core_hours_NVIDIA A100-SXM4-40GB": 38.51437545097108, "core_hours": 38.51437545097108} {"step": 96650, "global_schedule": 0.05847969651222229, "l2_grads": 2.634598970413208, "l2_params": 241.67127990722656, "l2_updates": 0.06313160061836243, "train/loss": 1.46794593334198, "uptime": 17766.374729299998, "examples_seen": 98969600.0, "progress": 0.8583252666447608, "epoch": 77.24957011849352, "img/sec/core": 660.1131492048913, "core_hours_NVIDIA A100-SXM4-40GB": 38.53592057886219, "core_hours": 38.53592057886219} {"step": 96700, "global_schedule": 0.05812099575996399, "l2_grads": 2.3431220054626465, "l2_params": 241.64053344726562, "l2_updates": 0.06218836084008217, "train/loss": 2.866224765777588, "uptime": 17776.057085599998, "examples_seen": 99020800.0, "progress": 0.8587693045478362, "epoch": 77.28953368296249, "img/sec/core": 660.9961254989269, "core_hours_NVIDIA A100-SXM4-40GB": 38.55743692619553, "core_hours": 38.55743692619553} {"step": 96750, "global_schedule": 0.05776333808898926, "l2_grads": 2.6969447135925293, "l2_params": 241.61024475097656, "l2_updates": 0.06159026175737381, "train/loss": 3.8190319538116455, "uptime": 17784.910509941998, "examples_seen": 99072000.0, "progress": 0.8592133424509116, "epoch": 77.32949724743145, "img/sec/core": 722.8841353100992, "core_hours_NVIDIA A100-SXM4-40GB": 38.57711120251108, "core_hours": 38.57711120251108} {"step": 96800, "global_schedule": 0.05740669369697571, "l2_grads": 2.456671953201294, "l2_params": 241.57864379882812, "l2_updates": 0.06092674657702446, "train/loss": 1.8547219038009644, "uptime": 17794.464525331, "examples_seen": 99123200.0, "progress": 0.859657380353987, "epoch": 77.3694608119004, "img/sec/core": 669.8754125274739, "core_hours_NVIDIA A100-SXM4-40GB": 38.598342347819965, "core_hours": 38.598342347819965} {"step": 96850, "global_schedule": 0.057051122188568115, "l2_grads": 2.766810655593872, "l2_params": 241.5472412109375, "l2_updates": 0.06082301214337349, "train/loss": 1.5254316329956055, "uptime": 17804.225462752, "examples_seen": 99174400.0, "progress": 0.8601014182570624, "epoch": 77.40942437636936, "img/sec/core": 655.6747291741121, "core_hours_NVIDIA A100-SXM4-40GB": 38.62003331986663, "core_hours": 38.62003331986663} {"step": 96900, "global_schedule": 0.05669650435447693, "l2_grads": 2.5788798332214355, "l2_params": 241.5164794921875, "l2_updates": 0.0608384869992733, "train/loss": 3.366405963897705, "uptime": 17814.015214382, "examples_seen": 99225600.0, "progress": 0.8605454561601378, "epoch": 77.44938794083832, "img/sec/core": 653.7448795317424, "core_hours_NVIDIA A100-SXM4-40GB": 38.64178832348885, "core_hours": 38.64178832348885} {"step": 96950, "global_schedule": 0.05634298920631409, "l2_grads": 2.4750771522521973, "l2_params": 241.48626708984375, "l2_updates": 0.059882909059524536, "train/loss": 2.521078586578369, "uptime": 17823.784123038, "examples_seen": 99276800.0, "progress": 0.8609894940632132, "epoch": 77.48935150530727, "img/sec/core": 655.1397116470878, "core_hours_NVIDIA A100-SXM4-40GB": 38.66349700939109, "core_hours": 38.66349700939109} {"step": 97000, "global_schedule": 0.055990517139434814, "l2_grads": 2.4393084049224854, "l2_params": 241.45509338378906, "l2_updates": 0.06036077067255974, "train/loss": 1.6373300552368164, "uptime": 17833.027017661, "examples_seen": 99328000.0, "progress": 0.8614335319662887, "epoch": 77.52931506977623, "img/sec/core": 692.4237764298142, "core_hours_NVIDIA A100-SXM4-40GB": 38.68403677521997, "core_hours": 38.68403677521997} {"step": 97050, "global_schedule": 0.05563908815383911, "l2_grads": 2.342071056365967, "l2_params": 241.42562866210938, "l2_updates": 0.059144336730241776, "train/loss": 2.434966802597046, "uptime": 17843.072772866, "examples_seen": 99379200.0, "progress": 0.861877569869364, "epoch": 77.56927863424518, "img/sec/core": 705.8653774238162, "core_hours_NVIDIA A100-SXM4-40GB": 38.704185407915524, "core_hours": 38.704185407915524} {"step": 97100, "global_schedule": 0.0552886426448822, "l2_grads": 2.6647465229034424, "l2_params": 241.3942413330078, "l2_updates": 0.05950785055756569, "train/loss": 1.5101728439331055, "uptime": 17852.387849059, "examples_seen": 99430400.0, "progress": 0.8623216077724395, "epoch": 77.60924219871414, "img/sec/core": 687.0582556059732, "core_hours_NVIDIA A100-SXM4-40GB": 38.72488557723331, "core_hours": 38.72488557723331} {"step": 97150, "global_schedule": 0.05493927001953125, "l2_grads": 2.6611344814300537, "l2_params": 241.3641357421875, "l2_updates": 0.05892932415008545, "train/loss": 1.4821215867996216, "uptime": 17861.472406292, "examples_seen": 99481600.0, "progress": 0.8627656456755148, "epoch": 77.6492057631831, "img/sec/core": 704.492231800995, "core_hours_NVIDIA A100-SXM4-40GB": 38.74507348219553, "core_hours": 38.74507348219553} {"step": 97200, "global_schedule": 0.05459091067314148, "l2_grads": 2.5331015586853027, "l2_params": 241.3352508544922, "l2_updates": 0.057879600673913956, "train/loss": 3.3928489685058594, "uptime": 17870.699088727997, "examples_seen": 99532800.0, "progress": 0.8632096835785903, "epoch": 77.68916932765205, "img/sec/core": 693.6404329936162, "core_hours_NVIDIA A100-SXM4-40GB": 38.76557722094219, "core_hours": 38.76557722094219} {"step": 97250, "global_schedule": 0.05424371361732483, "l2_grads": 2.466689348220825, "l2_params": 241.3045654296875, "l2_updates": 0.056877996772527695, "train/loss": 2.2894797325134277, "uptime": 17880.354217143, "examples_seen": 99584000.0, "progress": 0.8636537214816656, "epoch": 77.72913289212102, "img/sec/core": 662.86016352268, "core_hours_NVIDIA A100-SXM4-40GB": 38.78703306186442, "core_hours": 38.78703306186442} {"step": 97300, "global_schedule": 0.0538974404335022, "l2_grads": 2.7474524974823, "l2_params": 241.2753143310547, "l2_updates": 0.05761916935443878, "train/loss": 3.748631477355957, "uptime": 17890.066436220004, "examples_seen": 99635200.0, "progress": 0.8640977593847411, "epoch": 77.76909645658996, "img/sec/core": 658.9637187195048, "core_hours_NVIDIA A100-SXM4-40GB": 38.80861577092442, "core_hours": 38.80861577092442} {"step": 97350, "global_schedule": 0.05355226993560791, "l2_grads": 2.814411163330078, "l2_params": 241.24786376953125, "l2_updates": 0.056289203464984894, "train/loss": 3.550191640853882, "uptime": 17899.510216617004, "examples_seen": 99686400.0, "progress": 0.8645417972878164, "epoch": 77.80906002105893, "img/sec/core": 677.6947081524072, "core_hours_NVIDIA A100-SXM4-40GB": 38.82960194958442, "core_hours": 38.82960194958442} {"step": 97400, "global_schedule": 0.05320814251899719, "l2_grads": 2.670572280883789, "l2_params": 241.21743774414062, "l2_updates": 0.0570099763572216, "train/loss": 1.586724042892456, "uptime": 17908.211941677997, "examples_seen": 99737600.0, "progress": 0.8649858351908919, "epoch": 77.84902358552789, "img/sec/core": 735.486349561444, "core_hours_NVIDIA A100-SXM4-40GB": 38.84893911638663, "core_hours": 38.84893911638663} {"step": 97450, "global_schedule": 0.05286499857902527, "l2_grads": 2.7438595294952393, "l2_params": 241.18582153320312, "l2_updates": 0.05680100992321968, "train/loss": 1.6459060907363892, "uptime": 17917.032331827002, "examples_seen": 99788800.0, "progress": 0.8654298730939674, "epoch": 77.88898714999684, "img/sec/core": 725.5914865312989, "core_hours_NVIDIA A100-SXM4-40GB": 38.868539983384416, "core_hours": 38.868539983384416} {"step": 97500, "global_schedule": 0.05252295732498169, "l2_grads": 2.586667060852051, "l2_params": 241.1593017578125, "l2_updates": 0.05580757185816765, "train/loss": 2.1555049419403076, "uptime": 17926.00695016, "examples_seen": 99840000.0, "progress": 0.8658739109970427, "epoch": 77.9289507144658, "img/sec/core": 713.1222479364632, "core_hours_NVIDIA A100-SXM4-40GB": 38.88848357967996, "core_hours": 38.88848357967996, "val/acc@1": 0.7601, "val/loss": 0.9612634558105468, "z/secs/eval/val": 2.5755859310011147} {"step": 97550, "global_schedule": 0.05218198895454407, "l2_grads": 2.35697340965271, "l2_params": 241.12960815429688, "l2_updates": 0.05613929405808449, "train/loss": 1.9805306196212769, "uptime": 17937.462093905, "examples_seen": 99891200.0, "progress": 0.8663179489001182, "epoch": 77.96891427893475, "img/sec/core": 720.8357632669887, "core_hours_NVIDIA A100-SXM4-40GB": 38.90821376365109, "core_hours": 38.90821376365109} {"step": 97600, "global_schedule": 0.05184203386306763, "l2_grads": 2.8439178466796875, "l2_params": 241.10108947753906, "l2_updates": 0.054589200764894485, "train/loss": 1.589473843574524, "uptime": 17948.003694327002, "examples_seen": 99942400.0, "progress": 0.8667619868031935, "epoch": 78.00887784340371, "img/sec/core": 607.1184396862701, "core_hours_NVIDIA A100-SXM4-40GB": 38.93163954236664, "core_hours": 38.93163954236664} {"step": 97650, "global_schedule": 0.05150309205055237, "l2_grads": 2.726306438446045, "l2_params": 241.07199096679688, "l2_updates": 0.0549454465508461, "train/loss": 1.5415387153625488, "uptime": 17957.430049605, "examples_seen": 99993600.0, "progress": 0.867206024706269, "epoch": 78.04884140787267, "img/sec/core": 678.9474628584451, "core_hours_NVIDIA A100-SXM4-40GB": 38.95258699853998, "core_hours": 38.95258699853998} {"step": 97700, "global_schedule": 0.05116528272628784, "l2_grads": 2.780036687850952, "l2_params": 241.04331970214844, "l2_updates": 0.054595351219177246, "train/loss": 3.652442455291748, "uptime": 17967.122571767002, "examples_seen": 100044800.0, "progress": 0.8676500626093443, "epoch": 78.08880497234162, "img/sec/core": 660.3028492512767, "core_hours_NVIDIA A100-SXM4-40GB": 38.97412593667775, "core_hours": 38.97412593667775} {"step": 97750, "global_schedule": 0.0508284866809845, "l2_grads": 2.812196969985962, "l2_params": 241.01649475097656, "l2_updates": 0.054080139845609665, "train/loss": 1.4756474494934082, "uptime": 17976.883924447, "examples_seen": 100096000.0, "progress": 0.8680941005124198, "epoch": 78.12876853681058, "img/sec/core": 655.6468360283708, "core_hours_NVIDIA A100-SXM4-40GB": 38.9958178315222, "core_hours": 38.9958178315222} {"step": 97800, "global_schedule": 0.05049276351928711, "l2_grads": 2.5681686401367188, "l2_params": 240.9879608154297, "l2_updates": 0.05486539378762245, "train/loss": 1.5371508598327637, "uptime": 17986.599854345004, "examples_seen": 100147200.0, "progress": 0.8685381384154951, "epoch": 78.16873210127953, "img/sec/core": 658.7120396285605, "core_hours_NVIDIA A100-SXM4-40GB": 39.01740878685109, "core_hours": 39.01740878685109} {"step": 97850, "global_schedule": 0.050158023834228516, "l2_grads": 2.6655313968658447, "l2_params": 240.9608154296875, "l2_updates": 0.05383044481277466, "train/loss": 1.5917943716049194, "uptime": 17996.438082589004, "examples_seen": 100198400.0, "progress": 0.8689821763185706, "epoch": 78.2086956657485, "img/sec/core": 650.5236350765997, "core_hours_NVIDIA A100-SXM4-40GB": 39.0392715162822, "core_hours": 39.0392715162822} {"step": 97900, "global_schedule": 0.049824416637420654, "l2_grads": 2.437783718109131, "l2_params": 240.93310546875, "l2_updates": 0.05384925752878189, "train/loss": 2.0021448135375977, "uptime": 18005.803997773, "examples_seen": 100249600.0, "progress": 0.869426214221646, "epoch": 78.24865923021746, "img/sec/core": 683.3288444607243, "core_hours_NVIDIA A100-SXM4-40GB": 39.060084661135534, "core_hours": 39.060084661135534} {"step": 97950, "global_schedule": 0.04949185252189636, "l2_grads": 2.6021811962127686, "l2_params": 240.90289306640625, "l2_updates": 0.052652422338724136, "train/loss": 1.5206373929977417, "uptime": 18014.5255806, "examples_seen": 100300800.0, "progress": 0.8698702521247214, "epoch": 78.2886227946864, "img/sec/core": 733.8117549246225, "core_hours_NVIDIA A100-SXM4-40GB": 39.07946595630664, "core_hours": 39.07946595630664} {"step": 98000, "global_schedule": 0.04916033148765564, "l2_grads": 2.8581995964050293, "l2_params": 240.87486267089844, "l2_updates": 0.05319984257221222, "train/loss": 3.805586814880371, "uptime": 18023.708417392, "examples_seen": 100352000.0, "progress": 0.8703142900277968, "epoch": 78.32858635915537, "img/sec/core": 696.9523846461498, "core_hours_NVIDIA A100-SXM4-40GB": 39.09987226028886, "core_hours": 39.09987226028886} {"step": 98050, "global_schedule": 0.0488298237323761, "l2_grads": 2.608948230743408, "l2_params": 240.84881591796875, "l2_updates": 0.05262526124715805, "train/loss": 1.6421830654144287, "uptime": 18033.680937462, "examples_seen": 100403200.0, "progress": 0.8707583279308722, "epoch": 78.36854992362431, "img/sec/core": 687.7220852331131, "core_hours_NVIDIA A100-SXM4-40GB": 39.12055244859109, "core_hours": 39.12055244859109} {"step": 98100, "global_schedule": 0.04850044846534729, "l2_grads": 2.71097993850708, "l2_params": 240.822509765625, "l2_updates": 0.051255203783512115, "train/loss": 2.1023309230804443, "uptime": 18042.515524930997, "examples_seen": 100454400.0, "progress": 0.8712023658339476, "epoch": 78.40851348809328, "img/sec/core": 724.4254496837879, "core_hours_NVIDIA A100-SXM4-40GB": 39.140184865188864, "core_hours": 39.140184865188864} {"step": 98150, "global_schedule": 0.04817208647727966, "l2_grads": 2.441984176635742, "l2_params": 240.79368591308594, "l2_updates": 0.05144277960062027, "train/loss": 2.2446112632751465, "uptime": 18052.095494007997, "examples_seen": 100505600.0, "progress": 0.871646403737023, "epoch": 78.44847705256224, "img/sec/core": 668.0606115280061, "core_hours_NVIDIA A100-SXM4-40GB": 39.16147368535998, "core_hours": 39.16147368535998} {"step": 98200, "global_schedule": 0.04784482717514038, "l2_grads": 2.5643081665039062, "l2_params": 240.76730346679688, "l2_updates": 0.051396455615758896, "train/loss": 2.476989269256592, "uptime": 18061.455088798997, "examples_seen": 100556800.0, "progress": 0.8720904416400984, "epoch": 78.48844061703119, "img/sec/core": 683.7902861087773, "core_hours_NVIDIA A100-SXM4-40GB": 39.18227278489553, "core_hours": 39.18227278489553} {"step": 98250, "global_schedule": 0.04751861095428467, "l2_grads": 2.6956052780151367, "l2_params": 240.7404022216797, "l2_updates": 0.050471555441617966, "train/loss": 1.5178664922714233, "uptime": 18070.217470309, "examples_seen": 100608000.0, "progress": 0.8725344795431738, "epoch": 78.52840418150015, "img/sec/core": 730.3950407426341, "core_hours_NVIDIA A100-SXM4-40GB": 39.20174474380665, "core_hours": 39.20174474380665} {"step": 98300, "global_schedule": 0.04719340801239014, "l2_grads": 2.475451707839966, "l2_params": 240.71505737304688, "l2_updates": 0.05048608034849167, "train/loss": 3.0315470695495605, "uptime": 18079.355508615998, "examples_seen": 100659200.0, "progress": 0.8729785174462492, "epoch": 78.5683677459691, "img/sec/core": 700.3691366776238, "core_hours_NVIDIA A100-SXM4-40GB": 39.22205149559998, "core_hours": 39.22205149559998} {"step": 98350, "global_schedule": 0.04686930775642395, "l2_grads": 2.67372989654541, "l2_params": 240.6896209716797, "l2_updates": 0.05010545626282692, "train/loss": 1.513332724571228, "uptime": 18088.762423416003, "examples_seen": 100710400.0, "progress": 0.8734225553493247, "epoch": 78.60833131043806, "img/sec/core": 680.3505863579047, "core_hours_NVIDIA A100-SXM4-40GB": 39.24295575071109, "core_hours": 39.24295575071109} {"step": 98400, "global_schedule": 0.046546220779418945, "l2_grads": 2.6555798053741455, "l2_params": 240.6630401611328, "l2_updates": 0.04943646490573883, "train/loss": 1.4951834678649902, "uptime": 18097.397120449998, "examples_seen": 100761600.0, "progress": 0.8738665932524, "epoch": 78.64829487490702, "img/sec/core": 741.1956638201265, "core_hours_NVIDIA A100-SXM4-40GB": 39.2621439663422, "core_hours": 39.2621439663422} {"step": 98450, "global_schedule": 0.04622429609298706, "l2_grads": 2.661497116088867, "l2_params": 240.6356201171875, "l2_updates": 0.04954101890325546, "train/loss": 1.361689567565918, "uptime": 18106.363507139, "examples_seen": 100812800.0, "progress": 0.8743106311554755, "epoch": 78.68825843937597, "img/sec/core": 713.7769340074512, "core_hours_NVIDIA A100-SXM4-40GB": 39.28206927009553, "core_hours": 39.28206927009553} {"step": 98500, "global_schedule": 0.04590332508087158, "l2_grads": 2.526308536529541, "l2_params": 240.609375, "l2_updates": 0.049722786992788315, "train/loss": 1.3953479528427124, "uptime": 18115.130904576, "examples_seen": 100864000.0, "progress": 0.8747546690585508, "epoch": 78.72822200384493, "img/sec/core": 729.9771734985095, "core_hours_NVIDIA A100-SXM4-40GB": 39.301552375511086, "core_hours": 39.301552375511086} {"step": 98550, "global_schedule": 0.045583486557006836, "l2_grads": 2.6112825870513916, "l2_params": 240.58480834960938, "l2_updates": 0.04829374700784683, "train/loss": 2.1340670585632324, "uptime": 18123.777010173, "examples_seen": 100915200.0, "progress": 0.8751987069616263, "epoch": 78.76818556831388, "img/sec/core": 740.2176538557537, "core_hours_NVIDIA A100-SXM4-40GB": 39.32076594350442, "core_hours": 39.32076594350442} {"step": 98600, "global_schedule": 0.04526466131210327, "l2_grads": 2.5092153549194336, "l2_params": 240.5576934814453, "l2_updates": 0.04887520521879196, "train/loss": 3.2138493061065674, "uptime": 18132.519430025, "examples_seen": 100966400.0, "progress": 0.8756427448647016, "epoch": 78.80814913278284, "img/sec/core": 732.0627593210784, "core_hours_NVIDIA A100-SXM4-40GB": 39.340193543175545, "core_hours": 39.340193543175545} {"step": 98650, "global_schedule": 0.04494693875312805, "l2_grads": 2.747589111328125, "l2_params": 240.53134155273438, "l2_updates": 0.0481920950114727, "train/loss": 3.671018362045288, "uptime": 18141.527189595, "examples_seen": 101017600.0, "progress": 0.8760867827677771, "epoch": 78.8481126972518, "img/sec/core": 710.498537429435, "core_hours_NVIDIA A100-SXM4-40GB": 39.360210786664425, "core_hours": 39.360210786664425} {"step": 98700, "global_schedule": 0.04463028907775879, "l2_grads": 2.5010664463043213, "l2_params": 240.50592041015625, "l2_updates": 0.04781176522374153, "train/loss": 1.673018455505371, "uptime": 18151.395633687003, "examples_seen": 101068800.0, "progress": 0.8765308206708524, "epoch": 78.88807626172076, "img/sec/core": 648.5318192345927, "core_hours_NVIDIA A100-SXM4-40GB": 39.382140662424426, "core_hours": 39.382140662424426} {"step": 98750, "global_schedule": 0.04431471228599548, "l2_grads": 2.5939409732818604, "l2_params": 240.47946166992188, "l2_updates": 0.04727524518966675, "train/loss": 1.4131799936294556, "uptime": 18160.581575941003, "examples_seen": 101120000.0, "progress": 0.8769748585739279, "epoch": 78.92803982618972, "img/sec/core": 696.7167681914237, "core_hours_NVIDIA A100-SXM4-40GB": 39.40255386743331, "core_hours": 39.40255386743331} {"step": 98800, "global_schedule": 0.044000208377838135, "l2_grads": 2.519551992416382, "l2_params": 240.45481872558594, "l2_updates": 0.0468902587890625, "train/loss": 1.3866997957229614, "uptime": 18170.261313643998, "examples_seen": 101171200.0, "progress": 0.8774188964770033, "epoch": 78.96800339065867, "img/sec/core": 661.174940517017, "core_hours_NVIDIA A100-SXM4-40GB": 39.4240643956622, "core_hours": 39.4240643956622} {"step": 98850, "global_schedule": 0.04368671774864197, "l2_grads": 2.4299817085266113, "l2_params": 240.4313201904297, "l2_updates": 0.04677363112568855, "train/loss": 2.8185179233551025, "uptime": 18180.658481963997, "examples_seen": 101222400.0, "progress": 0.8778629343800787, "epoch": 79.00796695512763, "img/sec/core": 615.5522160480081, "core_hours_NVIDIA A100-SXM4-40GB": 39.44716921415109, "core_hours": 39.44716921415109} {"step": 98900, "global_schedule": 0.043374329805374146, "l2_grads": 2.5104167461395264, "l2_params": 240.4059600830078, "l2_updates": 0.04576478525996208, "train/loss": 2.636510133743286, "uptime": 18190.406397216997, "examples_seen": 101273600.0, "progress": 0.8783069722831541, "epoch": 79.04793051959659, "img/sec/core": 656.5506402028541, "core_hours_NVIDIA A100-SXM4-40GB": 39.46883124804664, "core_hours": 39.46883124804664} {"step": 98950, "global_schedule": 0.04306304454803467, "l2_grads": 2.336505174636841, "l2_params": 240.38253784179688, "l2_updates": 0.04607232287526131, "train/loss": 2.3940749168395996, "uptime": 18200.184770879, "examples_seen": 101324800.0, "progress": 0.8787510101862295, "epoch": 79.08789408406554, "img/sec/core": 654.5055672060238, "core_hours_NVIDIA A100-SXM4-40GB": 39.490560967295536, "core_hours": 39.490560967295536} {"step": 99000, "global_schedule": 0.04275280237197876, "l2_grads": 2.539904832839966, "l2_params": 240.35812377929688, "l2_updates": 0.04541279003024101, "train/loss": 2.3072547912597656, "uptime": 18210.086892731997, "examples_seen": 101376000.0, "progress": 0.8791950480893049, "epoch": 79.1278576485345, "img/sec/core": 646.3261203012985, "core_hours_NVIDIA A100-SXM4-40GB": 39.51256568252442, "core_hours": 39.51256568252442} {"step": 99050, "global_schedule": 0.04244360327720642, "l2_grads": 2.7604849338531494, "l2_params": 240.33404541015625, "l2_updates": 0.04552498459815979, "train/loss": 1.5629816055297852, "uptime": 18219.654141829, "examples_seen": 101427200.0, "progress": 0.8796390859923803, "epoch": 79.16782121300346, "img/sec/core": 719.7424800541864, "core_hours_NVIDIA A100-SXM4-40GB": 39.53232583649109, "core_hours": 39.53232583649109} {"step": 99100, "global_schedule": 0.04213550686836243, "l2_grads": 2.9240317344665527, "l2_params": 240.30955505371094, "l2_updates": 0.04489101842045784, "train/loss": 1.6073063611984253, "uptime": 18229.421958086998, "examples_seen": 101478400.0, "progress": 0.8800831238954557, "epoch": 79.20778477747241, "img/sec/core": 655.2129801540606, "core_hours_NVIDIA A100-SXM4-40GB": 39.5540320948422, "core_hours": 39.5540320948422} {"step": 99150, "global_schedule": 0.04182848334312439, "l2_grads": 2.618421792984009, "l2_params": 240.28500366210938, "l2_updates": 0.045424122363328934, "train/loss": 1.5140060186386108, "uptime": 18238.636370399, "examples_seen": 101529600.0, "progress": 0.8805271617985311, "epoch": 79.24774834194137, "img/sec/core": 694.5641005953445, "core_hours_NVIDIA A100-SXM4-40GB": 39.57450856664664, "core_hours": 39.57450856664664} {"step": 99200, "global_schedule": 0.04152253270149231, "l2_grads": 2.496368885040283, "l2_params": 240.26136779785156, "l2_updates": 0.04406999424099922, "train/loss": 2.1598026752471924, "uptime": 18248.069518748, "examples_seen": 101580800.0, "progress": 0.8809711997016065, "epoch": 79.28771190641032, "img/sec/core": 678.4585340141895, "core_hours_NVIDIA A100-SXM4-40GB": 39.595471118533304, "core_hours": 39.595471118533304} {"step": 99250, "global_schedule": 0.0412176251411438, "l2_grads": 2.4829630851745605, "l2_params": 240.23861694335938, "l2_updates": 0.043631091713905334, "train/loss": 1.5236718654632568, "uptime": 18257.237112851, "examples_seen": 101632000.0, "progress": 0.881415237604682, "epoch": 79.32767547087929, "img/sec/core": 698.1111868712808, "core_hours_NVIDIA A100-SXM4-40GB": 39.615843549873304, "core_hours": 39.615843549873304} {"step": 99300, "global_schedule": 0.04091385006904602, "l2_grads": 2.6067540645599365, "l2_params": 240.21588134765625, "l2_updates": 0.043117087334394455, "train/loss": 3.2691826820373535, "uptime": 18266.62004653, "examples_seen": 101683200.0, "progress": 0.8818592755077573, "epoch": 79.36763903534825, "img/sec/core": 682.0894422736457, "core_hours_NVIDIA A100-SXM4-40GB": 39.63669451360442, "core_hours": 39.63669451360442} {"step": 99350, "global_schedule": 0.04061111807823181, "l2_grads": 2.754967451095581, "l2_params": 240.1925811767578, "l2_updates": 0.04411632567644119, "train/loss": 1.5725040435791016, "uptime": 18276.333495462997, "examples_seen": 101734400.0, "progress": 0.8823033134108328, "epoch": 79.4076025998172, "img/sec/core": 658.8802848654587, "core_hours_NVIDIA A100-SXM4-40GB": 39.65827995567775, "core_hours": 39.65827995567775} {"step": 99400, "global_schedule": 0.04030948877334595, "l2_grads": 2.5917372703552246, "l2_params": 240.1681365966797, "l2_updates": 0.04332658275961876, "train/loss": 2.1099205017089844, "uptime": 18286.242295351003, "examples_seen": 101785600.0, "progress": 0.8827473513139081, "epoch": 79.44756616428616, "img/sec/core": 645.8905288570045, "core_hours_NVIDIA A100-SXM4-40GB": 39.680299510984426, "core_hours": 39.680299510984426} {"step": 99450, "global_schedule": 0.04000893235206604, "l2_grads": 2.7101571559906006, "l2_params": 240.14366149902344, "l2_updates": 0.043381623923778534, "train/loss": 1.5414751768112183, "uptime": 18295.941326844004, "examples_seen": 101836800.0, "progress": 0.8831913892169836, "epoch": 79.4875297287551, "img/sec/core": 659.8596988388467, "core_hours_NVIDIA A100-SXM4-40GB": 39.7018529143022, "core_hours": 39.7018529143022} {"step": 99500, "global_schedule": 0.039709389209747314, "l2_grads": 2.705247163772583, "l2_params": 240.12120056152344, "l2_updates": 0.04321299493312836, "train/loss": 1.4103676080703735, "uptime": 18305.261457075, "examples_seen": 101888000.0, "progress": 0.8836354271200589, "epoch": 79.52749329322407, "img/sec/core": 686.6856837165956, "core_hours_NVIDIA A100-SXM4-40GB": 39.72256431481553, "core_hours": 39.72256431481553} {"step": 99550, "global_schedule": 0.03941097855567932, "l2_grads": 2.8094563484191895, "l2_params": 240.0988006591797, "l2_updates": 0.04183567315340042, "train/loss": 3.7675063610076904, "uptime": 18314.941646096, "examples_seen": 101939200.0, "progress": 0.8840794650231344, "epoch": 79.56745685769303, "img/sec/core": 661.144114656792, "core_hours_NVIDIA A100-SXM4-40GB": 39.744075845973306, "core_hours": 39.744075845973306} {"step": 99600, "global_schedule": 0.0391136109828949, "l2_grads": 2.820314645767212, "l2_params": 240.07562255859375, "l2_updates": 0.04155822470784187, "train/loss": 3.3031256198883057, "uptime": 18324.361043830002, "examples_seen": 101990400.0, "progress": 0.8845235029262097, "epoch": 79.60742042216198, "img/sec/core": 679.448960616524, "core_hours_NVIDIA A100-SXM4-40GB": 39.765007840937756, "core_hours": 39.765007840937756} {"step": 99650, "global_schedule": 0.038817405700683594, "l2_grads": 2.680968761444092, "l2_params": 240.05186462402344, "l2_updates": 0.04114382714033127, "train/loss": 1.480997920036316, "uptime": 18333.687345206003, "examples_seen": 102041600.0, "progress": 0.8849675408292852, "epoch": 79.64738398663094, "img/sec/core": 686.2313088518799, "core_hours_NVIDIA A100-SXM4-40GB": 39.78573295510664, "core_hours": 39.78573295510664} {"step": 99700, "global_schedule": 0.03852221369743347, "l2_grads": 2.4554202556610107, "l2_params": 240.03199768066406, "l2_updates": 0.04132828488945961, "train/loss": 1.8795676231384277, "uptime": 18342.753324701, "examples_seen": 102092800.0, "progress": 0.8854115787323606, "epoch": 79.68734755109989, "img/sec/core": 705.9358565204369, "core_hours_NVIDIA A100-SXM4-40GB": 39.80587957620664, "core_hours": 39.80587957620664} {"step": 99750, "global_schedule": 0.038228124380111694, "l2_grads": 2.754056215286255, "l2_params": 240.0106658935547, "l2_updates": 0.04074656218290329, "train/loss": 3.690049171447754, "uptime": 18352.517859264997, "examples_seen": 102144000.0, "progress": 0.885855616635436, "epoch": 79.72731111556885, "img/sec/core": 655.4331860933933, "core_hours_NVIDIA A100-SXM4-40GB": 39.82757854190442, "core_hours": 39.82757854190442} {"step": 99800, "global_schedule": 0.037935078144073486, "l2_grads": 2.4734251499176025, "l2_params": 239.9891815185547, "l2_updates": 0.040816739201545715, "train/loss": 2.9077141284942627, "uptime": 18361.64844209, "examples_seen": 102195200.0, "progress": 0.8862996545385114, "epoch": 79.76727468003781, "img/sec/core": 700.9410157778815, "core_hours_NVIDIA A100-SXM4-40GB": 39.84786872595998, "core_hours": 39.84786872595998} {"step": 99850, "global_schedule": 0.03764316439628601, "l2_grads": 2.391275644302368, "l2_params": 239.96705627441406, "l2_updates": 0.03996444121003151, "train/loss": 2.5880794525146484, "uptime": 18370.876945048003, "examples_seen": 102246400.0, "progress": 0.8867436924415868, "epoch": 79.80723824450676, "img/sec/core": 693.503597401011, "core_hours_NVIDIA A100-SXM4-40GB": 39.86837651031109, "core_hours": 39.86837651031109} {"step": 99900, "global_schedule": 0.03735232353210449, "l2_grads": 2.7477359771728516, "l2_params": 239.94581604003906, "l2_updates": 0.039469074457883835, "train/loss": 3.6971890926361084, "uptime": 18380.611437436004, "examples_seen": 102297600.0, "progress": 0.8871877303446623, "epoch": 79.84720180897573, "img/sec/core": 657.4559560895902, "core_hours_NVIDIA A100-SXM4-40GB": 39.89000871561776, "core_hours": 39.89000871561776} {"step": 99950, "global_schedule": 0.03706258535385132, "l2_grads": 2.8075318336486816, "l2_params": 239.9235076904297, "l2_updates": 0.039383549243211746, "train/loss": 1.498148798942566, "uptime": 18390.532335195, "examples_seen": 102348800.0, "progress": 0.8876317682477376, "epoch": 79.88716537344467, "img/sec/core": 645.1029085744657, "core_hours_NVIDIA A100-SXM4-40GB": 39.91205515508219, "core_hours": 39.91205515508219} {"step": 100000, "global_schedule": 0.0367739200592041, "l2_grads": 2.7385239601135254, "l2_params": 239.90101623535156, "l2_updates": 0.03895201534032822, "train/loss": 3.6053524017333984, "uptime": 18399.622473933, "examples_seen": 102400000.0, "progress": 0.888075806150813, "epoch": 79.92712893791364, "img/sec/core": 704.0596611849022, "core_hours_NVIDIA A100-SXM4-40GB": 39.93225546338886, "core_hours": 39.93225546338886, "val/acc@1": 0.76224, "val/loss": 0.9499039221191407, "z/secs/eval/val": 2.6651548279987765} {"step": 100050, "global_schedule": 0.036486297845840454, "l2_grads": 2.716036319732666, "l2_params": 239.88172912597656, "l2_updates": 0.03885716572403908, "train/loss": 1.56413996219635, "uptime": 18411.358742491, "examples_seen": 102451200.0, "progress": 0.8885198440538884, "epoch": 79.9670925023826, "img/sec/core": 786.9302340900841, "core_hours_NVIDIA A100-SXM4-40GB": 39.9503285041822, "core_hours": 39.9503285041822} {"step": 100100, "global_schedule": 0.03619977831840515, "l2_grads": 2.6224169731140137, "l2_params": 239.85842895507812, "l2_updates": 0.03879905864596367, "train/loss": 1.5484232902526855, "uptime": 18421.393468882998, "examples_seen": 102502400.0, "progress": 0.8889638819569639, "epoch": 80.00705606685155, "img/sec/core": 637.7852021061433, "core_hours_NVIDIA A100-SXM4-40GB": 39.972627896164425, "core_hours": 39.972627896164425} {"step": 100150, "global_schedule": 0.03591439127922058, "l2_grads": 2.5807881355285645, "l2_params": 239.83872985839844, "l2_updates": 0.03794536739587784, "train/loss": 1.4533294439315796, "uptime": 18430.037553080998, "examples_seen": 102553600.0, "progress": 0.8894079198600392, "epoch": 80.04701963132051, "img/sec/core": 740.390752033701, "core_hours_NVIDIA A100-SXM4-40GB": 39.99183697215997, "core_hours": 39.99183697215997} {"step": 100200, "global_schedule": 0.03563007712364197, "l2_grads": 2.748852252960205, "l2_params": 239.8162384033203, "l2_updates": 0.03819146007299423, "train/loss": 3.6398048400878906, "uptime": 18438.950654325003, "examples_seen": 102604800.0, "progress": 0.8898519577631147, "epoch": 80.08698319578946, "img/sec/core": 718.0441268192073, "core_hours_NVIDIA A100-SXM4-40GB": 40.01164386381331, "core_hours": 40.01164386381331} {"step": 100250, "global_schedule": 0.035346806049346924, "l2_grads": 2.5977656841278076, "l2_params": 239.79574584960938, "l2_updates": 0.03832007944583893, "train/loss": 2.30264949798584, "uptime": 18447.886237788, "examples_seen": 102656000.0, "progress": 0.8902959956661901, "epoch": 80.12694676025842, "img/sec/core": 716.2375044114826, "core_hours_NVIDIA A100-SXM4-40GB": 40.03150071595332, "core_hours": 40.03150071595332} {"step": 100300, "global_schedule": 0.03506466746330261, "l2_grads": 2.746793270111084, "l2_params": 239.77406311035156, "l2_updates": 0.037536557763814926, "train/loss": 1.7946110963821411, "uptime": 18456.771607383, "examples_seen": 102707200.0, "progress": 0.8907400335692655, "epoch": 80.16691032472738, "img/sec/core": 720.285175712063, "core_hours_NVIDIA A100-SXM4-40GB": 40.05124598171997, "core_hours": 40.05124598171997} {"step": 100350, "global_schedule": 0.03478357195854187, "l2_grads": 2.478101968765259, "l2_params": 239.7530975341797, "l2_updates": 0.037079233676195145, "train/loss": 2.6516635417938232, "uptime": 18466.439768429, "examples_seen": 102758400.0, "progress": 0.8911840714723409, "epoch": 80.20687388919633, "img/sec/core": 661.9666314565427, "core_hours_NVIDIA A100-SXM4-40GB": 40.072730784044424, "core_hours": 40.072730784044424} {"step": 100400, "global_schedule": 0.03450363874435425, "l2_grads": 2.9169392585754395, "l2_params": 239.73304748535156, "l2_updates": 0.03666917234659195, "train/loss": 1.4263060092926025, "uptime": 18475.399356322, "examples_seen": 102809600.0, "progress": 0.8916281093754163, "epoch": 80.2468374536653, "img/sec/core": 714.3185687144497, "core_hours_NVIDIA A100-SXM4-40GB": 40.0926409793622, "core_hours": 40.0926409793622} {"step": 100450, "global_schedule": 0.03422471880912781, "l2_grads": 2.7996084690093994, "l2_params": 239.71400451660156, "l2_updates": 0.03665443882346153, "train/loss": 1.4276119470596313, "uptime": 18485.002184655, "examples_seen": 102860800.0, "progress": 0.8920721472784917, "epoch": 80.28680101813424, "img/sec/core": 666.4703125023997, "core_hours_NVIDIA A100-SXM4-40GB": 40.11398059787997, "core_hours": 40.11398059787997} {"step": 100500, "global_schedule": 0.03394696116447449, "l2_grads": 2.6933906078338623, "l2_params": 239.69500732421875, "l2_updates": 0.036022916436195374, "train/loss": 3.7089667320251465, "uptime": 18494.695148949002, "examples_seen": 102912000.0, "progress": 0.8925161851815671, "epoch": 80.3267645826032, "img/sec/core": 660.2727303927848, "core_hours_NVIDIA A100-SXM4-40GB": 40.13552051853331, "core_hours": 40.13552051853331} {"step": 100550, "global_schedule": 0.033670276403427124, "l2_grads": 2.730445146560669, "l2_params": 239.67445373535156, "l2_updates": 0.03613920509815216, "train/loss": 1.4431557655334473, "uptime": 18503.988362759002, "examples_seen": 102963200.0, "progress": 0.8929602230846425, "epoch": 80.36672814707217, "img/sec/core": 688.6745673615023, "core_hours_NVIDIA A100-SXM4-40GB": 40.15617210477775, "core_hours": 40.15617210477775} {"step": 100600, "global_schedule": 0.03339466452598572, "l2_grads": 2.6087234020233154, "l2_params": 239.6552276611328, "l2_updates": 0.03563600033521652, "train/loss": 2.917605400085449, "uptime": 18512.704642571, "examples_seen": 103014400.0, "progress": 0.8934042609877179, "epoch": 80.40669171154111, "img/sec/core": 734.2582085522739, "core_hours_NVIDIA A100-SXM4-40GB": 40.17554161547109, "core_hours": 40.17554161547109} {"step": 100650, "global_schedule": 0.03312012553215027, "l2_grads": 2.7486162185668945, "l2_params": 239.63525390625, "l2_updates": 0.03555416688323021, "train/loss": 1.4829826354980469, "uptime": 18521.333307333, "examples_seen": 103065600.0, "progress": 0.8938482988907933, "epoch": 80.44665527601008, "img/sec/core": 741.7138313433089, "core_hours_NVIDIA A100-SXM4-40GB": 40.19471642605332, "core_hours": 40.19471642605332} {"step": 100700, "global_schedule": 0.03284671902656555, "l2_grads": 2.779829978942871, "l2_params": 239.6153564453125, "l2_updates": 0.03505340591073036, "train/loss": 3.514320135116577, "uptime": 18530.058684187003, "examples_seen": 103116800.0, "progress": 0.8942923367938688, "epoch": 80.48661884047903, "img/sec/core": 733.4926739658714, "core_hours_NVIDIA A100-SXM4-40GB": 40.21410615239554, "core_hours": 40.21410615239554} {"step": 100750, "global_schedule": 0.03257441520690918, "l2_grads": 2.7876036167144775, "l2_params": 239.59750366210938, "l2_updates": 0.03542466461658478, "train/loss": 3.721400260925293, "uptime": 18538.795784909, "examples_seen": 103168000.0, "progress": 0.8947363746969441, "epoch": 80.52658240494799, "img/sec/core": 732.5084377115554, "core_hours_NVIDIA A100-SXM4-40GB": 40.23352193177776, "core_hours": 40.23352193177776} {"step": 100800, "global_schedule": 0.03230315446853638, "l2_grads": 2.4721474647521973, "l2_params": 239.5778350830078, "l2_updates": 0.0341559536755085, "train/loss": 2.2871570587158203, "uptime": 18547.839195769004, "examples_seen": 103219200.0, "progress": 0.8951804126000196, "epoch": 80.56654596941695, "img/sec/core": 707.6975821486182, "core_hours_NVIDIA A100-SXM4-40GB": 40.253618400355535, "core_hours": 40.253618400355535} {"step": 100850, "global_schedule": 0.03203308582305908, "l2_grads": 2.823763608932495, "l2_params": 239.558837890625, "l2_updates": 0.03459075465798378, "train/loss": 1.6983250379562378, "uptime": 18556.662417787004, "examples_seen": 103270400.0, "progress": 0.8956244505030949, "epoch": 80.6065095338859, "img/sec/core": 725.3586033473591, "core_hours_NVIDIA A100-SXM4-40GB": 40.27322556039554, "core_hours": 40.27322556039554} {"step": 100900, "global_schedule": 0.03176400065422058, "l2_grads": 2.497809886932373, "l2_params": 239.5405731201172, "l2_updates": 0.033734217286109924, "train/loss": 1.8198237419128418, "uptime": 18565.375401609002, "examples_seen": 103321600.0, "progress": 0.8960684884061704, "epoch": 80.64647309835486, "img/sec/core": 734.5359673274031, "core_hours_NVIDIA A100-SXM4-40GB": 40.29258774666665, "core_hours": 40.29258774666665} {"step": 100950, "global_schedule": 0.0314960777759552, "l2_grads": 2.844087839126587, "l2_params": 239.52151489257812, "l2_updates": 0.033580709248781204, "train/loss": 3.505676031112671, "uptime": 18574.686112100004, "examples_seen": 103372800.0, "progress": 0.8965125263092457, "epoch": 80.68643666282382, "img/sec/core": 687.3804105696853, "core_hours_NVIDIA A100-SXM4-40GB": 40.31327821442442, "core_hours": 40.31327821442442} {"step": 101000, "global_schedule": 0.031229227781295776, "l2_grads": 2.5860347747802734, "l2_params": 239.50341796875, "l2_updates": 0.03291349858045578, "train/loss": 1.6620795726776123, "uptime": 18584.347131241004, "examples_seen": 103424000.0, "progress": 0.8969565642123212, "epoch": 80.72640022729277, "img/sec/core": 662.4559900558841, "core_hours_NVIDIA A100-SXM4-40GB": 40.334747145848866, "core_hours": 40.334747145848866} {"step": 101050, "global_schedule": 0.030963480472564697, "l2_grads": 2.819258451461792, "l2_params": 239.4860382080078, "l2_updates": 0.03283235430717468, "train/loss": 1.5343647003173828, "uptime": 18593.617323926002, "examples_seen": 103475200.0, "progress": 0.8974006021153965, "epoch": 80.76636379176173, "img/sec/core": 768.727130167606, "core_hours_NVIDIA A100-SXM4-40GB": 40.35324814791331, "core_hours": 40.35324814791331} {"step": 101100, "global_schedule": 0.03069886565208435, "l2_grads": 2.8301897048950195, "l2_params": 239.4663848876953, "l2_updates": 0.03314734622836113, "train/loss": 1.5157437324523926, "uptime": 18602.281181026003, "examples_seen": 103526400.0, "progress": 0.897844640018472, "epoch": 80.80632735623068, "img/sec/core": 738.7010111235293, "core_hours_NVIDIA A100-SXM4-40GB": 40.37250116369109, "core_hours": 40.37250116369109} {"step": 101150, "global_schedule": 0.03043532371520996, "l2_grads": 2.7239742279052734, "l2_params": 239.4476776123047, "l2_updates": 0.03265543282032013, "train/loss": 1.4691603183746338, "uptime": 18611.144507158002, "examples_seen": 103577600.0, "progress": 0.8982886779215474, "epoch": 80.84629092069964, "img/sec/core": 722.076555086259, "core_hours_NVIDIA A100-SXM4-40GB": 40.39219744398442, "core_hours": 40.39219744398442} {"step": 101200, "global_schedule": 0.03017285466194153, "l2_grads": 2.747438430786133, "l2_params": 239.42880249023438, "l2_updates": 0.03207997605204582, "train/loss": 3.674617290496826, "uptime": 18620.658733581004, "examples_seen": 103628800.0, "progress": 0.8987327158246228, "epoch": 80.8862544851686, "img/sec/core": 672.6768646715519, "core_hours_NVIDIA A100-SXM4-40GB": 40.41334016936887, "core_hours": 40.41334016936887} {"step": 101250, "global_schedule": 0.029911547899246216, "l2_grads": 2.56225848197937, "l2_params": 239.40988159179688, "l2_updates": 0.03218495473265648, "train/loss": 2.3770790100097656, "uptime": 18630.434887543, "examples_seen": 103680000.0, "progress": 0.8991767537276982, "epoch": 80.92621804963755, "img/sec/core": 654.6541743180916, "core_hours_NVIDIA A100-SXM4-40GB": 40.4350649559511, "core_hours": 40.4350649559511} {"step": 101300, "global_schedule": 0.02965131402015686, "l2_grads": 2.9664525985717773, "l2_params": 239.39283752441406, "l2_updates": 0.03179292380809784, "train/loss": 1.5829949378967285, "uptime": 18640.227326957, "examples_seen": 103731200.0, "progress": 0.8996207916307736, "epoch": 80.96618161410652, "img/sec/core": 653.5654426261426, "core_hours_NVIDIA A100-SXM4-40GB": 40.456825932426646, "core_hours": 40.456825932426646} {"step": 101350, "global_schedule": 0.02939218282699585, "l2_grads": 2.7355244159698486, "l2_params": 239.37567138671875, "l2_updates": 0.031744133681058884, "train/loss": 3.400954246520996, "uptime": 18649.852168662997, "examples_seen": 103782400.0, "progress": 0.900064829533849, "epoch": 81.00614517857547, "img/sec/core": 664.9460007234998, "core_hours_NVIDIA A100-SXM4-40GB": 40.478214469551084, "core_hours": 40.478214469551084} {"step": 101400, "global_schedule": 0.02913418412208557, "l2_grads": 2.79821515083313, "l2_params": 239.35748291015625, "l2_updates": 0.03135501220822334, "train/loss": 1.4816533327102661, "uptime": 18659.414663037, "examples_seen": 103833600.0, "progress": 0.9005088674369244, "epoch": 81.04610874304443, "img/sec/core": 669.281439516562, "core_hours_NVIDIA A100-SXM4-40GB": 40.49946445704886, "core_hours": 40.49946445704886} {"step": 101450, "global_schedule": 0.028877228498458862, "l2_grads": 2.6694726943969727, "l2_params": 239.33946228027344, "l2_updates": 0.03077477589249611, "train/loss": 3.3152029514312744, "uptime": 18668.611164192, "examples_seen": 103884800.0, "progress": 0.9009529053399998, "epoch": 81.08607230751339, "img/sec/core": 695.9168375158737, "core_hours_NVIDIA A100-SXM4-40GB": 40.5199011262822, "core_hours": 40.5199011262822} {"step": 101500, "global_schedule": 0.028621405363082886, "l2_grads": 2.5647337436676025, "l2_params": 239.32217407226562, "l2_updates": 0.03038337454199791, "train/loss": 1.9391107559204102, "uptime": 18678.125322214997, "examples_seen": 103936000.0, "progress": 0.9013969432430752, "epoch": 81.12603587198234, "img/sec/core": 672.6817007379998, "core_hours_NVIDIA A100-SXM4-40GB": 40.54104369966664, "core_hours": 40.54104369966664} {"step": 101550, "global_schedule": 0.028366655111312866, "l2_grads": 2.5014381408691406, "l2_params": 239.30520629882812, "l2_updates": 0.030606118962168694, "train/loss": 1.8570271730422974, "uptime": 18686.581010568, "examples_seen": 103987200.0, "progress": 0.9018409811461506, "epoch": 81.1659994364513, "img/sec/core": 756.886930172596, "core_hours_NVIDIA A100-SXM4-40GB": 40.55983411822887, "core_hours": 40.55983411822887} {"step": 101600, "global_schedule": 0.028113096952438354, "l2_grads": 2.7614824771881104, "l2_params": 239.28836059570312, "l2_updates": 0.029330555349588394, "train/loss": 1.757192850112915, "uptime": 18695.211755281, "examples_seen": 104038400.0, "progress": 0.9022850190492261, "epoch": 81.20596300092025, "img/sec/core": 741.5350833354177, "core_hours_NVIDIA A100-SXM4-40GB": 40.57901355092442, "core_hours": 40.57901355092442} {"step": 101650, "global_schedule": 0.027860552072525024, "l2_grads": 2.6557376384735107, "l2_params": 239.27198791503906, "l2_updates": 0.029789667576551437, "train/loss": 1.3498337268829346, "uptime": 18703.982675988, "examples_seen": 104089600.0, "progress": 0.9027290569523014, "epoch": 81.24592656538921, "img/sec/core": 729.6839424043677, "core_hours_NVIDIA A100-SXM4-40GB": 40.59850448582886, "core_hours": 40.59850448582886} {"step": 101700, "global_schedule": 0.027609169483184814, "l2_grads": 2.614915132522583, "l2_params": 239.25550842285156, "l2_updates": 0.02908473275601864, "train/loss": 2.1493120193481445, "uptime": 18712.627704467, "examples_seen": 104140800.0, "progress": 0.9031730948553769, "epoch": 81.28589012985817, "img/sec/core": 740.3098804759229, "core_hours_NVIDIA A100-SXM4-40GB": 40.617715660226644, "core_hours": 40.617715660226644} {"step": 101750, "global_schedule": 0.02735885977745056, "l2_grads": 2.7161052227020264, "l2_params": 239.239501953125, "l2_updates": 0.029529282823204994, "train/loss": 1.4976000785827637, "uptime": 18721.370417516002, "examples_seen": 104192000.0, "progress": 0.9036171327584522, "epoch": 81.32585369432712, "img/sec/core": 732.0382087494395, "core_hours_NVIDIA A100-SXM4-40GB": 40.63714391144664, "core_hours": 40.63714391144664} {"step": 101800, "global_schedule": 0.02710971236228943, "l2_grads": 2.65480899810791, "l2_params": 239.22279357910156, "l2_updates": 0.02920869179069996, "train/loss": 1.460096836090088, "uptime": 18730.077897263, "examples_seen": 104243200.0, "progress": 0.9040611706615277, "epoch": 81.36581725879608, "img/sec/core": 735.0002740120083, "core_hours_NVIDIA A100-SXM4-40GB": 40.65649386643998, "core_hours": 40.65649386643998} {"step": 101850, "global_schedule": 0.026861608028411865, "l2_grads": 2.6682417392730713, "l2_params": 239.207275390625, "l2_updates": 0.028606470674276352, "train/loss": 1.466106653213501, "uptime": 18739.034126744, "examples_seen": 104294400.0, "progress": 0.904505208564603, "epoch": 81.40578082326503, "img/sec/core": 714.5864242958774, "core_hours_NVIDIA A100-SXM4-40GB": 40.676396598619974, "core_hours": 40.676396598619974} {"step": 101900, "global_schedule": 0.026614665985107422, "l2_grads": 2.569321870803833, "l2_params": 239.19049072265625, "l2_updates": 0.02819417230784893, "train/loss": 2.8329319953918457, "uptime": 18747.981610604, "examples_seen": 104345600.0, "progress": 0.9049492464676785, "epoch": 81.445744387734, "img/sec/core": 715.2848890414268, "core_hours_NVIDIA A100-SXM4-40GB": 40.69627989608664, "core_hours": 40.69627989608664} {"step": 101950, "global_schedule": 0.026368796825408936, "l2_grads": 2.7602648735046387, "l2_params": 239.17483520507812, "l2_updates": 0.02771993726491928, "train/loss": 1.8265630006790161, "uptime": 18757.308592457004, "examples_seen": 104396800.0, "progress": 0.9053932843707538, "epoch": 81.48570795220296, "img/sec/core": 686.1812428572202, "core_hours_NVIDIA A100-SXM4-40GB": 40.71700652242665, "core_hours": 40.71700652242665} {"step": 102000, "global_schedule": 0.026124030351638794, "l2_grads": 2.559748411178589, "l2_params": 239.1583709716797, "l2_updates": 0.028080446645617485, "train/loss": 1.546312928199768, "uptime": 18766.459661975998, "examples_seen": 104448000.0, "progress": 0.9058373222738293, "epoch": 81.5256715166719, "img/sec/core": 699.371804215219, "core_hours_NVIDIA A100-SXM4-40GB": 40.73734223246887, "core_hours": 40.73734223246887} {"step": 102050, "global_schedule": 0.025880426168441772, "l2_grads": 2.5470709800720215, "l2_params": 239.14295959472656, "l2_updates": 0.02750716730952263, "train/loss": 2.4430036544799805, "uptime": 18774.900270763, "examples_seen": 104499200.0, "progress": 0.9062813601769047, "epoch": 81.56563508114087, "img/sec/core": 824.7627435201562, "core_hours_NVIDIA A100-SXM4-40GB": 40.75458624880443, "core_hours": 40.75458624880443} {"step": 102100, "global_schedule": 0.025637894868850708, "l2_grads": 2.534083843231201, "l2_params": 239.1289825439453, "l2_updates": 0.027771346271038055, "train/loss": 1.897287368774414, "uptime": 18783.635892509003, "examples_seen": 104550400.0, "progress": 0.9067253980799801, "epoch": 81.60559864560982, "img/sec/core": 732.6324543448154, "core_hours_NVIDIA A100-SXM4-40GB": 40.773998741573315, "core_hours": 40.773998741573315} {"step": 102150, "global_schedule": 0.02539646625518799, "l2_grads": 2.6685619354248047, "l2_params": 239.11280822753906, "l2_updates": 0.02687647193670273, "train/loss": 1.725475549697876, "uptime": 18792.698832371003, "examples_seen": 104601600.0, "progress": 0.9071694359830555, "epoch": 81.64556221007878, "img/sec/core": 706.1726214066931, "core_hours_NVIDIA A100-SXM4-40GB": 40.79413860793331, "core_hours": 40.79413860793331} {"step": 102200, "global_schedule": 0.025156140327453613, "l2_grads": 2.715766429901123, "l2_params": 239.0982208251953, "l2_updates": 0.0271091740578413, "train/loss": 1.6356791257858276, "uptime": 18802.576656762, "examples_seen": 104652800.0, "progress": 0.9076134738861309, "epoch": 81.68552577454774, "img/sec/core": 647.9159526091955, "core_hours_NVIDIA A100-SXM4-40GB": 40.81608932880219, "core_hours": 40.81608932880219} {"step": 102250, "global_schedule": 0.02491697669029236, "l2_grads": 2.7364702224731445, "l2_params": 239.0826873779297, "l2_updates": 0.026413917541503906, "train/loss": 1.5721988677978516, "uptime": 18812.364234505003, "examples_seen": 104704000.0, "progress": 0.9080575117892064, "epoch": 81.72548933901669, "img/sec/core": 653.8900806766095, "core_hours_NVIDIA A100-SXM4-40GB": 40.837839501564424, "core_hours": 40.837839501564424} {"step": 102300, "global_schedule": 0.024678915739059448, "l2_grads": 2.552825689315796, "l2_params": 239.06744384765625, "l2_updates": 0.02616482600569725, "train/loss": 2.2776613235473633, "uptime": 18821.330954310004, "examples_seen": 104755200.0, "progress": 0.9085015496922817, "epoch": 81.76545290348565, "img/sec/core": 713.7504170065066, "core_hours_NVIDIA A100-SXM4-40GB": 40.85776554557553, "core_hours": 40.85776554557553} {"step": 102350, "global_schedule": 0.024441957473754883, "l2_grads": 2.686131238937378, "l2_params": 239.05194091796875, "l2_updates": 0.026510996744036674, "train/loss": 1.3962494134902954, "uptime": 18830.637167768, "examples_seen": 104806400.0, "progress": 0.9089455875953572, "epoch": 81.8054164679546, "img/sec/core": 687.7125727756235, "core_hours_NVIDIA A100-SXM4-40GB": 40.87844601992665, "core_hours": 40.87844601992665} {"step": 102400, "global_schedule": 0.024206072092056274, "l2_grads": 2.528610944747925, "l2_params": 239.03726196289062, "l2_updates": 0.025989774614572525, "train/loss": 2.1903865337371826, "uptime": 18840.602659416, "examples_seen": 104857600.0, "progress": 0.9093896254984325, "epoch": 81.84538003242356, "img/sec/core": 642.2161822076074, "core_hours_NVIDIA A100-SXM4-40GB": 40.9005915569222, "core_hours": 40.9005915569222} {"step": 102450, "global_schedule": 0.023971349000930786, "l2_grads": 2.7312169075012207, "l2_params": 239.0226287841797, "l2_updates": 0.025587933138012886, "train/loss": 3.0573599338531494, "uptime": 18850.254633285003, "examples_seen": 104908800.0, "progress": 0.909833663401508, "epoch": 81.88534359689253, "img/sec/core": 663.0768055180033, "core_hours_NVIDIA A100-SXM4-40GB": 40.9220403877422, "core_hours": 40.9220403877422} {"step": 102500, "global_schedule": 0.02373775839805603, "l2_grads": 2.5343844890594482, "l2_params": 239.0083770751953, "l2_updates": 0.02594793774187565, "train/loss": 1.6001232862472534, "uptime": 18859.203041695997, "examples_seen": 104960000.0, "progress": 0.9102777013045834, "epoch": 81.92530716136147, "img/sec/core": 715.2109856915638, "core_hours_NVIDIA A100-SXM4-40GB": 40.94192573976664, "core_hours": 40.94192573976664, "val/acc@1": 0.76536, "val/loss": 0.9341396875, "z/secs/eval/val": 2.6359289239990176} {"step": 102550, "global_schedule": 0.02350527048110962, "l2_grads": 2.905472993850708, "l2_params": 238.99510192871094, "l2_updates": 0.025051511824131012, "train/loss": 3.774599313735962, "uptime": 18870.771148412998, "examples_seen": 105011200.0, "progress": 0.9107217392076588, "epoch": 81.96527072583044, "img/sec/core": 716.582619342693, "core_hours_NVIDIA A100-SXM4-40GB": 40.96177302860441, "core_hours": 40.96177302860441} {"step": 102600, "global_schedule": 0.023273885250091553, "l2_grads": 2.5009031295776367, "l2_params": 238.9806365966797, "l2_updates": 0.025084776803851128, "train/loss": 1.8316271305084229, "uptime": 18880.61739182, "examples_seen": 105062400.0, "progress": 0.9111657771107342, "epoch": 82.00523429029938, "img/sec/core": 649.9940876383812, "core_hours_NVIDIA A100-SXM4-40GB": 40.98365356950887, "core_hours": 40.98365356950887} {"step": 102650, "global_schedule": 0.02304360270500183, "l2_grads": 2.7848446369171143, "l2_params": 238.9657745361328, "l2_updates": 0.02452705428004265, "train/loss": 3.4309732913970947, "uptime": 18889.944929359, "examples_seen": 105113600.0, "progress": 0.9116098150138096, "epoch": 82.04519785476835, "img/sec/core": 686.1403637608312, "core_hours_NVIDIA A100-SXM4-40GB": 41.00438143070664, "core_hours": 41.00438143070664} {"step": 102700, "global_schedule": 0.022814452648162842, "l2_grads": 2.7143969535827637, "l2_params": 238.9528350830078, "l2_updates": 0.024563461542129517, "train/loss": 1.773769497871399, "uptime": 18899.716474697, "examples_seen": 105164800.0, "progress": 0.912053852916885, "epoch": 82.08516141923731, "img/sec/core": 654.9629335608801, "core_hours_NVIDIA A100-SXM4-40GB": 41.026095975902194, "core_hours": 41.026095975902194} {"step": 102750, "global_schedule": 0.022586405277252197, "l2_grads": 2.5962870121002197, "l2_params": 238.93820190429688, "l2_updates": 0.02431493066251278, "train/loss": 1.777825951576233, "uptime": 18909.554125538, "examples_seen": 105216000.0, "progress": 0.9124978908199604, "epoch": 82.12512498370626, "img/sec/core": 650.5618163766164, "core_hours_NVIDIA A100-SXM4-40GB": 41.047957422215525, "core_hours": 41.047957422215525} {"step": 102800, "global_schedule": 0.02235954999923706, "l2_grads": 2.662858486175537, "l2_params": 238.92410278320312, "l2_updates": 0.024160120636224747, "train/loss": 1.4524800777435303, "uptime": 18918.682926964, "examples_seen": 105267200.0, "progress": 0.9129419287230358, "epoch": 82.16508854817522, "img/sec/core": 701.0777977676398, "core_hours_NVIDIA A100-SXM4-40GB": 41.06824364760664, "core_hours": 41.06824364760664} {"step": 102850, "global_schedule": 0.022133708000183105, "l2_grads": 2.7448270320892334, "l2_params": 238.9108428955078, "l2_updates": 0.023904908448457718, "train/loss": 1.4486764669418335, "uptime": 18927.557166999002, "examples_seen": 105318400.0, "progress": 0.9133859666261112, "epoch": 82.20505211264418, "img/sec/core": 721.1885158345482, "core_hours_NVIDIA A100-SXM4-40GB": 41.087964181017746, "core_hours": 41.087964181017746} {"step": 102900, "global_schedule": 0.021909058094024658, "l2_grads": 2.4720115661621094, "l2_params": 238.89686584472656, "l2_updates": 0.023157628253102303, "train/loss": 2.7929885387420654, "uptime": 18936.393248770997, "examples_seen": 105369600.0, "progress": 0.9138300045291866, "epoch": 82.24501567711313, "img/sec/core": 724.3029393731407, "core_hours_NVIDIA A100-SXM4-40GB": 41.10759991828886, "core_hours": 41.10759991828886} {"step": 102950, "global_schedule": 0.021685481071472168, "l2_grads": 2.725572109222412, "l2_params": 238.88357543945312, "l2_updates": 0.022956615313887596, "train/loss": 3.220125436782837, "uptime": 18945.206930419, "examples_seen": 105420800.0, "progress": 0.9142740424322621, "epoch": 82.28497924158209, "img/sec/core": 726.143767792231, "core_hours_NVIDIA A100-SXM4-40GB": 41.12718587750664, "core_hours": 41.12718587750664} {"step": 103000, "global_schedule": 0.021463096141815186, "l2_grads": 2.6069889068603516, "l2_params": 238.8699188232422, "l2_updates": 0.02281213365495205, "train/loss": 2.542593002319336, "uptime": 18954.082573954, "examples_seen": 105472000.0, "progress": 0.9147180803353374, "epoch": 82.32494280605104, "img/sec/core": 721.0744747422525, "core_hours_NVIDIA A100-SXM4-40GB": 41.146909529806635, "core_hours": 41.146909529806635} {"step": 103050, "global_schedule": 0.021241754293441772, "l2_grads": 2.85089111328125, "l2_params": 238.85629272460938, "l2_updates": 0.02299337647855282, "train/loss": 1.378968596458435, "uptime": 18963.894228310004, "examples_seen": 105523200.0, "progress": 0.9151621182384129, "epoch": 82.36490637052, "img/sec/core": 697.9508973453818, "core_hours_NVIDIA A100-SXM4-40GB": 41.167286639824425, "core_hours": 41.167286639824425} {"step": 103100, "global_schedule": 0.021021604537963867, "l2_grads": 2.8179268836975098, "l2_params": 238.8426513671875, "l2_updates": 0.02263183705508709, "train/loss": 1.5016911029815674, "uptime": 18973.726854865003, "examples_seen": 105574400.0, "progress": 0.9156061561414882, "epoch": 82.40486993498897, "img/sec/core": 650.8942411472406, "core_hours_NVIDIA A100-SXM4-40GB": 41.18913692105776, "core_hours": 41.18913692105776} {"step": 103150, "global_schedule": 0.02080252766609192, "l2_grads": 2.824014663696289, "l2_params": 238.82974243164062, "l2_updates": 0.022433539852499962, "train/loss": 1.6925885677337646, "uptime": 18983.342488185997, "examples_seen": 105625600.0, "progress": 0.9160501940445637, "epoch": 82.44483349945791, "img/sec/core": 665.5827844458133, "core_hours_NVIDIA A100-SXM4-40GB": 41.21050499510442, "core_hours": 41.21050499510442} {"step": 103200, "global_schedule": 0.020584583282470703, "l2_grads": 2.4676120281219482, "l2_params": 238.81597900390625, "l2_updates": 0.02215775102376938, "train/loss": 2.3747496604919434, "uptime": 18993.153888380002, "examples_seen": 105676800.0, "progress": 0.916494231947639, "epoch": 82.48479706392688, "img/sec/core": 652.3024108131931, "core_hours_NVIDIA A100-SXM4-40GB": 41.23230810664665, "core_hours": 41.23230810664665} {"step": 103250, "global_schedule": 0.020367801189422607, "l2_grads": 2.7537620067596436, "l2_params": 238.80401611328125, "l2_updates": 0.021630143746733665, "train/loss": 1.451356053352356, "uptime": 19001.960952096, "examples_seen": 105728000.0, "progress": 0.9169382698507145, "epoch": 82.52476062839582, "img/sec/core": 726.6894173107569, "core_hours_NVIDIA A100-SXM4-40GB": 41.25187935934887, "core_hours": 41.25187935934887} {"step": 103300, "global_schedule": 0.02015209197998047, "l2_grads": 3.0566344261169434, "l2_params": 238.79153442382812, "l2_updates": 0.021483037620782852, "train/loss": 1.583073616027832, "uptime": 19011.080697792997, "examples_seen": 105779200.0, "progress": 0.9173823077537898, "epoch": 82.56472419286479, "img/sec/core": 701.7739543009019, "core_hours_NVIDIA A100-SXM4-40GB": 41.272145460897754, "core_hours": 41.272145460897754} {"step": 103350, "global_schedule": 0.019937515258789062, "l2_grads": 2.563838481903076, "l2_params": 238.77880859375, "l2_updates": 0.021320287138223648, "train/loss": 2.5005431175231934, "uptime": 19019.706107482998, "examples_seen": 105830400.0, "progress": 0.9178263456568653, "epoch": 82.60468775733375, "img/sec/core": 741.9937405894026, "core_hours_NVIDIA A100-SXM4-40GB": 41.29131303798665, "core_hours": 41.29131303798665} {"step": 103400, "global_schedule": 0.01972407102584839, "l2_grads": 2.6026320457458496, "l2_params": 238.76666259765625, "l2_updates": 0.02127237617969513, "train/loss": 3.029270648956299, "uptime": 19028.398691946997, "examples_seen": 105881600.0, "progress": 0.9182703835599407, "epoch": 82.6446513218027, "img/sec/core": 736.2597426008371, "core_hours_NVIDIA A100-SXM4-40GB": 41.31062989235109, "core_hours": 41.31062989235109} {"step": 103450, "global_schedule": 0.019511759281158447, "l2_grads": 2.941089153289795, "l2_params": 238.75567626953125, "l2_updates": 0.020973598584532738, "train/loss": 1.4581282138824463, "uptime": 19037.008051311997, "examples_seen": 105932800.0, "progress": 0.9187144214630161, "epoch": 82.68461488627166, "img/sec/core": 743.3770305858056, "core_hours_NVIDIA A100-SXM4-40GB": 41.32976180205109, "core_hours": 41.32976180205109} {"step": 103500, "global_schedule": 0.01930058002471924, "l2_grads": 2.85593581199646, "l2_params": 238.74386596679688, "l2_updates": 0.020495008677244186, "train/loss": 1.4161003828048706, "uptime": 19046.258129314003, "examples_seen": 105984000.0, "progress": 0.9191584593660915, "epoch": 82.72457845074061, "img/sec/core": 691.8860574597277, "core_hours_NVIDIA A100-SXM4-40GB": 41.35031753094442, "core_hours": 41.35031753094442} {"step": 103550, "global_schedule": 0.019090503454208374, "l2_grads": 2.867823362350464, "l2_params": 238.73184204101562, "l2_updates": 0.020362157374620438, "train/loss": 3.4793648719787598, "uptime": 19054.679246886, "examples_seen": 106035200.0, "progress": 0.9196024972691669, "epoch": 82.76454201520957, "img/sec/core": 759.994139172098, "core_hours_NVIDIA A100-SXM4-40GB": 41.36903112554887, "core_hours": 41.36903112554887} {"step": 103600, "global_schedule": 0.018881559371948242, "l2_grads": 2.561054229736328, "l2_params": 238.71990966796875, "l2_updates": 0.02020583488047123, "train/loss": 2.0606980323791504, "uptime": 19063.245154898003, "examples_seen": 106086400.0, "progress": 0.9200465351722423, "epoch": 82.80450557967853, "img/sec/core": 747.147878664505, "core_hours_NVIDIA A100-SXM4-40GB": 41.388066476686646, "core_hours": 41.388066476686646} {"step": 103650, "global_schedule": 0.018673747777938843, "l2_grads": 2.561102867126465, "l2_params": 238.70858764648438, "l2_updates": 0.019936325028538704, "train/loss": 2.546556234359741, "uptime": 19071.824956458004, "examples_seen": 106137600.0, "progress": 0.9204905730753177, "epoch": 82.84446914414748, "img/sec/core": 745.937998127674, "core_hours_NVIDIA A100-SXM4-40GB": 41.407132702375534, "core_hours": 41.407132702375534} {"step": 103700, "global_schedule": 0.018467068672180176, "l2_grads": 2.7950363159179688, "l2_params": 238.69708251953125, "l2_updates": 0.020097367465496063, "train/loss": 1.5113415718078613, "uptime": 19080.517083858, "examples_seen": 106188800.0, "progress": 0.9209346109783931, "epoch": 82.88443270861644, "img/sec/core": 736.2984578437711, "core_hours_NVIDIA A100-SXM4-40GB": 41.4264485410422, "core_hours": 41.4264485410422} {"step": 103750, "global_schedule": 0.01826155185699463, "l2_grads": 2.7717387676239014, "l2_params": 238.6854705810547, "l2_updates": 0.0195435993373394, "train/loss": 1.4607335329055786, "uptime": 19089.023912099, "examples_seen": 106240000.0, "progress": 0.9213786488814685, "epoch": 82.92439627308539, "img/sec/core": 752.3368074078079, "core_hours_NVIDIA A100-SXM4-40GB": 41.445352603799975, "core_hours": 41.445352603799975} {"step": 103800, "global_schedule": 0.018057137727737427, "l2_grads": 2.838304042816162, "l2_params": 238.6738739013672, "l2_updates": 0.01940963976085186, "train/loss": 3.4000749588012695, "uptime": 19097.637629728997, "examples_seen": 106291200.0, "progress": 0.9218226867845439, "epoch": 82.96435983755435, "img/sec/core": 743.0009056380093, "core_hours_NVIDIA A100-SXM4-40GB": 41.46449419853331, "core_hours": 41.46449419853331} {"step": 103850, "global_schedule": 0.01785379648208618, "l2_grads": 2.558161973953247, "l2_params": 238.66314697265625, "l2_updates": 0.018981430679559708, "train/loss": 2.225004196166992, "uptime": 19107.230735844, "examples_seen": 106342400.0, "progress": 0.9222667246876194, "epoch": 83.00432340202332, "img/sec/core": 667.145752718459, "core_hours_NVIDIA A100-SXM4-40GB": 41.485812212122205, "core_hours": 41.485812212122205} {"step": 103900, "global_schedule": 0.017651647329330444, "l2_grads": 2.7177233695983887, "l2_params": 238.65219116210938, "l2_updates": 0.018894776701927185, "train/loss": 2.016092538833618, "uptime": 19116.472392385003, "examples_seen": 106393600.0, "progress": 0.9227107625906947, "epoch": 83.04428696649227, "img/sec/core": 692.5165387401412, "core_hours_NVIDIA A100-SXM4-40GB": 41.50634922665776, "core_hours": 41.50634922665776} {"step": 103950, "global_schedule": 0.017450600862503052, "l2_grads": 2.750648021697998, "l2_params": 238.64125061035156, "l2_updates": 0.018852567300200462, "train/loss": 1.4415055513381958, "uptime": 19124.908721754, "examples_seen": 106444800.0, "progress": 0.9231548004937702, "epoch": 83.08425053096123, "img/sec/core": 758.6237710819004, "core_hours_NVIDIA A100-SXM4-40GB": 41.525096625255536, "core_hours": 41.525096625255536} {"step": 104000, "global_schedule": 0.017250746488571167, "l2_grads": 2.5825114250183105, "l2_params": 238.63027954101562, "l2_updates": 0.018552424386143684, "train/loss": 3.1628823280334473, "uptime": 19133.539366999, "examples_seen": 106496000.0, "progress": 0.9235988383968455, "epoch": 83.12421409543018, "img/sec/core": 741.5436295113437, "core_hours_NVIDIA A100-SXM4-40GB": 41.54427583691108, "core_hours": 41.54427583691108} {"step": 104050, "global_schedule": 0.01705193519592285, "l2_grads": 2.517854690551758, "l2_params": 238.61952209472656, "l2_updates": 0.01817980781197548, "train/loss": 3.0758159160614014, "uptime": 19142.864296524, "examples_seen": 106547200.0, "progress": 0.924042876299921, "epoch": 83.16417765989914, "img/sec/core": 768.789817726014, "core_hours_NVIDIA A100-SXM4-40GB": 41.56277533039331, "core_hours": 41.56277533039331} {"step": 104100, "global_schedule": 0.016854315996170044, "l2_grads": 2.459601402282715, "l2_params": 238.6086883544922, "l2_updates": 0.017924398183822632, "train/loss": 2.621399402618408, "uptime": 19152.195474983004, "examples_seen": 106598400.0, "progress": 0.9244869142029963, "epoch": 83.2041412243681, "img/sec/core": 685.8726395728501, "core_hours_NVIDIA A100-SXM4-40GB": 41.58351128252443, "core_hours": 41.58351128252443} {"step": 104150, "global_schedule": 0.01665779948234558, "l2_grads": 2.7125730514526367, "l2_params": 238.5996856689453, "l2_updates": 0.017917899414896965, "train/loss": 1.408651351928711, "uptime": 19161.798252581, "examples_seen": 106649600.0, "progress": 0.9249309521060718, "epoch": 83.24410478883705, "img/sec/core": 666.4738337096217, "core_hours_NVIDIA A100-SXM4-40GB": 41.60485078829775, "core_hours": 41.60485078829775} {"step": 104200, "global_schedule": 0.01646244525909424, "l2_grads": 2.8082807064056396, "l2_params": 238.5893096923828, "l2_updates": 0.01779847778379917, "train/loss": 1.474746823310852, "uptime": 19171.237737407, "examples_seen": 106700800.0, "progress": 0.9253749900091471, "epoch": 83.28406835330601, "img/sec/core": 678.0031027088705, "core_hours_NVIDIA A100-SXM4-40GB": 41.625827421244416, "core_hours": 41.625827421244416} {"step": 104250, "global_schedule": 0.01626819372177124, "l2_grads": 2.8565800189971924, "l2_params": 238.57904052734375, "l2_updates": 0.017708921805024147, "train/loss": 1.4254519939422607, "uptime": 19180.753868961, "examples_seen": 106752000.0, "progress": 0.9258190279122226, "epoch": 83.32403191777496, "img/sec/core": 672.5421946600246, "core_hours_NVIDIA A100-SXM4-40GB": 41.646974380253305, "core_hours": 41.646974380253305} {"step": 104300, "global_schedule": 0.016075104475021362, "l2_grads": 2.697129011154175, "l2_params": 238.56752014160156, "l2_updates": 0.017580240964889526, "train/loss": 1.4393717050552368, "uptime": 19189.915919714003, "examples_seen": 106803200.0, "progress": 0.926263065815298, "epoch": 83.36399548224392, "img/sec/core": 698.5335677061951, "core_hours_NVIDIA A100-SXM4-40GB": 41.66733449303776, "core_hours": 41.66733449303776} {"step": 104350, "global_schedule": 0.01588311791419983, "l2_grads": 2.7410953044891357, "l2_params": 238.55795288085938, "l2_updates": 0.01708240807056427, "train/loss": 1.4587212800979614, "uptime": 19198.520827397, "examples_seen": 106854400.0, "progress": 0.9267071037183734, "epoch": 83.40395904671288, "img/sec/core": 743.7616109054823, "core_hours_NVIDIA A100-SXM4-40GB": 41.686456510111086, "core_hours": 41.686456510111086} {"step": 104400, "global_schedule": 0.01569226384162903, "l2_grads": 2.6267354488372803, "l2_params": 238.5482940673828, "l2_updates": 0.016910042613744736, "train/loss": 1.7869988679885864, "uptime": 19207.625330217, "examples_seen": 106905600.0, "progress": 0.9271511416214488, "epoch": 83.44392261118183, "img/sec/core": 702.9488733796541, "core_hours_NVIDIA A100-SXM4-40GB": 41.70668873859997, "core_hours": 41.70668873859997} {"step": 104450, "global_schedule": 0.015502572059631348, "l2_grads": 2.8717753887176514, "l2_params": 238.53851318359375, "l2_updates": 0.01666332222521305, "train/loss": 3.475966691970825, "uptime": 19217.234831351, "examples_seen": 106956800.0, "progress": 0.9275951795245242, "epoch": 83.4838861756508, "img/sec/core": 666.0075180547653, "core_hours_NVIDIA A100-SXM4-40GB": 41.72804318556442, "core_hours": 41.72804318556442} {"step": 104500, "global_schedule": 0.0153140127658844, "l2_grads": 2.538196325302124, "l2_params": 238.52883911132812, "l2_updates": 0.0164728332310915, "train/loss": 1.750781536102295, "uptime": 19226.888385863, "examples_seen": 107008000.0, "progress": 0.9280392174275996, "epoch": 83.52384974011974, "img/sec/core": 662.9682353834388, "core_hours_NVIDIA A100-SXM4-40GB": 41.74949552892442, "core_hours": 41.74949552892442} {"step": 104550, "global_schedule": 0.015126585960388184, "l2_grads": 2.8128747940063477, "l2_params": 238.51890563964844, "l2_updates": 0.016310224309563637, "train/loss": 1.4176784753799438, "uptime": 19235.987766467, "examples_seen": 107059200.0, "progress": 0.928483255330675, "epoch": 83.5638133045887, "img/sec/core": 703.3445767932291, "core_hours_NVIDIA A100-SXM4-40GB": 41.76971637471108, "core_hours": 41.76971637471108} {"step": 104600, "global_schedule": 0.0149402916431427, "l2_grads": 2.9062201976776123, "l2_params": 238.5096893310547, "l2_updates": 0.016045130789279938, "train/loss": 3.6798858642578125, "uptime": 19244.44498804, "examples_seen": 107110400.0, "progress": 0.9289272932337505, "epoch": 83.60377686905767, "img/sec/core": 756.7497132192824, "core_hours_NVIDIA A100-SXM4-40GB": 41.78851020042886, "core_hours": 41.78851020042886} {"step": 104650, "global_schedule": 0.01475512981414795, "l2_grads": 2.7183468341827393, "l2_params": 238.50030517578125, "l2_updates": 0.016077077016234398, "train/loss": 1.5684857368469238, "uptime": 19252.996960356002, "examples_seen": 107161600.0, "progress": 0.9293713311368258, "epoch": 83.64374043352662, "img/sec/core": 748.3653785953516, "core_hours_NVIDIA A100-SXM4-40GB": 41.8075145833533, "core_hours": 41.8075145833533} {"step": 104700, "global_schedule": 0.014571130275726318, "l2_grads": 2.679173231124878, "l2_params": 238.49148559570312, "l2_updates": 0.015752611681818962, "train/loss": 2.0455799102783203, "uptime": 19261.498586501002, "examples_seen": 107212800.0, "progress": 0.9298153690399013, "epoch": 83.68370399799558, "img/sec/core": 752.797157960651, "core_hours_NVIDIA A100-SXM4-40GB": 41.82640708589775, "core_hours": 41.82640708589775} {"step": 104750, "global_schedule": 0.014388233423233032, "l2_grads": 2.701767683029175, "l2_params": 238.4826202392578, "l2_updates": 0.015631835907697678, "train/loss": 1.3026000261306763, "uptime": 19270.135014571002, "examples_seen": 107264000.0, "progress": 0.9302594069429767, "epoch": 83.72366756246453, "img/sec/core": 741.0471028215286, "core_hours_NVIDIA A100-SXM4-40GB": 41.845599148275525, "core_hours": 41.845599148275525} {"step": 104800, "global_schedule": 0.014206469058990479, "l2_grads": 2.6360490322113037, "l2_params": 238.4736785888672, "l2_updates": 0.015043661929666996, "train/loss": 2.2152023315429688, "uptime": 19278.682270511003, "examples_seen": 107315200.0, "progress": 0.930703444846052, "epoch": 83.76363112693349, "img/sec/core": 748.7783266262703, "core_hours_NVIDIA A100-SXM4-40GB": 41.86459305036442, "core_hours": 41.86459305036442} {"step": 104850, "global_schedule": 0.014025866985321045, "l2_grads": 2.755718231201172, "l2_params": 238.4644317626953, "l2_updates": 0.014962059445679188, "train/loss": 2.9829936027526855, "uptime": 19287.354882751002, "examples_seen": 107366400.0, "progress": 0.9311474827491275, "epoch": 83.80359469140245, "img/sec/core": 737.955280703327, "core_hours_NVIDIA A100-SXM4-40GB": 41.88386552200886, "core_hours": 41.88386552200886} {"step": 104900, "global_schedule": 0.013846427202224731, "l2_grads": 2.9338107109069824, "l2_params": 238.4556427001953, "l2_updates": 0.014691676944494247, "train/loss": 1.47105872631073, "uptime": 19295.821819077, "examples_seen": 107417600.0, "progress": 0.9315915206522029, "epoch": 83.8435582558714, "img/sec/core": 755.8814373443539, "core_hours_NVIDIA A100-SXM4-40GB": 41.90268093606664, "core_hours": 41.90268093606664} {"step": 104950, "global_schedule": 0.013668090105056763, "l2_grads": 2.610382080078125, "l2_params": 238.4475555419922, "l2_updates": 0.014576960355043411, "train/loss": 3.020510196685791, "uptime": 19304.810960516, "examples_seen": 107468800.0, "progress": 0.9320355585552783, "epoch": 83.88352182034036, "img/sec/core": 711.9701078718037, "core_hours_NVIDIA A100-SXM4-40GB": 41.922656805931084, "core_hours": 41.922656805931084} {"step": 105000, "global_schedule": 0.013490885496139526, "l2_grads": 2.547485589981079, "l2_params": 238.4383544921875, "l2_updates": 0.014587460085749626, "train/loss": 1.9413890838623047, "uptime": 19313.993645567003, "examples_seen": 107520000.0, "progress": 0.9324795964583537, "epoch": 83.92348538480933, "img/sec/core": 696.9639015663098, "core_hours_NVIDIA A100-SXM4-40GB": 41.94306277271109, "core_hours": 41.94306277271109, "val/acc@1": 0.76744, "val/loss": 0.9231625134277344, "z/secs/eval/val": 4.3053047789981065} {"step": 105050, "global_schedule": 0.01331484317779541, "l2_grads": 2.6515424251556396, "l2_params": 238.43006896972656, "l2_updates": 0.014260582625865936, "train/loss": 1.3081759214401245, "uptime": 19328.081023430997, "examples_seen": 107571200.0, "progress": 0.9329236343614291, "epoch": 83.96344894927827, "img/sec/core": 721.5955430956284, "core_hours_NVIDIA A100-SXM4-40GB": 41.96277218244664, "core_hours": 41.96277218244664} {"step": 105100, "global_schedule": 0.013139963150024414, "l2_grads": 2.970060348510742, "l2_params": 238.42205810546875, "l2_updates": 0.013997497037053108, "train/loss": 1.3891491889953613, "uptime": 19337.676600295003, "examples_seen": 107622400.0, "progress": 0.9333676722645045, "epoch": 84.00341251374724, "img/sec/core": 666.9739704769675, "core_hours_NVIDIA A100-SXM4-40GB": 41.984095686588866, "core_hours": 41.984095686588866} {"step": 105150, "global_schedule": 0.012966185808181763, "l2_grads": 2.841150999069214, "l2_params": 238.41407775878906, "l2_updates": 0.013907059095799923, "train/loss": 1.386472225189209, "uptime": 19346.104820815002, "examples_seen": 107673600.0, "progress": 0.9338117101675799, "epoch": 84.04337607821618, "img/sec/core": 759.3536482360806, "core_hours_NVIDIA A100-SXM4-40GB": 42.0028250655222, "core_hours": 42.0028250655222} {"step": 105200, "global_schedule": 0.012793570756912231, "l2_grads": 2.617570161819458, "l2_params": 238.40586853027344, "l2_updates": 0.013730193488299847, "train/loss": 1.8163597583770752, "uptime": 19355.633688986003, "examples_seen": 107724800.0, "progress": 0.9342557480706553, "epoch": 84.08333964268515, "img/sec/core": 671.6432513440704, "core_hours_NVIDIA A100-SXM4-40GB": 42.02400032812442, "core_hours": 42.02400032812442} {"step": 105250, "global_schedule": 0.012622088193893433, "l2_grads": 2.8897931575775146, "l2_params": 238.39822387695312, "l2_updates": 0.013288239948451519, "train/loss": 1.5161619186401367, "uptime": 19364.110253281004, "examples_seen": 107776000.0, "progress": 0.9346997859737307, "epoch": 84.12330320715411, "img/sec/core": 755.0228815906797, "core_hours_NVIDIA A100-SXM4-40GB": 42.042837137668876, "core_hours": 42.042837137668876} {"step": 105300, "global_schedule": 0.012451738119125366, "l2_grads": 2.6588125228881836, "l2_params": 238.39039611816406, "l2_updates": 0.013380324468016624, "train/loss": 1.5329312086105347, "uptime": 19373.03267855, "examples_seen": 107827200.0, "progress": 0.9351438238768062, "epoch": 84.16326677162306, "img/sec/core": 717.2937634161021, "core_hours_NVIDIA A100-SXM4-40GB": 42.06266474937776, "core_hours": 42.06266474937776} {"step": 105350, "global_schedule": 0.012282520532608032, "l2_grads": 2.6976544857025146, "l2_params": 238.3827362060547, "l2_updates": 0.013325558975338936, "train/loss": 1.6052926778793335, "uptime": 19382.661225025004, "examples_seen": 107878400.0, "progress": 0.9355878617798815, "epoch": 84.20323033609202, "img/sec/core": 664.690149922143, "core_hours_NVIDIA A100-SXM4-40GB": 42.084061519322205, "core_hours": 42.084061519322205} {"step": 105400, "global_schedule": 0.012114524841308594, "l2_grads": 2.776252508163452, "l2_params": 238.37501525878906, "l2_updates": 0.01309411134570837, "train/loss": 1.4128203392028809, "uptime": 19391.361691036, "examples_seen": 107929600.0, "progress": 0.936031899682957, "epoch": 84.24319390056097, "img/sec/core": 735.5927822611718, "core_hours_NVIDIA A100-SXM4-40GB": 42.10339588823554, "core_hours": 42.10339588823554} {"step": 105450, "global_schedule": 0.011947572231292725, "l2_grads": 2.7716987133026123, "l2_params": 238.3672332763672, "l2_updates": 0.012802587822079659, "train/loss": 3.489166021347046, "uptime": 19400.296924092, "examples_seen": 107980800.0, "progress": 0.9364759375860323, "epoch": 84.28315746502993, "img/sec/core": 716.2655926140305, "core_hours_NVIDIA A100-SXM4-40GB": 42.12325196169331, "core_hours": 42.12325196169331} {"step": 105500, "global_schedule": 0.011781841516494751, "l2_grads": 2.602918863296509, "l2_params": 238.35903930664062, "l2_updates": 0.01260305568575859, "train/loss": 2.7784500122070312, "uptime": 19408.890438404, "examples_seen": 108032000.0, "progress": 0.9369199754891078, "epoch": 84.32312102949889, "img/sec/core": 744.7476978146962, "core_hours_NVIDIA A100-SXM4-40GB": 42.14234866016442, "core_hours": 42.14234866016442} {"step": 105550, "global_schedule": 0.011617183685302734, "l2_grads": 2.739108085632324, "l2_params": 238.3520050048828, "l2_updates": 0.012399693951010704, "train/loss": 1.8625234365463257, "uptime": 19417.515331466, "examples_seen": 108083200.0, "progress": 0.9373640133921831, "epoch": 84.36308459396784, "img/sec/core": 742.0381857484699, "core_hours_NVIDIA A100-SXM4-40GB": 42.16151508919109, "core_hours": 42.16151508919109} {"step": 105600, "global_schedule": 0.011453717947006226, "l2_grads": 2.676361083984375, "l2_params": 238.34413146972656, "l2_updates": 0.012290594168007374, "train/loss": 1.7992985248565674, "uptime": 19425.986639667004, "examples_seen": 108134400.0, "progress": 0.9378080512952586, "epoch": 84.4030481584368, "img/sec/core": 755.4913418500014, "core_hours_NVIDIA A100-SXM4-40GB": 42.18034021852665, "core_hours": 42.18034021852665} {"step": 105650, "global_schedule": 0.01129138469696045, "l2_grads": 2.576876163482666, "l2_params": 238.33636474609375, "l2_updates": 0.012087360955774784, "train/loss": 2.5257644653320312, "uptime": 19434.520392106002, "examples_seen": 108185600.0, "progress": 0.9382520891983339, "epoch": 84.44301172290575, "img/sec/core": 749.9631663502454, "core_hours_NVIDIA A100-SXM4-40GB": 42.199304112835534, "core_hours": 42.199304112835534} {"step": 105700, "global_schedule": 0.011130213737487793, "l2_grads": 2.6803956031799316, "l2_params": 238.32891845703125, "l2_updates": 0.01194180827587843, "train/loss": 1.3706530332565308, "uptime": 19443.08686666, "examples_seen": 108236800.0, "progress": 0.9386961271014094, "epoch": 84.48297528737471, "img/sec/core": 747.098466195805, "core_hours_NVIDIA A100-SXM4-40GB": 42.21834072295554, "core_hours": 42.21834072295554} {"step": 105750, "global_schedule": 0.01097017526626587, "l2_grads": 2.805572271347046, "l2_params": 238.32212829589844, "l2_updates": 0.011721069924533367, "train/loss": 1.5916836261749268, "uptime": 19451.598779542, "examples_seen": 108288000.0, "progress": 0.9391401650044848, "epoch": 84.52293885184368, "img/sec/core": 751.8873946109394, "core_hours_NVIDIA A100-SXM4-40GB": 42.23725608491553, "core_hours": 42.23725608491553} {"step": 105800, "global_schedule": 0.010811269283294678, "l2_grads": 2.6446921825408936, "l2_params": 238.31544494628906, "l2_updates": 0.011592713184654713, "train/loss": 2.5369815826416016, "uptime": 19460.646020553002, "examples_seen": 108339200.0, "progress": 0.9395842029075602, "epoch": 84.56290241631262, "img/sec/core": 707.3979782585197, "core_hours_NVIDIA A100-SXM4-40GB": 42.25736106493998, "core_hours": 42.25736106493998} {"step": 105850, "global_schedule": 0.010653525590896606, "l2_grads": 2.8784594535827637, "l2_params": 238.3082275390625, "l2_updates": 0.011532364413142204, "train/loss": 1.6549227237701416, "uptime": 19469.762589767, "examples_seen": 108390400.0, "progress": 0.9400282408106356, "epoch": 84.60286598078159, "img/sec/core": 702.0184731521896, "core_hours_NVIDIA A100-SXM4-40GB": 42.27762010763776, "core_hours": 42.27762010763776} {"step": 105900, "global_schedule": 0.010496944189071655, "l2_grads": 2.9156389236450195, "l2_params": 238.30149841308594, "l2_updates": 0.011196812614798546, "train/loss": 1.914515495300293, "uptime": 19478.296837333997, "examples_seen": 108441600.0, "progress": 0.940472278713711, "epoch": 84.64282954525054, "img/sec/core": 749.9196560397148, "core_hours_NVIDIA A100-SXM4-40GB": 42.29658510223109, "core_hours": 42.29658510223109} {"step": 105950, "global_schedule": 0.010341495275497437, "l2_grads": 2.7186310291290283, "l2_params": 238.29452514648438, "l2_updates": 0.011311736889183521, "train/loss": 1.3850665092468262, "uptime": 19487.087059498997, "examples_seen": 108492800.0, "progress": 0.9409163166167864, "epoch": 84.6827931097195, "img/sec/core": 728.0817116867357, "core_hours_NVIDIA A100-SXM4-40GB": 42.31611892926442, "core_hours": 42.31611892926442} {"step": 106000, "global_schedule": 0.010187149047851562, "l2_grads": 2.915198802947998, "l2_params": 238.28831481933594, "l2_updates": 0.010949395596981049, "train/loss": 1.4584133625030518, "uptime": 19495.523058359002, "examples_seen": 108544000.0, "progress": 0.9413603545198618, "epoch": 84.72275667418846, "img/sec/core": 758.6534927530047, "core_hours_NVIDIA A100-SXM4-40GB": 42.33486559339776, "core_hours": 42.33486559339776} {"step": 106050, "global_schedule": 0.010033994913101196, "l2_grads": 2.579824924468994, "l2_params": 238.28143310546875, "l2_updates": 0.010731836780905724, "train/loss": 1.586712121963501, "uptime": 19505.008905679002, "examples_seen": 108595200.0, "progress": 0.9418043924229372, "epoch": 84.76272023865741, "img/sec/core": 726.6613199704361, "core_hours_NVIDIA A100-SXM4-40GB": 42.35443760284887, "core_hours": 42.35443760284887} {"step": 106100, "global_schedule": 0.009881973266601562, "l2_grads": 2.802628993988037, "l2_params": 238.27493286132812, "l2_updates": 0.010485843755304813, "train/loss": 1.6331331729888916, "uptime": 19513.513537849, "examples_seen": 108646400.0, "progress": 0.9422484303260126, "epoch": 84.80268380312637, "img/sec/core": 752.5310762500116, "core_hours_NVIDIA A100-SXM4-40GB": 42.37333678544887, "core_hours": 42.37333678544887} {"step": 106150, "global_schedule": 0.009731143712997437, "l2_grads": 2.788381576538086, "l2_params": 238.2683563232422, "l2_updates": 0.010310224257409573, "train/loss": 1.3765153884887695, "uptime": 19522.232762891, "examples_seen": 108697600.0, "progress": 0.942692468229088, "epoch": 84.84264736759532, "img/sec/core": 734.0101865900573, "core_hours_NVIDIA A100-SXM4-40GB": 42.39271284109777, "core_hours": 42.39271284109777} {"step": 106200, "global_schedule": 0.009581416845321655, "l2_grads": 2.6702659130096436, "l2_params": 238.26303100585938, "l2_updates": 0.010214102454483509, "train/loss": 2.5562052726745605, "uptime": 19531.265604089, "examples_seen": 108748800.0, "progress": 0.9431365061321635, "epoch": 84.88261093206428, "img/sec/core": 708.5256852978293, "core_hours_NVIDIA A100-SXM4-40GB": 42.41278582153777, "core_hours": 42.41278582153777} {"step": 106250, "global_schedule": 0.009432852268218994, "l2_grads": 2.5306620597839355, "l2_params": 238.25717163085938, "l2_updates": 0.010173572227358818, "train/loss": 2.0257527828216553, "uptime": 19540.010290255, "examples_seen": 108800000.0, "progress": 0.9435805440352388, "epoch": 84.92257449653324, "img/sec/core": 731.8730344931419, "core_hours_NVIDIA A100-SXM4-40GB": 42.432218457462206, "core_hours": 42.432218457462206} {"step": 106300, "global_schedule": 0.009285449981689453, "l2_grads": 2.609727382659912, "l2_params": 238.25082397460938, "l2_updates": 0.009953741915524006, "train/loss": 2.712482213973999, "uptime": 19549.178066415, "examples_seen": 108851200.0, "progress": 0.9440245819383143, "epoch": 84.96253806100219, "img/sec/core": 698.0973235279939, "core_hours_NVIDIA A100-SXM4-40GB": 42.45259129337332, "core_hours": 42.45259129337332} {"step": 106350, "global_schedule": 0.009139180183410645, "l2_grads": 2.6180918216705322, "l2_params": 238.24473571777344, "l2_updates": 0.009820184670388699, "train/loss": 1.8683013916015625, "uptime": 19559.256902517, "examples_seen": 108902400.0, "progress": 0.9444686198413896, "epoch": 85.00250162547115, "img/sec/core": 634.9939551781082, "core_hours_NVIDIA A100-SXM4-40GB": 42.47498870693332, "core_hours": 42.47498870693332} {"step": 106400, "global_schedule": 0.008994102478027344, "l2_grads": 2.955533027648926, "l2_params": 238.2390594482422, "l2_updates": 0.009671526961028576, "train/loss": 3.602628231048584, "uptime": 19568.683479434003, "examples_seen": 108953600.0, "progress": 0.9449126577444651, "epoch": 85.0424651899401, "img/sec/core": 678.9314993502188, "core_hours_NVIDIA A100-SXM4-40GB": 42.495936655637756, "core_hours": 42.495936655637756} {"step": 106450, "global_schedule": 0.008850127458572388, "l2_grads": 2.5664172172546387, "l2_params": 238.23362731933594, "l2_updates": 0.009535766206681728, "train/loss": 2.7067790031433105, "uptime": 19577.271048586, "examples_seen": 109004800.0, "progress": 0.9453566956475404, "epoch": 85.08242875440907, "img/sec/core": 745.2632854212484, "core_hours_NVIDIA A100-SXM4-40GB": 42.51502014264221, "core_hours": 42.51502014264221} {"step": 106500, "global_schedule": 0.008707314729690552, "l2_grads": 2.9303650856018066, "l2_params": 238.22796630859375, "l2_updates": 0.009313422255218029, "train/loss": 3.4289793968200684, "uptime": 19585.939162461, "examples_seen": 109056000.0, "progress": 0.9458007335506159, "epoch": 85.12239231887803, "img/sec/core": 738.3382466232277, "core_hours_NVIDIA A100-SXM4-40GB": 42.534282617919985, "core_hours": 42.534282617919985} {"step": 106550, "global_schedule": 0.008565634489059448, "l2_grads": 2.870732307434082, "l2_params": 238.22222900390625, "l2_updates": 0.009212947450578213, "train/loss": 1.4067062139511108, "uptime": 19594.859070704, "examples_seen": 109107200.0, "progress": 0.9462447714536912, "epoch": 85.16235588334698, "img/sec/core": 717.4961698763489, "core_hours_NVIDIA A100-SXM4-40GB": 42.55410463623776, "core_hours": 42.55410463623776} {"step": 106600, "global_schedule": 0.00842517614364624, "l2_grads": 2.7689592838287354, "l2_params": 238.21653747558594, "l2_updates": 0.008942024782299995, "train/loss": 1.774864912033081, "uptime": 19603.792599924003, "examples_seen": 109158400.0, "progress": 0.9466888093567667, "epoch": 85.20231944781594, "img/sec/core": 716.4022014581967, "core_hours_NVIDIA A100-SXM4-40GB": 42.57395692339332, "core_hours": 42.57395692339332} {"step": 106650, "global_schedule": 0.00828579068183899, "l2_grads": 2.7291431427001953, "l2_params": 238.2115478515625, "l2_updates": 0.008758769370615482, "train/loss": 1.9374865293502808, "uptime": 19613.304237571, "examples_seen": 109209600.0, "progress": 0.9471328472598421, "epoch": 85.24228301228489, "img/sec/core": 672.8599466800396, "core_hours_NVIDIA A100-SXM4-40GB": 42.595093895942206, "core_hours": 42.595093895942206} {"step": 106700, "global_schedule": 0.008147597312927246, "l2_grads": 2.7644283771514893, "l2_params": 238.2057647705078, "l2_updates": 0.008649185299873352, "train/loss": 1.3699547052383423, "uptime": 19622.649176751, "examples_seen": 109260800.0, "progress": 0.9475768851629175, "epoch": 85.28224657675385, "img/sec/core": 684.8626702352648, "core_hours_NVIDIA A100-SXM4-40GB": 42.61586042745331, "core_hours": 42.61586042745331} {"step": 106750, "global_schedule": 0.008010536432266235, "l2_grads": 2.5619277954101562, "l2_params": 238.20071411132812, "l2_updates": 0.008713780902326107, "train/loss": 2.791773557662964, "uptime": 19631.608452368004, "examples_seen": 109312000.0, "progress": 0.948020923065993, "epoch": 85.32221014122281, "img/sec/core": 714.3434663238326, "core_hours_NVIDIA A100-SXM4-40GB": 42.63576992882443, "core_hours": 42.63576992882443} {"step": 106800, "global_schedule": 0.007874637842178345, "l2_grads": 2.7793123722076416, "l2_params": 238.19577026367188, "l2_updates": 0.008397449739277363, "train/loss": 1.4329438209533691, "uptime": 19640.504782823, "examples_seen": 109363200.0, "progress": 0.9484649609690683, "epoch": 85.36217370569176, "img/sec/core": 719.3977373451191, "core_hours_NVIDIA A100-SXM4-40GB": 42.65553955205776, "core_hours": 42.65553955205776} {"step": 106850, "global_schedule": 0.007739901542663574, "l2_grads": 2.835622549057007, "l2_params": 238.19105529785156, "l2_updates": 0.008202292956411839, "train/loss": 1.5229260921478271, "uptime": 19649.858190263003, "examples_seen": 109414400.0, "progress": 0.9489089988721437, "epoch": 85.40213727016072, "img/sec/core": 684.2426186449862, "core_hours_NVIDIA A100-SXM4-40GB": 42.67632490192443, "core_hours": 42.67632490192443} {"step": 106900, "global_schedule": 0.007606327533721924, "l2_grads": 2.817903518676758, "l2_params": 238.1858367919922, "l2_updates": 0.00822124257683754, "train/loss": 1.2338509559631348, "uptime": 19659.201368665003, "examples_seen": 109465600.0, "progress": 0.9493530367752191, "epoch": 85.44210083462968, "img/sec/core": 684.9917367124641, "core_hours_NVIDIA A100-SXM4-40GB": 42.697087520595545, "core_hours": 42.697087520595545} {"step": 106950, "global_schedule": 0.007473886013031006, "l2_grads": 3.024052858352661, "l2_params": 238.1810760498047, "l2_updates": 0.007943792268633842, "train/loss": 1.6103307008743286, "uptime": 19667.923178651, "examples_seen": 109516800.0, "progress": 0.9497970746782946, "epoch": 85.48206439909863, "img/sec/core": 733.7926428428256, "core_hours_NVIDIA A100-SXM4-40GB": 42.71646932056443, "core_hours": 42.71646932056443} {"step": 107000, "global_schedule": 0.007342606782913208, "l2_grads": 2.5116961002349854, "l2_params": 238.1761932373047, "l2_updates": 0.007922304794192314, "train/loss": 2.404074192047119, "uptime": 19676.516470123002, "examples_seen": 109568000.0, "progress": 0.9502411125813699, "epoch": 85.5220279635676, "img/sec/core": 744.767010505079, "core_hours_NVIDIA A100-SXM4-40GB": 42.73556552383554, "core_hours": 42.73556552383554} {"step": 107050, "global_schedule": 0.00721248984336853, "l2_grads": 2.6905195713043213, "l2_params": 238.17140197753906, "l2_updates": 0.007753756828606129, "train/loss": 1.7706161737442017, "uptime": 19686.246988596, "examples_seen": 109619200.0, "progress": 0.9506851504844454, "epoch": 85.56199152803654, "img/sec/core": 704.9005673532738, "core_hours_NVIDIA A100-SXM4-40GB": 42.75574173432665, "core_hours": 42.75574173432665} {"step": 107100, "global_schedule": 0.007083505392074585, "l2_grads": 2.827139139175415, "l2_params": 238.16696166992188, "l2_updates": 0.007690052036195993, "train/loss": 1.338139533996582, "uptime": 19695.702346701997, "examples_seen": 109670400.0, "progress": 0.9511291883875208, "epoch": 85.6019550925055, "img/sec/core": 676.8648980031186, "core_hours_NVIDIA A100-SXM4-40GB": 42.77675364122887, "core_hours": 42.77675364122887} {"step": 107150, "global_schedule": 0.0069557130336761475, "l2_grads": 2.7538235187530518, "l2_params": 238.1620635986328, "l2_updates": 0.00749086681753397, "train/loss": 1.4050999879837036, "uptime": 19705.243284666998, "examples_seen": 109721600.0, "progress": 0.9515732262905962, "epoch": 85.64191865697447, "img/sec/core": 670.7935869069852, "core_hours_NVIDIA A100-SXM4-40GB": 42.797955725595536, "core_hours": 42.797955725595536} {"step": 107200, "global_schedule": 0.006829023361206055, "l2_grads": 2.6199891567230225, "l2_params": 238.1576385498047, "l2_updates": 0.00728550786152482, "train/loss": 2.6474130153656006, "uptime": 19714.730097958003, "examples_seen": 109772800.0, "progress": 0.9520172641936716, "epoch": 85.68188222144342, "img/sec/core": 674.6206343146445, "core_hours_NVIDIA A100-SXM4-40GB": 42.81903753290887, "core_hours": 42.81903753290887} {"step": 107250, "global_schedule": 0.00670352578163147, "l2_grads": 2.7655858993530273, "l2_params": 238.15286254882812, "l2_updates": 0.007211735937744379, "train/loss": 3.30084228515625, "uptime": 19724.309217572998, "examples_seen": 109824000.0, "progress": 0.952461302096747, "epoch": 85.72184578591238, "img/sec/core": 668.1198541439248, "core_hours_NVIDIA A100-SXM4-40GB": 42.84032446538665, "core_hours": 42.84032446538665} {"step": 107300, "global_schedule": 0.006579160690307617, "l2_grads": 2.8321709632873535, "l2_params": 238.14846801757812, "l2_updates": 0.007057874463498592, "train/loss": 3.5412416458129883, "uptime": 19733.100088461004, "examples_seen": 109875200.0, "progress": 0.9529053399998224, "epoch": 85.76180935038133, "img/sec/core": 728.0279828400961, "core_hours_NVIDIA A100-SXM4-40GB": 42.85985973402665, "core_hours": 42.85985973402665} {"step": 107350, "global_schedule": 0.0064559876918792725, "l2_grads": 2.8608171939849854, "l2_params": 238.14427185058594, "l2_updates": 0.0069929868914186954, "train/loss": 3.385509967803955, "uptime": 19741.69810306, "examples_seen": 109926400.0, "progress": 0.9533493779028978, "epoch": 85.80177291485029, "img/sec/core": 744.3578894067664, "core_hours_NVIDIA A100-SXM4-40GB": 42.878966433135545, "core_hours": 42.878966433135545} {"step": 107400, "global_schedule": 0.00633394718170166, "l2_grads": 2.703626871109009, "l2_params": 238.13990783691406, "l2_updates": 0.006809577811509371, "train/loss": 1.2793877124786377, "uptime": 19750.730015273002, "examples_seen": 109977600.0, "progress": 0.9537934158059732, "epoch": 85.84173647931925, "img/sec/core": 708.5985613090024, "core_hours_NVIDIA A100-SXM4-40GB": 42.89903734916443, "core_hours": 42.89903734916443} {"step": 107450, "global_schedule": 0.006213068962097168, "l2_grads": 2.8892784118652344, "l2_params": 238.13595581054688, "l2_updates": 0.006706711836159229, "train/loss": 1.4214744567871094, "uptime": 19759.902301513, "examples_seen": 110028800.0, "progress": 0.9542374537090486, "epoch": 85.8817000437882, "img/sec/core": 697.7540639858124, "core_hours_NVIDIA A100-SXM4-40GB": 42.91942020747554, "core_hours": 42.91942020747554} {"step": 107500, "global_schedule": 0.006093353033065796, "l2_grads": 2.847496509552002, "l2_params": 238.13192749023438, "l2_updates": 0.006471985951066017, "train/loss": 3.4655606746673584, "uptime": 19768.924165452, "examples_seen": 110080000.0, "progress": 0.954681491612124, "epoch": 85.92166360825716, "img/sec/core": 709.3877765473213, "core_hours_NVIDIA A100-SXM4-40GB": 42.93946879400665, "core_hours": 42.93946879400665, "val/acc@1": 0.76708, "val/loss": 0.9246074731445313, "z/secs/eval/val": 3.639286646997789} {"step": 107550, "global_schedule": 0.005974799394607544, "l2_grads": 2.8248002529144287, "l2_params": 238.12808227539062, "l2_updates": 0.006462676916271448, "train/loss": 1.7145605087280273, "uptime": 19780.670007155, "examples_seen": 110131200.0, "progress": 0.9551255295151995, "epoch": 85.96162717272611, "img/sec/core": 789.5680590205749, "core_hours_NVIDIA A100-SXM4-40GB": 42.95748145556221, "core_hours": 42.95748145556221} {"step": 107600, "global_schedule": 0.005857378244400024, "l2_grads": 2.8028197288513184, "l2_params": 238.12420654296875, "l2_updates": 0.006246626842767, "train/loss": 1.341677188873291, "uptime": 19790.196374992003, "examples_seen": 110182400.0, "progress": 0.9555695674182748, "epoch": 86.00159073719507, "img/sec/core": 671.8195338986562, "core_hours_NVIDIA A100-SXM4-40GB": 42.97865116186666, "core_hours": 42.97865116186666} {"step": 107650, "global_schedule": 0.005741149187088013, "l2_grads": 3.0777626037597656, "l2_params": 238.12049865722656, "l2_updates": 0.006177023984491825, "train/loss": 3.635441780090332, "uptime": 19799.329568850997, "examples_seen": 110233600.0, "progress": 0.9560136053213503, "epoch": 86.04155430166404, "img/sec/core": 700.7406279562495, "core_hours_NVIDIA A100-SXM4-40GB": 42.99894714821998, "core_hours": 42.99894714821998} {"step": 107700, "global_schedule": 0.005626052618026733, "l2_grads": 2.870065212249756, "l2_params": 238.11663818359375, "l2_updates": 0.00609062472358346, "train/loss": 1.5200761556625366, "uptime": 19808.15262906, "examples_seen": 110284800.0, "progress": 0.9564576432244256, "epoch": 86.08151786613298, "img/sec/core": 725.3719059370302, "core_hours_NVIDIA A100-SXM4-40GB": 43.018553948684435, "core_hours": 43.018553948684435} {"step": 107750, "global_schedule": 0.005512118339538574, "l2_grads": 2.8402087688446045, "l2_params": 238.11306762695312, "l2_updates": 0.006040729582309723, "train/loss": 1.3650128841400146, "uptime": 19817.391821514, "examples_seen": 110336000.0, "progress": 0.9569016811275011, "epoch": 86.12148143060195, "img/sec/core": 692.7012324791956, "core_hours_NVIDIA A100-SXM4-40GB": 43.0390854874711, "core_hours": 43.0390854874711} {"step": 107800, "global_schedule": 0.005399346351623535, "l2_grads": 2.5211973190307617, "l2_params": 238.1087646484375, "l2_updates": 0.0058682686649262905, "train/loss": 2.5241358280181885, "uptime": 19826.558917964, "examples_seen": 110387200.0, "progress": 0.9573457190305764, "epoch": 86.1614449950709, "img/sec/core": 698.1490851448348, "core_hours_NVIDIA A100-SXM4-40GB": 43.05945681291554, "core_hours": 43.05945681291554} {"step": 107850, "global_schedule": 0.005287736654281616, "l2_grads": 2.8283486366271973, "l2_params": 238.10549926757812, "l2_updates": 0.005610044114291668, "train/loss": 1.3736071586608887, "uptime": 19835.687439954003, "examples_seen": 110438400.0, "progress": 0.9577897569336519, "epoch": 86.20140855953986, "img/sec/core": 701.0992586762304, "core_hours_NVIDIA A100-SXM4-40GB": 43.07974241733777, "core_hours": 43.07974241733777} {"step": 107900, "global_schedule": 0.005177289247512817, "l2_grads": 3.034830331802368, "l2_params": 238.1022186279297, "l2_updates": 0.005548819899559021, "train/loss": 1.3345427513122559, "uptime": 19845.179327697, "examples_seen": 110489600.0, "progress": 0.9582337948367272, "epoch": 86.24137212400882, "img/sec/core": 674.2599758114953, "core_hours_NVIDIA A100-SXM4-40GB": 43.1008355012111, "core_hours": 43.1008355012111} {"step": 107950, "global_schedule": 0.005068004131317139, "l2_grads": 3.0706989765167236, "l2_params": 238.09890747070312, "l2_updates": 0.005441558081656694, "train/loss": 3.611124277114868, "uptime": 19853.798111718002, "examples_seen": 110540800.0, "progress": 0.9586778327398027, "epoch": 86.28133568847777, "img/sec/core": 742.5641464510315, "core_hours_NVIDIA A100-SXM4-40GB": 43.1199883545911, "core_hours": 43.1199883545911} {"step": 108000, "global_schedule": 0.00495988130569458, "l2_grads": 2.864617347717285, "l2_params": 238.0957794189453, "l2_updates": 0.005332397297024727, "train/loss": 1.377148151397705, "uptime": 19862.490044232, "examples_seen": 110592000.0, "progress": 0.9591218706428781, "epoch": 86.32129925294673, "img/sec/core": 736.3149667454398, "core_hours_NVIDIA A100-SXM4-40GB": 43.13930376017777, "core_hours": 43.13930376017777} {"step": 108050, "global_schedule": 0.004852920770645142, "l2_grads": 2.6541624069213867, "l2_params": 238.0926055908203, "l2_updates": 0.005218322854489088, "train/loss": 2.8510942459106445, "uptime": 19871.79479339, "examples_seen": 110643200.0, "progress": 0.9595659085459535, "epoch": 86.36126281741568, "img/sec/core": 742.7460752814624, "core_hours_NVIDIA A100-SXM4-40GB": 43.158451922242214, "core_hours": 43.158451922242214} {"step": 108100, "global_schedule": 0.0047470927238464355, "l2_grads": 2.586367607116699, "l2_params": 238.08956909179688, "l2_updates": 0.005073509644716978, "train/loss": 2.4148623943328857, "uptime": 19881.101361117, "examples_seen": 110694400.0, "progress": 0.9600099464490289, "epoch": 86.40122638188464, "img/sec/core": 687.6863939251542, "core_hours_NVIDIA A100-SXM4-40GB": 43.179133183857765, "core_hours": 43.179133183857765} {"step": 108150, "global_schedule": 0.00464242696762085, "l2_grads": 2.807176351547241, "l2_params": 238.08641052246094, "l2_updates": 0.004932005889713764, "train/loss": 2.8451080322265625, "uptime": 19889.784849543, "examples_seen": 110745600.0, "progress": 0.9604539843521043, "epoch": 86.4411899463536, "img/sec/core": 737.0309817927639, "core_hours_NVIDIA A100-SXM4-40GB": 43.19842982480443, "core_hours": 43.19842982480443} {"step": 108200, "global_schedule": 0.0045389533042907715, "l2_grads": 2.823798656463623, "l2_params": 238.08326721191406, "l2_updates": 0.004942947532981634, "train/loss": 1.4767346382141113, "uptime": 19898.329860441998, "examples_seen": 110796800.0, "progress": 0.9608980222551797, "epoch": 86.48115351082255, "img/sec/core": 748.9750540573795, "core_hours_NVIDIA A100-SXM4-40GB": 43.21741873791333, "core_hours": 43.21741873791333} {"step": 108250, "global_schedule": 0.0044366419315338135, "l2_grads": 2.782282829284668, "l2_params": 238.08055114746094, "l2_updates": 0.004708117805421352, "train/loss": 1.3435146808624268, "uptime": 19907.384780671004, "examples_seen": 110848000.0, "progress": 0.9613420601582551, "epoch": 86.52111707529151, "img/sec/core": 706.7980543330825, "core_hours_NVIDIA A100-SXM4-40GB": 43.23754078286666, "core_hours": 43.23754078286666} {"step": 108300, "global_schedule": 0.004335463047027588, "l2_grads": 2.7188658714294434, "l2_params": 238.0777130126953, "l2_updates": 0.004682980943471193, "train/loss": 1.5386431217193604, "uptime": 19916.022258436, "examples_seen": 110899200.0, "progress": 0.9617860980613305, "epoch": 86.56108063976046, "img/sec/core": 740.9570448835133, "core_hours_NVIDIA A100-SXM4-40GB": 43.256735177899984, "core_hours": 43.256735177899984} {"step": 108350, "global_schedule": 0.00423547625541687, "l2_grads": 2.7135632038116455, "l2_params": 238.07470703125, "l2_updates": 0.004520003218203783, "train/loss": 2.438082456588745, "uptime": 19924.623796740998, "examples_seen": 110950400.0, "progress": 0.9622301359644059, "epoch": 86.60104420422942, "img/sec/core": 744.0529557695334, "core_hours_NVIDIA A100-SXM4-40GB": 43.275849707466655, "core_hours": 43.275849707466655} {"step": 108400, "global_schedule": 0.004136621952056885, "l2_grads": 2.686593532562256, "l2_params": 238.07200622558594, "l2_updates": 0.004408719949424267, "train/loss": 1.6692806482315063, "uptime": 19933.249626921002, "examples_seen": 111001600.0, "progress": 0.9626741738674813, "epoch": 86.64100776869839, "img/sec/core": 741.957570047991, "core_hours_NVIDIA A100-SXM4-40GB": 43.29501821897777, "core_hours": 43.29501821897777} {"step": 108450, "global_schedule": 0.0040389299392700195, "l2_grads": 2.6136577129364014, "l2_params": 238.06932067871094, "l2_updates": 0.004300007130950689, "train/loss": 2.4025490283966064, "uptime": 19942.136610101, "examples_seen": 111052800.0, "progress": 0.9631182117705568, "epoch": 86.68097133316734, "img/sec/core": 720.1543955211835, "core_hours_NVIDIA A100-SXM4-40GB": 43.31476707048888, "core_hours": 43.31476707048888} {"step": 108500, "global_schedule": 0.003942400217056274, "l2_grads": 2.7471439838409424, "l2_params": 238.06675720214844, "l2_updates": 0.004246164578944445, "train/loss": 1.6011652946472168, "uptime": 19951.170410525003, "examples_seen": 111104000.0, "progress": 0.9635622496736321, "epoch": 86.7209348976363, "img/sec/core": 708.450452701726, "core_hours_NVIDIA A100-SXM4-40GB": 43.33484218254221, "core_hours": 43.33484218254221} {"step": 108550, "global_schedule": 0.003847062587738037, "l2_grads": 2.603985548019409, "l2_params": 238.0643310546875, "l2_updates": 0.004123017657548189, "train/loss": 2.426957368850708, "uptime": 19959.901368051003, "examples_seen": 111155200.0, "progress": 0.9640062875767076, "epoch": 86.76089846210525, "img/sec/core": 733.0238385584818, "core_hours_NVIDIA A100-SXM4-40GB": 43.35424431037777, "core_hours": 43.35424431037777} {"step": 108600, "global_schedule": 0.0037528574466705322, "l2_grads": 2.772081136703491, "l2_params": 238.0619354248047, "l2_updates": 0.0039869993925094604, "train/loss": 3.136518716812134, "uptime": 19968.802578119998, "examples_seen": 111206400.0, "progress": 0.9644503254797829, "epoch": 86.80086202657421, "img/sec/core": 719.0033658783782, "core_hours_NVIDIA A100-SXM4-40GB": 43.37402477719777, "core_hours": 43.37402477719777} {"step": 108650, "global_schedule": 0.003659844398498535, "l2_grads": 2.607621431350708, "l2_params": 238.05975341796875, "l2_updates": 0.003951307851821184, "train/loss": 1.697824478149414, "uptime": 19977.383772054003, "examples_seen": 111257600.0, "progress": 0.9648943633828584, "epoch": 86.84082559104317, "img/sec/core": 745.8169631431803, "core_hours_NVIDIA A100-SXM4-40GB": 43.3930940970511, "core_hours": 43.3930940970511} {"step": 108700, "global_schedule": 0.0035679638385772705, "l2_grads": 2.910768985748291, "l2_params": 238.05728149414062, "l2_updates": 0.003839915618300438, "train/loss": 3.4345099925994873, "uptime": 19986.076765627004, "examples_seen": 111308800.0, "progress": 0.9653384012859337, "epoch": 86.88078915551212, "img/sec/core": 736.2250928009158, "core_hours_NVIDIA A100-SXM4-40GB": 43.412411860546655, "core_hours": 43.412411860546655} {"step": 108750, "global_schedule": 0.0034772753715515137, "l2_grads": 2.9970715045928955, "l2_params": 238.05491638183594, "l2_updates": 0.003805851098150015, "train/loss": 1.493955373764038, "uptime": 19994.825926119003, "examples_seen": 111360000.0, "progress": 0.9657824391890092, "epoch": 86.92075271998108, "img/sec/core": 731.4987541778721, "core_hours_NVIDIA A100-SXM4-40GB": 43.43185443941777, "core_hours": 43.43185443941777} {"step": 108800, "global_schedule": 0.0033877193927764893, "l2_grads": 2.9543511867523193, "l2_params": 238.05264282226562, "l2_updates": 0.0036713036242872477, "train/loss": 1.4344666004180908, "uptime": 20003.859594882, "examples_seen": 111411200.0, "progress": 0.9662264770920845, "epoch": 86.96071628445004, "img/sec/core": 708.4607779967116, "core_hours_NVIDIA A100-SXM4-40GB": 43.451929258891106, "core_hours": 43.451929258891106} {"step": 108850, "global_schedule": 0.0032993555068969727, "l2_grads": 2.7860708236694336, "l2_params": 238.05052185058594, "l2_updates": 0.0034994708839803934, "train/loss": 1.8539118766784668, "uptime": 20013.595424237, "examples_seen": 111462400.0, "progress": 0.96667051499516, "epoch": 87.00067984891899, "img/sec/core": 657.365671339958, "core_hours_NVIDIA A100-SXM4-40GB": 43.473564435235545, "core_hours": 43.473564435235545} {"step": 108900, "global_schedule": 0.003212153911590576, "l2_grads": 3.0272321701049805, "l2_params": 238.0482940673828, "l2_updates": 0.003465640125796199, "train/loss": 3.6625986099243164, "uptime": 20022.479764604002, "examples_seen": 111513600.0, "progress": 0.9671145528982354, "epoch": 87.04064341338795, "img/sec/core": 720.3686188985164, "core_hours_NVIDIA A100-SXM4-40GB": 43.49330741382888, "core_hours": 43.49330741382888} {"step": 108950, "global_schedule": 0.003126084804534912, "l2_grads": 2.713505983352661, "l2_params": 238.04623413085938, "l2_updates": 0.0033609680831432343, "train/loss": 1.4063589572906494, "uptime": 20031.209302465002, "examples_seen": 111564800.0, "progress": 0.9675585908013108, "epoch": 87.0806069778569, "img/sec/core": 733.1430485676452, "core_hours_NVIDIA A100-SXM4-40GB": 43.512706386853324, "core_hours": 43.512706386853324} {"step": 109000, "global_schedule": 0.003041207790374756, "l2_grads": 2.829843759536743, "l2_params": 238.04403686523438, "l2_updates": 0.0032498319633305073, "train/loss": 1.3188533782958984, "uptime": 20040.321744105, "examples_seen": 111616000.0, "progress": 0.9680026287043862, "epoch": 87.12057054232586, "img/sec/core": 702.3364596273949, "core_hours_NVIDIA A100-SXM4-40GB": 43.532956257164436, "core_hours": 43.532956257164436} {"step": 109050, "global_schedule": 0.0029575228691101074, "l2_grads": 3.0946052074432373, "l2_params": 238.0420684814453, "l2_updates": 0.003144014161080122, "train/loss": 1.4743911027908325, "uptime": 20050.126017412003, "examples_seen": 111667200.0, "progress": 0.9684466666074616, "epoch": 87.16053410679483, "img/sec/core": 750.3543222644804, "core_hours_NVIDIA A100-SXM4-40GB": 43.5519102656911, "core_hours": 43.5519102656911} {"step": 109100, "global_schedule": 0.0028749704360961914, "l2_grads": 2.8792378902435303, "l2_params": 238.03990173339844, "l2_updates": 0.00302872178144753, "train/loss": 1.727075457572937, "uptime": 20058.96591421, "examples_seen": 111718400.0, "progress": 0.968890704510537, "epoch": 87.20049767126378, "img/sec/core": 723.9903526304207, "core_hours_NVIDIA A100-SXM4-40GB": 43.57155448079777, "core_hours": 43.57155448079777} {"step": 109150, "global_schedule": 0.002793550491333008, "l2_grads": 2.709507703781128, "l2_params": 238.03817749023438, "l2_updates": 0.003087766468524933, "train/loss": 1.3268550634384155, "uptime": 20068.710225251998, "examples_seen": 111769600.0, "progress": 0.9693347424136124, "epoch": 87.24046123573274, "img/sec/core": 656.793484158635, "core_hours_NVIDIA A100-SXM4-40GB": 43.59320850533554, "core_hours": 43.59320850533554} {"step": 109200, "global_schedule": 0.0027133524417877197, "l2_grads": 2.7793469429016113, "l2_params": 238.0362548828125, "l2_updates": 0.0029263868927955627, "train/loss": 1.5984312295913696, "uptime": 20078.595760937, "examples_seen": 111820800.0, "progress": 0.9697787803166878, "epoch": 87.28042480020169, "img/sec/core": 647.4105404031071, "core_hours_NVIDIA A100-SXM4-40GB": 43.61517636241332, "core_hours": 43.61517636241332} {"step": 109250, "global_schedule": 0.002634286880493164, "l2_grads": 2.986891746520996, "l2_params": 238.03443908691406, "l2_updates": 0.0028353717643767595, "train/loss": 3.5802900791168213, "uptime": 20087.435799657003, "examples_seen": 111872000.0, "progress": 0.9702228182197632, "epoch": 87.32038836467065, "img/sec/core": 723.9787293599917, "core_hours_NVIDIA A100-SXM4-40GB": 43.63482089290221, "core_hours": 43.63482089290221} {"step": 109300, "global_schedule": 0.002556413412094116, "l2_grads": 2.692692995071411, "l2_params": 238.03256225585938, "l2_updates": 0.0027297423221170902, "train/loss": 2.5701255798339844, "uptime": 20096.381830119004, "examples_seen": 111923200.0, "progress": 0.9706668561228387, "epoch": 87.36035192913961, "img/sec/core": 715.4010962945841, "core_hours_NVIDIA A100-SXM4-40GB": 43.65470096059555, "core_hours": 43.65470096059555} {"step": 109350, "global_schedule": 0.0024796724319458008, "l2_grads": 2.5914900302886963, "l2_params": 238.0309600830078, "l2_updates": 0.0026977446395903826, "train/loss": 2.3530375957489014, "uptime": 20106.136918873002, "examples_seen": 111974400.0, "progress": 0.9711108940259141, "epoch": 87.40031549360856, "img/sec/core": 656.0678391959127, "core_hours_NVIDIA A100-SXM4-40GB": 43.67637893560444, "core_hours": 43.67637893560444} {"step": 109400, "global_schedule": 0.002404123544692993, "l2_grads": 2.685081720352173, "l2_params": 238.0294189453125, "l2_updates": 0.0025987711269408464, "train/loss": 1.341286301612854, "uptime": 20115.696851202003, "examples_seen": 112025600.0, "progress": 0.9715549319289895, "epoch": 87.44027905807752, "img/sec/core": 669.4608057616839, "core_hours_NVIDIA A100-SXM4-40GB": 43.697623229668885, "core_hours": 43.697623229668885} {"step": 109450, "global_schedule": 0.0023297369480133057, "l2_grads": 2.7223329544067383, "l2_params": 238.0277862548828, "l2_updates": 0.0025195875205099583, "train/loss": 1.485021710395813, "uptime": 20124.887861795003, "examples_seen": 112076800.0, "progress": 0.9719989698320649, "epoch": 87.48024262254647, "img/sec/core": 696.3325670491837, "core_hours_NVIDIA A100-SXM4-40GB": 43.718047697653326, "core_hours": 43.718047697653326} {"step": 109500, "global_schedule": 0.0022565126419067383, "l2_grads": 2.609208345413208, "l2_params": 238.02627563476562, "l2_updates": 0.002412523375824094, "train/loss": 2.263078451156616, "uptime": 20133.764176534998, "examples_seen": 112128000.0, "progress": 0.9724430077351403, "epoch": 87.52020618701543, "img/sec/core": 721.0199488713697, "core_hours_NVIDIA A100-SXM4-40GB": 43.73777284151999, "core_hours": 43.73777284151999} {"step": 109550, "global_schedule": 0.002184450626373291, "l2_grads": 2.77590012550354, "l2_params": 238.02474975585938, "l2_updates": 0.0023655863478779793, "train/loss": 1.980785608291626, "uptime": 20142.624892941, "examples_seen": 112179200.0, "progress": 0.9728870456382157, "epoch": 87.5601697514844, "img/sec/core": 722.2892265985766, "core_hours_NVIDIA A100-SXM4-40GB": 43.75746332242222, "core_hours": 43.75746332242222} {"step": 109600, "global_schedule": 0.002113550901412964, "l2_grads": 2.7053966522216797, "l2_params": 238.0233917236328, "l2_updates": 0.002246609190478921, "train/loss": 2.6422271728515625, "uptime": 20151.244952367, "examples_seen": 112230400.0, "progress": 0.973331083541291, "epoch": 87.60013331595334, "img/sec/core": 742.4542782959928, "core_hours_NVIDIA A100-SXM4-40GB": 43.77661901003555, "core_hours": 43.77661901003555} {"step": 109650, "global_schedule": 0.0020438432693481445, "l2_grads": 2.8290817737579346, "l2_params": 238.02191162109375, "l2_updates": 0.0022122713271528482, "train/loss": 1.3613131046295166, "uptime": 20159.956903864004, "examples_seen": 112281600.0, "progress": 0.9737751214443665, "epoch": 87.6400968804223, "img/sec/core": 734.623006361306, "core_hours_NVIDIA A100-SXM4-40GB": 43.79597890225111, "core_hours": 43.79597890225111} {"step": 109700, "global_schedule": 0.0019752681255340576, "l2_grads": 2.7096638679504395, "l2_params": 238.02056884765625, "l2_updates": 0.002116147195920348, "train/loss": 1.7465077638626099, "uptime": 20169.590956602, "examples_seen": 112332800.0, "progress": 0.9742191593474419, "epoch": 87.68006044489125, "img/sec/core": 664.310251775719, "core_hours_NVIDIA A100-SXM4-40GB": 43.81738790833554, "core_hours": 43.81738790833554} {"step": 109750, "global_schedule": 0.0019078850746154785, "l2_grads": 2.6888513565063477, "l2_params": 238.01922607421875, "l2_updates": 0.0020559204276651144, "train/loss": 1.6595323085784912, "uptime": 20178.925107568997, "examples_seen": 112384000.0, "progress": 0.9746631972505173, "epoch": 87.72002400936022, "img/sec/core": 685.6542199314401, "core_hours_NVIDIA A100-SXM4-40GB": 43.838130466039985, "core_hours": 43.838130466039985} {"step": 109800, "global_schedule": 0.0018416643142700195, "l2_grads": 2.9162886142730713, "l2_params": 238.0179901123047, "l2_updates": 0.0020054613705724478, "train/loss": 1.5122895240783691, "uptime": 20187.385668791, "examples_seen": 112435200.0, "progress": 0.9751072351535927, "epoch": 87.75998757382918, "img/sec/core": 756.4510003612867, "core_hours_NVIDIA A100-SXM4-40GB": 43.856931713199984, "core_hours": 43.856931713199984} {"step": 109850, "global_schedule": 0.0017766058444976807, "l2_grads": 2.7320332527160645, "l2_params": 238.0167694091797, "l2_updates": 0.001882375916466117, "train/loss": 2.090301275253296, "uptime": 20195.989729952, "examples_seen": 112486400.0, "progress": 0.9755512730566681, "epoch": 87.79995113829813, "img/sec/core": 743.8347868805408, "core_hours_NVIDIA A100-SXM4-40GB": 43.876051849113324, "core_hours": 43.876051849113324} {"step": 109900, "global_schedule": 0.001712709665298462, "l2_grads": 2.7231311798095703, "l2_params": 238.01564025878906, "l2_updates": 0.001859211130067706, "train/loss": 1.5780795812606812, "uptime": 20204.648153513997, "examples_seen": 112537600.0, "progress": 0.9759953109597436, "epoch": 87.83991470276709, "img/sec/core": 739.1645781905056, "core_hours_NVIDIA A100-SXM4-40GB": 43.89529279036221, "core_hours": 43.89529279036221} {"step": 109950, "global_schedule": 0.0016499757766723633, "l2_grads": 2.9545021057128906, "l2_params": 238.01454162597656, "l2_updates": 0.001776372198946774, "train/loss": 1.395416498184204, "uptime": 20213.724647862, "examples_seen": 112588800.0, "progress": 0.9764393488628189, "epoch": 87.87987826723604, "img/sec/core": 705.1180504958288, "core_hours_NVIDIA A100-SXM4-40GB": 43.91546277780221, "core_hours": 43.91546277780221} {"step": 110000, "global_schedule": 0.0015884339809417725, "l2_grads": 2.7746474742889404, "l2_params": 238.0134735107422, "l2_updates": 0.0017023703549057245, "train/loss": 1.5642262697219849, "uptime": 20222.260147246, "examples_seen": 112640000.0, "progress": 0.9768833867658944, "epoch": 87.919841831705, "img/sec/core": 749.8096727648908, "core_hours_NVIDIA A100-SXM4-40GB": 43.9344305542111, "core_hours": 43.9344305542111, "val/acc@1": 0.7685, "val/loss": 0.9228044128417969, "z/secs/eval/val": 2.5782502119982382} {"step": 110050, "global_schedule": 0.0015280544757843018, "l2_grads": 3.0112721920013428, "l2_params": 238.01260375976562, "l2_updates": 0.0016307560727000237, "train/loss": 3.5637171268463135, "uptime": 20233.94039777, "examples_seen": 112691200.0, "progress": 0.9773274246689697, "epoch": 87.95980539617396, "img/sec/core": 762.8138753082978, "core_hours_NVIDIA A100-SXM4-40GB": 43.953074974144435, "core_hours": 43.953074974144435} {"step": 110100, "global_schedule": 0.0014688372611999512, "l2_grads": 2.7310235500335693, "l2_params": 238.0115966796875, "l2_updates": 0.0015915624098852277, "train/loss": 1.9270830154418945, "uptime": 20242.718798226997, "examples_seen": 112742400.0, "progress": 0.9777714625720452, "epoch": 87.99976896064291, "img/sec/core": 729.0622057344923, "core_hours_NVIDIA A100-SXM4-40GB": 43.97258253071554, "core_hours": 43.97258253071554} {"step": 110150, "global_schedule": 0.0014107823371887207, "l2_grads": 2.9417262077331543, "l2_params": 238.0107879638672, "l2_updates": 0.0015206357929855585, "train/loss": 3.7501349449157715, "uptime": 20251.883485566002, "examples_seen": 112793600.0, "progress": 0.9782155004751205, "epoch": 88.03973252511187, "img/sec/core": 698.3326068052262, "core_hours_NVIDIA A100-SXM4-40GB": 43.99294850257999, "core_hours": 43.99294850257999} {"step": 110200, "global_schedule": 0.001353919506072998, "l2_grads": 2.7722089290618896, "l2_params": 238.0099639892578, "l2_updates": 0.0014654680853709579, "train/loss": 1.5319637060165405, "uptime": 20261.092819669, "examples_seen": 112844800.0, "progress": 0.978659538378196, "epoch": 88.07969608958082, "img/sec/core": 694.9470969800354, "core_hours_NVIDIA A100-SXM4-40GB": 44.01341368947555, "core_hours": 44.01341368947555} {"step": 110250, "global_schedule": 0.0012982189655303955, "l2_grads": 2.901432514190674, "l2_params": 238.0090789794922, "l2_updates": 0.0014018418733030558, "train/loss": 3.5575246810913086, "uptime": 20270.297202841, "examples_seen": 112896000.0, "progress": 0.9791035762812713, "epoch": 88.11965965404978, "img/sec/core": 695.3209009669243, "core_hours_NVIDIA A100-SXM4-40GB": 44.03386787430222, "core_hours": 44.03386787430222} {"step": 110300, "global_schedule": 0.001243680715560913, "l2_grads": 2.740980625152588, "l2_params": 238.00823974609375, "l2_updates": 0.0013560398947447538, "train/loss": 1.4284753799438477, "uptime": 20278.883050978002, "examples_seen": 112947200.0, "progress": 0.9795476141843468, "epoch": 88.15962321851875, "img/sec/core": 745.4126718618936, "core_hours_NVIDIA A100-SXM4-40GB": 44.05294753682888, "core_hours": 44.05294753682888} {"step": 110350, "global_schedule": 0.0011903047561645508, "l2_grads": 2.7834177017211914, "l2_params": 238.0074005126953, "l2_updates": 0.0012832446955144405, "train/loss": 1.844527006149292, "uptime": 20287.400002216003, "examples_seen": 112998400.0, "progress": 0.9799916520874222, "epoch": 88.1995867829877, "img/sec/core": 751.4426020714959, "core_hours_NVIDIA A100-SXM4-40GB": 44.07187409513555, "core_hours": 44.07187409513555} {"step": 110400, "global_schedule": 0.0011380910873413086, "l2_grads": 2.897735357284546, "l2_params": 238.006591796875, "l2_updates": 0.0012258507777005434, "train/loss": 1.2761963605880737, "uptime": 20296.21882699, "examples_seen": 113049600.0, "progress": 0.9804356899904976, "epoch": 88.23955034745666, "img/sec/core": 725.7202817850247, "core_hours_NVIDIA A100-SXM4-40GB": 44.09147148352221, "core_hours": 44.09147148352221} {"step": 110450, "global_schedule": 0.0010870695114135742, "l2_grads": 2.621683120727539, "l2_params": 238.00584411621094, "l2_updates": 0.001157248392701149, "train/loss": 2.681203842163086, "uptime": 20305.766339592003, "examples_seen": 113100800.0, "progress": 0.980879727893573, "epoch": 88.2795139119256, "img/sec/core": 670.3316629987879, "core_hours_NVIDIA A100-SXM4-40GB": 44.11268817819332, "core_hours": 44.11268817819332} {"step": 110500, "global_schedule": 0.00103721022605896, "l2_grads": 2.656198024749756, "l2_params": 238.00506591796875, "l2_updates": 0.0011247507063671947, "train/loss": 1.3839696645736694, "uptime": 20314.837145787, "examples_seen": 113152000.0, "progress": 0.9813237657966484, "epoch": 88.31947747639457, "img/sec/core": 705.560218399164, "core_hours_NVIDIA A100-SXM4-40GB": 44.13284552529332, "core_hours": 44.13284552529332} {"step": 110550, "global_schedule": 0.0009885132312774658, "l2_grads": 2.5737998485565186, "l2_params": 238.00430297851562, "l2_updates": 0.0010587810538709164, "train/loss": 2.809889793395996, "uptime": 20323.325344315002, "examples_seen": 113203200.0, "progress": 0.9817678036997238, "epoch": 88.35944104086353, "img/sec/core": 753.9880198239634, "core_hours_NVIDIA A100-SXM4-40GB": 44.15170818868888, "core_hours": 44.15170818868888} {"step": 110600, "global_schedule": 0.0009409785270690918, "l2_grads": 2.916121006011963, "l2_params": 238.00364685058594, "l2_updates": 0.0010244547156617045, "train/loss": 3.573441505432129, "uptime": 20331.822716058, "examples_seen": 113254400.0, "progress": 0.9822118416027992, "epoch": 88.39940460533248, "img/sec/core": 753.1740629415235, "core_hours_NVIDIA A100-SXM4-40GB": 44.170591237006654, "core_hours": 44.170591237006654} {"step": 110650, "global_schedule": 0.0008946359157562256, "l2_grads": 2.950230121612549, "l2_params": 238.00308227539062, "l2_updates": 0.0009680351940914989, "train/loss": 1.4647196531295776, "uptime": 20340.987810427003, "examples_seen": 113305600.0, "progress": 0.9826558795058746, "epoch": 88.43936816980144, "img/sec/core": 698.3015932326075, "core_hours_NVIDIA A100-SXM4-40GB": 44.19095811338221, "core_hours": 44.19095811338221} {"step": 110700, "global_schedule": 0.0008494257926940918, "l2_grads": 2.665379524230957, "l2_params": 238.00257873535156, "l2_updates": 0.0009109828970395029, "train/loss": 2.8064005374908447, "uptime": 20350.588188540998, "examples_seen": 113356800.0, "progress": 0.98309991740895, "epoch": 88.47933173427039, "img/sec/core": 666.640409784254, "core_hours_NVIDIA A100-SXM4-40GB": 44.21229228696888, "core_hours": 44.21229228696888} {"step": 110750, "global_schedule": 0.0008054375648498535, "l2_grads": 2.769979953765869, "l2_params": 238.001953125, "l2_updates": 0.0008653954137116671, "train/loss": 1.7136743068695068, "uptime": 20359.995750215, "examples_seen": 113408000.0, "progress": 0.9835439553120254, "epoch": 88.51929529873935, "img/sec/core": 680.3038047241496, "core_hours_NVIDIA A100-SXM4-40GB": 44.23319797957777, "core_hours": 44.23319797957777} {"step": 110800, "global_schedule": 0.0007625818252563477, "l2_grads": 2.5761306285858154, "l2_params": 238.00143432617188, "l2_updates": 0.0008228436927311122, "train/loss": 2.926661968231201, "uptime": 20369.322511070997, "examples_seen": 113459200.0, "progress": 0.9839879932151009, "epoch": 88.55925886320831, "img/sec/core": 686.1975018780596, "core_hours_NVIDIA A100-SXM4-40GB": 44.25392411481332, "core_hours": 44.25392411481332} {"step": 110850, "global_schedule": 0.0007208883762359619, "l2_grads": 2.861281633377075, "l2_params": 238.00094604492188, "l2_updates": 0.0007755999686196446, "train/loss": 1.4842102527618408, "uptime": 20377.796432536, "examples_seen": 113510400.0, "progress": 0.9844320311181762, "epoch": 88.59922242767726, "img/sec/core": 755.2583566456376, "core_hours_NVIDIA A100-SXM4-40GB": 44.27275505140221, "core_hours": 44.27275505140221} {"step": 110900, "global_schedule": 0.000680387020111084, "l2_grads": 2.9309322834014893, "l2_params": 238.00050354003906, "l2_updates": 0.000737758819013834, "train/loss": 1.4843802452087402, "uptime": 20386.765153624998, "examples_seen": 113561600.0, "progress": 0.9848760690212517, "epoch": 88.63918599214622, "img/sec/core": 713.5911504538889, "core_hours_NVIDIA A100-SXM4-40GB": 44.2926855427111, "core_hours": 44.2926855427111} {"step": 110950, "global_schedule": 0.0006410479545593262, "l2_grads": 2.6458919048309326, "l2_params": 238.0000457763672, "l2_updates": 0.0006843550363555551, "train/loss": 1.887516736984253, "uptime": 20396.190296028, "examples_seen": 113612800.0, "progress": 0.985320106924327, "epoch": 88.67914955661519, "img/sec/core": 679.0348332522126, "core_hours_NVIDIA A100-SXM4-40GB": 44.31363030360665, "core_hours": 44.31363030360665} {"step": 111000, "global_schedule": 0.0006029009819030762, "l2_grads": 2.554394006729126, "l2_params": 237.99961853027344, "l2_updates": 0.0006489804363809526, "train/loss": 2.2528419494628906, "uptime": 20404.796469685003, "examples_seen": 113664000.0, "progress": 0.9857641448274025, "epoch": 88.71911312108413, "img/sec/core": 743.6522030663137, "core_hours_NVIDIA A100-SXM4-40GB": 44.332755133955544, "core_hours": 44.332755133955544} {"step": 111050, "global_schedule": 0.0005658864974975586, "l2_grads": 2.8893280029296875, "l2_params": 237.999267578125, "l2_updates": 0.000618527177721262, "train/loss": 1.4472159147262573, "uptime": 20414.219609058004, "examples_seen": 113715200.0, "progress": 0.9862081827304778, "epoch": 88.7590766855531, "img/sec/core": 731.4882918882136, "core_hours_NVIDIA A100-SXM4-40GB": 44.35219799090888, "core_hours": 44.35219799090888} {"step": 111100, "global_schedule": 0.0005300641059875488, "l2_grads": 2.7239255905151367, "l2_params": 237.9989013671875, "l2_updates": 0.000569729832932353, "train/loss": 1.67803156375885, "uptime": 20422.743301460003, "examples_seen": 113766400.0, "progress": 0.9866522206335533, "epoch": 88.79904025002205, "img/sec/core": 750.8483058936931, "core_hours_NVIDIA A100-SXM4-40GB": 44.37113952957999, "core_hours": 44.37113952957999} {"step": 111150, "global_schedule": 0.0004954338073730469, "l2_grads": 2.5092685222625732, "l2_params": 237.99853515625, "l2_updates": 0.0005318556213751435, "train/loss": 1.5248538255691528, "uptime": 20431.425517870004, "examples_seen": 113817600.0, "progress": 0.9870962585366286, "epoch": 88.83900381449101, "img/sec/core": 737.1389628836793, "core_hours_NVIDIA A100-SXM4-40GB": 44.390433343824434, "core_hours": 44.390433343824434} {"step": 111200, "global_schedule": 0.00046193599700927734, "l2_grads": 2.8934781551361084, "l2_params": 237.9982147216797, "l2_updates": 0.0005046118167228997, "train/loss": 1.398181676864624, "uptime": 20440.774628386003, "examples_seen": 113868800.0, "progress": 0.9875402964397041, "epoch": 88.87896737895997, "img/sec/core": 684.5571018812575, "core_hours_NVIDIA A100-SXM4-40GB": 44.4112091449711, "core_hours": 44.4112091449711} {"step": 111250, "global_schedule": 0.0004296302795410156, "l2_grads": 2.6681466102600098, "l2_params": 237.99794006347656, "l2_updates": 0.0004596800426952541, "train/loss": 3.183121919631958, "uptime": 20449.897222984997, "examples_seen": 113920000.0, "progress": 0.9879843343427795, "epoch": 88.91893094342892, "img/sec/core": 701.5547967793606, "core_hours_NVIDIA A100-SXM4-40GB": 44.43148157741332, "core_hours": 44.43148157741332} {"step": 111300, "global_schedule": 0.000398486852645874, "l2_grads": 2.719865560531616, "l2_params": 237.99766540527344, "l2_updates": 0.00041909230640158057, "train/loss": 2.3340377807617188, "uptime": 20458.653785356997, "examples_seen": 113971200.0, "progress": 0.9884283722458549, "epoch": 88.95889450789788, "img/sec/core": 730.8804218039392, "core_hours_NVIDIA A100-SXM4-40GB": 44.450940604906656, "core_hours": 44.450940604906656} {"step": 111350, "global_schedule": 0.00036850571632385254, "l2_grads": 2.957087516784668, "l2_params": 237.99740600585938, "l2_updates": 0.0003910998348146677, "train/loss": 1.5691378116607666, "uptime": 20468.068719347997, "examples_seen": 114022400.0, "progress": 0.9888724101489303, "epoch": 88.99885807236683, "img/sec/core": 679.7710962305143, "core_hours_NVIDIA A100-SXM4-40GB": 44.47186268044221, "core_hours": 44.47186268044221} {"step": 111400, "global_schedule": 0.00033971667289733887, "l2_grads": 2.744906425476074, "l2_params": 237.99713134765625, "l2_updates": 0.000365428306395188, "train/loss": 1.3429830074310303, "uptime": 20478.261774968, "examples_seen": 114073600.0, "progress": 0.9893164480520057, "epoch": 89.03882163683579, "img/sec/core": 627.8784535856947, "core_hours_NVIDIA A100-SXM4-40GB": 44.49451391515333, "core_hours": 44.49451391515333} {"step": 111450, "global_schedule": 0.0003120899200439453, "l2_grads": 2.795133590698242, "l2_params": 237.9968719482422, "l2_updates": 0.0003377152024768293, "train/loss": 1.3665924072265625, "uptime": 20487.244950428998, "examples_seen": 114124800.0, "progress": 0.9897604859550811, "epoch": 89.07878520130475, "img/sec/core": 712.442947127802, "core_hours_NVIDIA A100-SXM4-40GB": 44.514476527288885, "core_hours": 44.514476527288885} {"step": 111500, "global_schedule": 0.0002856254577636719, "l2_grads": 2.7098162174224854, "l2_params": 237.99673461914062, "l2_updates": 0.0003078803129028529, "train/loss": 1.340589165687561, "uptime": 20496.762686638, "examples_seen": 114176000.0, "progress": 0.9902045238581565, "epoch": 89.1187487657737, "img/sec/core": 672.4288065420685, "core_hours_NVIDIA A100-SXM4-40GB": 44.53562705219777, "core_hours": 44.53562705219777} {"step": 111550, "global_schedule": 0.00026035308837890625, "l2_grads": 2.940264940261841, "l2_params": 237.9965362548828, "l2_updates": 0.00028214085614308715, "train/loss": 1.403396725654602, "uptime": 20506.092661675, "examples_seen": 114227200.0, "progress": 0.990648561761232, "epoch": 89.15871233024266, "img/sec/core": 685.9611065000457, "core_hours_NVIDIA A100-SXM4-40GB": 44.55636033005778, "core_hours": 44.55636033005778} {"step": 111600, "global_schedule": 0.00023624300956726074, "l2_grads": 2.61299467086792, "l2_params": 237.99632263183594, "l2_updates": 0.0002536254469305277, "train/loss": 2.2841362953186035, "uptime": 20515.355896059, "examples_seen": 114278400.0, "progress": 0.9910925996643073, "epoch": 89.19867589471161, "img/sec/core": 690.9033858687626, "core_hours_NVIDIA A100-SXM4-40GB": 44.57694529535555, "core_hours": 44.57694529535555} {"step": 111650, "global_schedule": 0.00021329522132873535, "l2_grads": 2.6504716873168945, "l2_params": 237.9961700439453, "l2_updates": 0.0002325619279872626, "train/loss": 3.149533271789551, "uptime": 20524.840784775, "examples_seen": 114329600.0, "progress": 0.9915366375673828, "epoch": 89.23863945918058, "img/sec/core": 674.757521319517, "core_hours_NVIDIA A100-SXM4-40GB": 44.59802282583554, "core_hours": 44.59802282583554} {"step": 111700, "global_schedule": 0.00019153952598571777, "l2_grads": 2.8363444805145264, "l2_params": 237.9960479736328, "l2_updates": 0.0002084377483697608, "train/loss": 1.4189872741699219, "uptime": 20533.850298526, "examples_seen": 114380800.0, "progress": 0.9919806754704582, "epoch": 89.27860302364954, "img/sec/core": 710.360201102952, "core_hours_NVIDIA A100-SXM4-40GB": 44.61804396750444, "core_hours": 44.61804396750444} {"step": 111750, "global_schedule": 0.00017091631889343262, "l2_grads": 2.655930995941162, "l2_params": 237.99594116210938, "l2_updates": 0.00018458894919604063, "train/loss": 2.3834097385406494, "uptime": 20542.394316141, "examples_seen": 114432000.0, "progress": 0.9924247133735336, "epoch": 89.31856658811849, "img/sec/core": 749.0621260850054, "core_hours_NVIDIA A100-SXM4-40GB": 44.63703067331554, "core_hours": 44.63703067331554} {"step": 111800, "global_schedule": 0.00015148520469665527, "l2_grads": 2.730747938156128, "l2_params": 237.99581909179688, "l2_updates": 0.0001633000938454643, "train/loss": 2.0359249114990234, "uptime": 20551.232404430004, "examples_seen": 114483200.0, "progress": 0.992868751276609, "epoch": 89.35853015258745, "img/sec/core": 724.1385003999637, "core_hours_NVIDIA A100-SXM4-40GB": 44.65667086951333, "core_hours": 44.65667086951333} {"step": 111850, "global_schedule": 0.00013324618339538574, "l2_grads": 3.0196757316589355, "l2_params": 237.99571228027344, "l2_updates": 0.00014396656479220837, "train/loss": 1.5462452173233032, "uptime": 20560.428745182, "examples_seen": 114534400.0, "progress": 0.9933127891796844, "epoch": 89.3984937170564, "img/sec/core": 695.9289757297855, "core_hours_NVIDIA A100-SXM4-40GB": 44.67710718229554, "core_hours": 44.67710718229554} {"step": 111900, "global_schedule": 0.00011616945266723633, "l2_grads": 3.1074182987213135, "l2_params": 237.99560546875, "l2_updates": 0.00012431401410140097, "train/loss": 3.701120376586914, "uptime": 20568.874215648, "examples_seen": 114585600.0, "progress": 0.9937568270827598, "epoch": 89.43845728152536, "img/sec/core": 757.8026618841152, "core_hours_NVIDIA A100-SXM4-40GB": 44.69587489444222, "core_hours": 44.69587489444222} {"step": 111950, "global_schedule": 0.00010025501251220703, "l2_grads": 2.883469820022583, "l2_params": 237.9955291748047, "l2_updates": 0.0001092428938136436, "train/loss": 3.507739782333374, "uptime": 20577.512515554, "examples_seen": 114636800.0, "progress": 0.9942008649858352, "epoch": 89.47842084599432, "img/sec/core": 740.8865250854423, "core_hours_NVIDIA A100-SXM4-40GB": 44.71507111645554, "core_hours": 44.71507111645554} {"step": 112000, "global_schedule": 8.550286293029785e-05, "l2_grads": 2.6601603031158447, "l2_params": 237.9954833984375, "l2_updates": 9.132087870966643e-05, "train/loss": 1.2927377223968506, "uptime": 20586.128875761002, "examples_seen": 114688000.0, "progress": 0.9946449028889106, "epoch": 89.51838441046327, "img/sec/core": 742.7730324922884, "core_hours_NVIDIA A100-SXM4-40GB": 44.73421858358221, "core_hours": 44.73421858358221} {"step": 112050, "global_schedule": 7.194280624389648e-05, "l2_grads": 2.851378917694092, "l2_params": 237.9954376220703, "l2_updates": 7.67975507187657e-05, "train/loss": 3.4482052326202393, "uptime": 20595.313827646998, "examples_seen": 114739200.0, "progress": 0.995088940791986, "epoch": 89.55834797493223, "img/sec/core": 784.9261072358818, "core_hours_NVIDIA A100-SXM4-40GB": 44.75233776969555, "core_hours": 44.75233776969555} {"step": 112100, "global_schedule": 5.9545040130615234e-05, "l2_grads": 2.84551739692688, "l2_params": 237.99539184570312, "l2_updates": 6.478635623352602e-05, "train/loss": 1.4909292459487915, "uptime": 20604.254152948997, "examples_seen": 114790400.0, "progress": 0.9955329786950614, "epoch": 89.59831153940118, "img/sec/core": 715.8576208148626, "core_hours_NVIDIA A100-SXM4-40GB": 44.77220515925555, "core_hours": 44.77220515925555} {"step": 112150, "global_schedule": 4.83095645904541e-05, "l2_grads": 2.5961854457855225, "l2_params": 237.99534606933594, "l2_updates": 5.166431947145611e-05, "train/loss": 2.1077685356140137, "uptime": 20612.936714473, "examples_seen": 114841600.0, "progress": 0.9959770165981369, "epoch": 89.63827510387014, "img/sec/core": 737.1096631228431, "core_hours_NVIDIA A100-SXM4-40GB": 44.791499740419994, "core_hours": 44.791499740419994} {"step": 112200, "global_schedule": 3.826618194580078e-05, "l2_grads": 2.734973669052124, "l2_params": 237.9953155517578, "l2_updates": 4.0884286136133596e-05, "train/loss": 2.4539315700531006, "uptime": 20621.355107290998, "examples_seen": 114892800.0, "progress": 0.9964210545012122, "epoch": 89.6782386683391, "img/sec/core": 760.2401240194383, "core_hours_NVIDIA A100-SXM4-40GB": 44.81020728001555, "core_hours": 44.81020728001555} {"step": 112250, "global_schedule": 2.9385089874267578e-05, "l2_grads": 2.5033202171325684, "l2_params": 237.99530029296875, "l2_updates": 3.178811675752513e-05, "train/loss": 2.242250442504883, "uptime": 20630.691286317, "examples_seen": 114944000.0, "progress": 0.9968650924042877, "epoch": 89.71820223280805, "img/sec/core": 685.5052781416517, "core_hours_NVIDIA A100-SXM4-40GB": 44.83095434451777, "core_hours": 44.83095434451777} {"step": 112300, "global_schedule": 2.1666288375854492e-05, "l2_grads": 2.949913740158081, "l2_params": 237.99526977539062, "l2_updates": 2.3356422389042564e-05, "train/loss": 3.620847225189209, "uptime": 20639.421922183, "examples_seen": 114995200.0, "progress": 0.997309130307363, "epoch": 89.75816579727702, "img/sec/core": 733.050845119371, "core_hours_NVIDIA A100-SXM4-40GB": 44.850355757553324, "core_hours": 44.850355757553324} {"step": 112350, "global_schedule": 1.5109777450561523e-05, "l2_grads": 2.8595128059387207, "l2_params": 237.99525451660156, "l2_updates": 1.6379943190258928e-05, "train/loss": 1.406538486480713, "uptime": 20648.571340616, "examples_seen": 115046400.0, "progress": 0.9977531682104385, "epoch": 89.79812936174596, "img/sec/core": 699.4980114710123, "core_hours_NVIDIA A100-SXM4-40GB": 44.87068779851555, "core_hours": 44.87068779851555} {"step": 112400, "global_schedule": 9.745359420776367e-06, "l2_grads": 2.8042728900909424, "l2_params": 237.99525451660156, "l2_updates": 1.0468840628163889e-05, "train/loss": 1.6582810878753662, "uptime": 20657.384042965, "examples_seen": 115097600.0, "progress": 0.9981972061135138, "epoch": 89.83809292621493, "img/sec/core": 726.2244594846426, "core_hours_NVIDIA A100-SXM4-40GB": 44.89027158151332, "core_hours": 44.89027158151332} {"step": 112450, "global_schedule": 5.5730342864990234e-06, "l2_grads": 2.7977235317230225, "l2_params": 237.99520874023438, "l2_updates": 5.9844842326128855e-06, "train/loss": 1.585754156112671, "uptime": 20666.707624671, "examples_seen": 115148800.0, "progress": 0.9986412440165893, "epoch": 89.87805649068389, "img/sec/core": 686.4314811421167, "core_hours_NVIDIA A100-SXM4-40GB": 44.910990651971105, "core_hours": 44.910990651971105} {"step": 112500, "global_schedule": 2.5331974029541016e-06, "l2_grads": 2.8503425121307373, "l2_params": 237.99520874023438, "l2_updates": 2.739778210525401e-06, "train/loss": 1.308261752128601, "uptime": 20675.631419598, "examples_seen": 115200000.0, "progress": 0.9990852819196646, "epoch": 89.91802005515284, "img/sec/core": 717.183670440104, "core_hours_NVIDIA A100-SXM4-40GB": 44.93082130736443, "core_hours": 44.93082130736443} {"step": 112550, "global_schedule": 6.854534149169922e-07, "l2_grads": 2.5085790157318115, "l2_params": 237.99520874023438, "l2_updates": 7.338149998759036e-07, "train/loss": 2.3447089195251465, "uptime": 20684.749238199, "examples_seen": 115251200.0, "progress": 0.9995293198227401, "epoch": 89.9579836196218, "img/sec/core": 701.9222776923804, "core_hours_NVIDIA A100-SXM4-40GB": 44.95108312647777, "core_hours": 44.95108312647777} {"step": 112603, "global_schedule": 0.0, "l2_grads": 2.6730122566223145, "l2_params": 237.99520874023438, "l2_updates": 0.0, "train/loss": 1.9165900945663452, "uptime": 20695.194294736, "examples_seen": 115305472.0, "progress": 1.0, "epoch": 90.00034499795889, "img/sec/core": 649.4938515619408, "core_hours_NVIDIA A100-SXM4-40GB": 44.97429436322666, "core_hours": 44.97429436322666, "val/acc@1": 0.76852, "val/loss": 0.9222128649902344, "z/secs/eval/val": 2.6359426800008805} {"step": 112603, "global_schedule": 0.0, "l2_grads": 2.6730122566223145, "l2_params": 237.99520874023438, "l2_updates": 0.0, "train/loss": 1.9165900945663452, "uptime": 20695.194294736, "examples_seen": 115305472.0, "progress": 1.0, "epoch": 90.00034499795889, "img/sec/core": 649.4938515619408, "core_hours_NVIDIA A100-SXM4-40GB": 44.97429436322666, "core_hours": 44.97429436322666, "val/acc@1": 0.76852, "val/loss": 0.9222128649902344, "z/secs/eval/val": 2.6359426800008805}