ZH-GPT-small / metrics.json
xiulinyang's picture
Adding model checkpoints and config files
20c7fc9
{"num_parameters": 102068736, "trainable_parameters": 102068736, "step": 0}
{"train_info/time_between_train_steps": 3.9748432636260986, "step": 0}
{"info/global_step": 1, "train_info/time_within_train_step": 25.29767894744873, "step": 1}
{"train_info": {"train_info/memory_allocated": 1581.5546875, "train_info/memory_max_allocated": 17273.5732421875, "train_info/memory_reserved": 18442.0, "train_info/memory_max_reserved": 18442.0, "_timestamp": 1740920122, "_runtime": 33}, "step": 1}
{"logs": {"train/loss": 10.1251, "train/learning_rate": 4.9999999999999996e-06, "train/epoch": 0.0, "_timestamp": 1740920122, "_runtime": 33}, "step": 1}
{"train_info/time_between_train_steps": 0.015340805053710938, "step": 1}
{"info/global_step": 2, "train_info/time_within_train_step": 25.099069356918335, "step": 2}
{"train_info/time_between_train_steps": 0.005385160446166992, "step": 2}
{"info/global_step": 3, "train_info/time_within_train_step": 24.812320232391357, "step": 3}
{"train_info/time_between_train_steps": 0.005757570266723633, "step": 3}
{"info/global_step": 4, "train_info/time_within_train_step": 24.960580825805664, "step": 4}
{"train_info/time_between_train_steps": 0.005323648452758789, "step": 4}
{"info/global_step": 5, "train_info/time_within_train_step": 24.808937788009644, "step": 5}
{"train_info/time_between_train_steps": 0.007637500762939453, "step": 5}
{"info/global_step": 6, "train_info/time_within_train_step": 24.941815614700317, "step": 6}
{"train_info/time_between_train_steps": 0.005566835403442383, "step": 6}
{"info/global_step": 7, "train_info/time_within_train_step": 24.81364941596985, "step": 7}
{"train_info/time_between_train_steps": 0.005424022674560547, "step": 7}
{"info/global_step": 8, "train_info/time_within_train_step": 24.93263554573059, "step": 8}
{"train_info/time_between_train_steps": 0.005368232727050781, "step": 8}
{"info/global_step": 9, "train_info/time_within_train_step": 24.818796396255493, "step": 9}
{"train_info/time_between_train_steps": 0.005715608596801758, "step": 9}
{"info/global_step": 10, "train_info/time_within_train_step": 24.928115606307983, "step": 10}
{"train_info/time_between_train_steps": 0.005578279495239258, "step": 10}
{"info/global_step": 11, "train_info/time_within_train_step": 24.846867561340332, "step": 11}
{"train_info/time_between_train_steps": 0.005870819091796875, "step": 11}
{"info/global_step": 12, "train_info/time_within_train_step": 25.11908769607544, "step": 12}
{"train_info/time_between_train_steps": 0.005486965179443359, "step": 12}
{"info/global_step": 13, "train_info/time_within_train_step": 24.99142837524414, "step": 13}
{"train_info/time_between_train_steps": 0.005359649658203125, "step": 13}
{"info/global_step": 14, "train_info/time_within_train_step": 24.89536213874817, "step": 14}
{"train_info/time_between_train_steps": 0.006455659866333008, "step": 14}
{"info/global_step": 15, "train_info/time_within_train_step": 24.82007622718811, "step": 15}
{"train_info/time_between_train_steps": 0.005432605743408203, "step": 15}
{"info/global_step": 16, "train_info/time_within_train_step": 25.026381254196167, "step": 16}
{"train_info/time_between_train_steps": 0.00533747673034668, "step": 16}
{"info/global_step": 17, "train_info/time_within_train_step": 24.82409429550171, "step": 17}
{"train_info/time_between_train_steps": 0.005103349685668945, "step": 17}
{"info/global_step": 18, "train_info/time_within_train_step": 24.82201313972473, "step": 18}
{"train_info/time_between_train_steps": 0.005330801010131836, "step": 18}
{"info/global_step": 19, "train_info/time_within_train_step": 24.79266881942749, "step": 19}
{"train_info/time_between_train_steps": 0.005071163177490234, "step": 19}
{"info/global_step": 20, "train_info/time_within_train_step": 24.78656244277954, "step": 20}
{"train_info/time_between_train_steps": 0.005069255828857422, "step": 20}
{"info/global_step": 21, "train_info/time_within_train_step": 24.737099409103394, "step": 21}
{"train_info/time_between_train_steps": 0.005138874053955078, "step": 21}
{"info/global_step": 22, "train_info/time_within_train_step": 24.744120359420776, "step": 22}
{"train_info/time_between_train_steps": 0.005052089691162109, "step": 22}
{"info/global_step": 23, "train_info/time_within_train_step": 24.736136198043823, "step": 23}
{"train_info/time_between_train_steps": 0.004993915557861328, "step": 23}
{"info/global_step": 24, "train_info/time_within_train_step": 24.749072313308716, "step": 24}
{"train_info/time_between_train_steps": 0.00518035888671875, "step": 24}
{"info/global_step": 25, "train_info/time_within_train_step": 24.76796841621399, "step": 25}
{"train_info/time_between_train_steps": 0.005128383636474609, "step": 25}
{"info/global_step": 26, "train_info/time_within_train_step": 24.770771026611328, "step": 26}
{"train_info/time_between_train_steps": 0.005117177963256836, "step": 26}
{"info/global_step": 27, "train_info/time_within_train_step": 24.77668023109436, "step": 27}
{"train_info/time_between_train_steps": 0.005379199981689453, "step": 27}
{"info/global_step": 28, "train_info/time_within_train_step": 24.766622304916382, "step": 28}
{"train_info/time_between_train_steps": 0.0051004886627197266, "step": 28}
{"info/global_step": 29, "train_info/time_within_train_step": 24.775333404541016, "step": 29}
{"train_info/time_between_train_steps": 0.005373716354370117, "step": 29}
{"info/global_step": 30, "train_info/time_within_train_step": 24.787676572799683, "step": 30}
{"train_info/time_between_train_steps": 0.010397911071777344, "step": 30}
{"info/global_step": 31, "train_info/time_within_train_step": 24.901972770690918, "step": 31}
{"train_info/time_between_train_steps": 0.00505828857421875, "step": 31}
{"info/global_step": 32, "train_info/time_within_train_step": 24.91492462158203, "step": 32}
{"train_info/time_between_train_steps": 0.005320549011230469, "step": 32}
{"info/global_step": 33, "train_info/time_within_train_step": 24.814911603927612, "step": 33}
{"train_info/time_between_train_steps": 0.00563502311706543, "step": 33}
{"info/global_step": 34, "train_info/time_within_train_step": 24.84148669242859, "step": 34}
{"train_info/time_between_train_steps": 0.0062329769134521484, "step": 34}
{"train_info/time_between_train_steps": 5.339306592941284, "step": 34}
{"info/global_step": 35, "train_info/time_within_train_step": 25.011415719985962, "step": 35}
{"train_info/time_between_train_steps": 0.005385160446166992, "step": 35}
{"info/global_step": 36, "train_info/time_within_train_step": 24.950895071029663, "step": 36}
{"train_info/time_between_train_steps": 0.005301237106323242, "step": 36}
{"info/global_step": 37, "train_info/time_within_train_step": 24.793596982955933, "step": 37}
{"train_info/time_between_train_steps": 0.005071878433227539, "step": 37}
{"info/global_step": 38, "train_info/time_within_train_step": 24.920902490615845, "step": 38}
{"train_info/time_between_train_steps": 0.005326032638549805, "step": 38}
{"info/global_step": 39, "train_info/time_within_train_step": 24.818591594696045, "step": 39}
{"train_info/time_between_train_steps": 0.0074846744537353516, "step": 39}
{"info/global_step": 40, "train_info/time_within_train_step": 24.928252935409546, "step": 40}
{"train_info/time_between_train_steps": 0.00762629508972168, "step": 40}
{"info/global_step": 41, "train_info/time_within_train_step": 24.78254461288452, "step": 41}
{"train_info/time_between_train_steps": 0.007555484771728516, "step": 41}
{"info/global_step": 42, "train_info/time_within_train_step": 24.941072940826416, "step": 42}
{"train_info/time_between_train_steps": 0.006258726119995117, "step": 42}
{"info/global_step": 43, "train_info/time_within_train_step": 24.765688180923462, "step": 43}
{"train_info/time_between_train_steps": 0.005083560943603516, "step": 43}
{"info/global_step": 44, "train_info/time_within_train_step": 24.8748676776886, "step": 44}
{"train_info/time_between_train_steps": 0.005274295806884766, "step": 44}
{"info/global_step": 45, "train_info/time_within_train_step": 24.795369148254395, "step": 45}
{"train_info/time_between_train_steps": 0.00563502311706543, "step": 45}
{"info/global_step": 46, "train_info/time_within_train_step": 24.896656274795532, "step": 46}
{"train_info/time_between_train_steps": 0.005282163619995117, "step": 46}
{"info/global_step": 47, "train_info/time_within_train_step": 24.89812707901001, "step": 47}
{"train_info/time_between_train_steps": 0.010710716247558594, "step": 47}
{"info/global_step": 48, "train_info/time_within_train_step": 24.903117179870605, "step": 48}
{"train_info/time_between_train_steps": 0.005549192428588867, "step": 48}
{"info/global_step": 49, "train_info/time_within_train_step": 24.783502340316772, "step": 49}
{"train_info/time_between_train_steps": 0.010082483291625977, "step": 49}
{"info/global_step": 50, "train_info/time_within_train_step": 24.772361993789673, "step": 50}
{"train_info": {"train_info/memory_allocated": 1581.5546875, "train_info/memory_max_allocated": 18057.0224609375, "train_info/memory_reserved": 19104.0, "train_info/memory_max_reserved": 19104.0, "_timestamp": 1740921346, "_runtime": 1257}, "step": 50}
{"logs": {"train/loss": 7.2523, "train/learning_rate": 0.00025, "train/epoch": 1.01, "_timestamp": 1740921346, "_runtime": 1257}, "step": 50}
{"train_info/time_between_train_steps": 0.008487939834594727, "step": 50}
{"info/global_step": 51, "train_info/time_within_train_step": 24.76487159729004, "step": 51}
{"train_info/time_between_train_steps": 0.005156755447387695, "step": 51}
{"info/global_step": 52, "train_info/time_within_train_step": 24.7608699798584, "step": 52}
{"train_info/time_between_train_steps": 0.006047725677490234, "step": 52}
{"info/global_step": 53, "train_info/time_within_train_step": 24.76108741760254, "step": 53}
{"train_info/time_between_train_steps": 0.005170345306396484, "step": 53}
{"info/global_step": 54, "train_info/time_within_train_step": 24.7758629322052, "step": 54}
{"train_info/time_between_train_steps": 0.006214141845703125, "step": 54}
{"info/global_step": 55, "train_info/time_within_train_step": 24.770238876342773, "step": 55}
{"train_info/time_between_train_steps": 0.005258798599243164, "step": 55}
{"info/global_step": 56, "train_info/time_within_train_step": 24.81588077545166, "step": 56}
{"train_info/time_between_train_steps": 0.005321979522705078, "step": 56}
{"info/global_step": 57, "train_info/time_within_train_step": 24.789792776107788, "step": 57}
{"train_info/time_between_train_steps": 0.0052988529205322266, "step": 57}
{"info/global_step": 58, "train_info/time_within_train_step": 24.772271871566772, "step": 58}
{"train_info/time_between_train_steps": 0.006421327590942383, "step": 58}
{"info/global_step": 59, "train_info/time_within_train_step": 24.79297709465027, "step": 59}
{"train_info/time_between_train_steps": 0.0051844120025634766, "step": 59}
{"info/global_step": 60, "train_info/time_within_train_step": 24.801740646362305, "step": 60}
{"train_info/time_between_train_steps": 0.010095596313476562, "step": 60}
{"info/global_step": 61, "train_info/time_within_train_step": 24.804505348205566, "step": 61}
{"train_info/time_between_train_steps": 0.005092144012451172, "step": 61}
{"info/global_step": 62, "train_info/time_within_train_step": 24.809823751449585, "step": 62}
{"train_info/time_between_train_steps": 0.005235195159912109, "step": 62}
{"info/global_step": 63, "train_info/time_within_train_step": 24.889126539230347, "step": 63}
{"train_info/time_between_train_steps": 0.005342006683349609, "step": 63}
{"info/global_step": 64, "train_info/time_within_train_step": 24.828266620635986, "step": 64}
{"train_info/time_between_train_steps": 0.0052030086517333984, "step": 64}
{"info/global_step": 65, "train_info/time_within_train_step": 24.799081087112427, "step": 65}
{"train_info/time_between_train_steps": 0.0054013729095458984, "step": 65}
{"info/global_step": 66, "train_info/time_within_train_step": 24.80423140525818, "step": 66}
{"train_info/time_between_train_steps": 0.005564451217651367, "step": 66}
{"info/global_step": 67, "train_info/time_within_train_step": 24.801207304000854, "step": 67}
{"train_info/time_between_train_steps": 0.005765199661254883, "step": 67}
{"info/global_step": 68, "train_info/time_within_train_step": 24.838858604431152, "step": 68}
{"train_info/time_between_train_steps": 0.006044864654541016, "step": 68}
{"train_info/time_between_train_steps": 5.24376654624939, "step": 68}
{"info/global_step": 69, "train_info/time_within_train_step": 24.74887466430664, "step": 69}
{"train_info/time_between_train_steps": 0.00510859489440918, "step": 69}
{"info/global_step": 70, "train_info/time_within_train_step": 24.86243486404419, "step": 70}
{"train_info/time_between_train_steps": 0.00501251220703125, "step": 70}
{"info/global_step": 71, "train_info/time_within_train_step": 24.77493691444397, "step": 71}
{"train_info/time_between_train_steps": 0.004936695098876953, "step": 71}
{"info/global_step": 72, "train_info/time_within_train_step": 24.93021869659424, "step": 72}
{"train_info/time_between_train_steps": 0.005214214324951172, "step": 72}
{"info/global_step": 73, "train_info/time_within_train_step": 24.811963319778442, "step": 73}
{"train_info/time_between_train_steps": 0.006035327911376953, "step": 73}
{"info/global_step": 74, "train_info/time_within_train_step": 24.88904356956482, "step": 74}
{"train_info/time_between_train_steps": 0.005064725875854492, "step": 74}
{"info/global_step": 75, "train_info/time_within_train_step": 24.77592444419861, "step": 75}
{"train_info/time_between_train_steps": 0.005513906478881836, "step": 75}
{"info/global_step": 76, "train_info/time_within_train_step": 24.92940402030945, "step": 76}
{"train_info/time_between_train_steps": 0.005401134490966797, "step": 76}
{"info/global_step": 77, "train_info/time_within_train_step": 24.791345357894897, "step": 77}
{"train_info/time_between_train_steps": 0.005208253860473633, "step": 77}
{"info/global_step": 78, "train_info/time_within_train_step": 25.011282920837402, "step": 78}
{"train_info/time_between_train_steps": 0.005326986312866211, "step": 78}
{"info/global_step": 79, "train_info/time_within_train_step": 24.797748804092407, "step": 79}
{"train_info/time_between_train_steps": 0.005845546722412109, "step": 79}
{"info/global_step": 80, "train_info/time_within_train_step": 24.90913724899292, "step": 80}
{"train_info/time_between_train_steps": 0.005231618881225586, "step": 80}
{"info/global_step": 81, "train_info/time_within_train_step": 24.79573655128479, "step": 81}
{"train_info/time_between_train_steps": 0.0054798126220703125, "step": 81}
{"info/global_step": 82, "train_info/time_within_train_step": 24.879939079284668, "step": 82}
{"train_info/time_between_train_steps": 0.005312681198120117, "step": 82}
{"info/global_step": 83, "train_info/time_within_train_step": 24.801668405532837, "step": 83}
{"train_info/time_between_train_steps": 0.004910945892333984, "step": 83}
{"info/global_step": 84, "train_info/time_within_train_step": 24.76822519302368, "step": 84}
{"train_info/time_between_train_steps": 0.00997304916381836, "step": 84}
{"info/global_step": 85, "train_info/time_within_train_step": 24.775590658187866, "step": 85}
{"train_info/time_between_train_steps": 0.010097503662109375, "step": 85}
{"info/global_step": 86, "train_info/time_within_train_step": 24.763813495635986, "step": 86}
{"train_info/time_between_train_steps": 0.009991645812988281, "step": 86}
{"info/global_step": 87, "train_info/time_within_train_step": 24.772047996520996, "step": 87}
{"train_info/time_between_train_steps": 0.005001544952392578, "step": 87}
{"info/global_step": 88, "train_info/time_within_train_step": 24.784770250320435, "step": 88}
{"train_info/time_between_train_steps": 0.005179405212402344, "step": 88}
{"info/global_step": 89, "train_info/time_within_train_step": 24.848997116088867, "step": 89}
{"train_info/time_between_train_steps": 0.005191326141357422, "step": 89}
{"info/global_step": 90, "train_info/time_within_train_step": 24.78225040435791, "step": 90}
{"train_info/time_between_train_steps": 0.009989261627197266, "step": 90}
{"info/global_step": 91, "train_info/time_within_train_step": 24.79836416244507, "step": 91}
{"train_info/time_between_train_steps": 0.0052950382232666016, "step": 91}
{"info/global_step": 92, "train_info/time_within_train_step": 24.787277698516846, "step": 92}
{"train_info/time_between_train_steps": 0.005286455154418945, "step": 92}
{"info/global_step": 93, "train_info/time_within_train_step": 24.780993461608887, "step": 93}
{"train_info/time_between_train_steps": 0.005224704742431641, "step": 93}
{"info/global_step": 94, "train_info/time_within_train_step": 24.919578313827515, "step": 94}
{"train_info/time_between_train_steps": 0.005186319351196289, "step": 94}
{"info/global_step": 95, "train_info/time_within_train_step": 24.774234533309937, "step": 95}
{"train_info/time_between_train_steps": 0.0051724910736083984, "step": 95}
{"info/global_step": 96, "train_info/time_within_train_step": 24.774667978286743, "step": 96}
{"train_info/time_between_train_steps": 0.005136251449584961, "step": 96}
{"info/global_step": 97, "train_info/time_within_train_step": 24.87544560432434, "step": 97}
{"train_info/time_between_train_steps": 0.00531005859375, "step": 97}
{"info/global_step": 98, "train_info/time_within_train_step": 24.80091381072998, "step": 98}
{"train_info/time_between_train_steps": 0.009202241897583008, "step": 98}
{"info/global_step": 99, "train_info/time_within_train_step": 24.77820134162903, "step": 99}
{"train_info/time_between_train_steps": 0.005061149597167969, "step": 99}
{"info/global_step": 100, "train_info/time_within_train_step": 24.781496286392212, "step": 100}
{"train_info": {"train_info/memory_allocated": 1581.5546875, "train_info/memory_max_allocated": 18057.0224609375, "train_info/memory_reserved": 19104.0, "train_info/memory_max_reserved": 19104.0, "_timestamp": 1740922592, "_runtime": 2503}, "step": 100}
{"logs": {"train/loss": 5.2491, "train/learning_rate": 0.0005, "train/epoch": 2.03, "_timestamp": 1740922592, "_runtime": 2503}, "step": 100}
{"train_info/time_between_train_steps": 11.028911828994751, "step": 100}
{"info/global_step": 101, "train_info/time_within_train_step": 24.839141130447388, "step": 101}
{"train_info/time_between_train_steps": 0.005518436431884766, "step": 101}
{"info/global_step": 102, "train_info/time_within_train_step": 24.841291904449463, "step": 102}
{"train_info/time_between_train_steps": 0.0062901973724365234, "step": 102}
{"train_info/time_between_train_steps": 5.367207050323486, "step": 102}
{"info/global_step": 103, "train_info/time_within_train_step": 24.794697046279907, "step": 103}
{"train_info/time_between_train_steps": 0.005364179611206055, "step": 103}
{"info/global_step": 104, "train_info/time_within_train_step": 24.994399785995483, "step": 104}
{"train_info/time_between_train_steps": 0.00955653190612793, "step": 104}
{"info/global_step": 105, "train_info/time_within_train_step": 24.8295955657959, "step": 105}
{"train_info/time_between_train_steps": 0.005156278610229492, "step": 105}
{"info/global_step": 106, "train_info/time_within_train_step": 24.976973056793213, "step": 106}
{"train_info/time_between_train_steps": 0.005389213562011719, "step": 106}
{"info/global_step": 107, "train_info/time_within_train_step": 24.860315561294556, "step": 107}
{"train_info/time_between_train_steps": 0.010249853134155273, "step": 107}
{"info/global_step": 108, "train_info/time_within_train_step": 24.90214991569519, "step": 108}
{"train_info/time_between_train_steps": 0.005239963531494141, "step": 108}
{"info/global_step": 109, "train_info/time_within_train_step": 24.790313005447388, "step": 109}
{"train_info/time_between_train_steps": 0.005441188812255859, "step": 109}
{"info/global_step": 110, "train_info/time_within_train_step": 25.059134244918823, "step": 110}
{"train_info/time_between_train_steps": 0.005263328552246094, "step": 110}
{"info/global_step": 111, "train_info/time_within_train_step": 24.812580585479736, "step": 111}
{"train_info/time_between_train_steps": 0.005194902420043945, "step": 111}
{"info/global_step": 112, "train_info/time_within_train_step": 24.966216325759888, "step": 112}
{"train_info/time_between_train_steps": 0.0052776336669921875, "step": 112}
{"info/global_step": 113, "train_info/time_within_train_step": 24.79370093345642, "step": 113}
{"train_info/time_between_train_steps": 0.005434274673461914, "step": 113}
{"info/global_step": 114, "train_info/time_within_train_step": 24.897989749908447, "step": 114}
{"train_info/time_between_train_steps": 0.005292654037475586, "step": 114}
{"info/global_step": 115, "train_info/time_within_train_step": 24.79217290878296, "step": 115}
{"train_info/time_between_train_steps": 0.0052967071533203125, "step": 115}
{"info/global_step": 116, "train_info/time_within_train_step": 24.901453733444214, "step": 116}
{"train_info/time_between_train_steps": 0.005383968353271484, "step": 116}
{"info/global_step": 117, "train_info/time_within_train_step": 24.82537841796875, "step": 117}
{"train_info/time_between_train_steps": 0.005053520202636719, "step": 117}
{"info/global_step": 118, "train_info/time_within_train_step": 24.836827039718628, "step": 118}
{"train_info/time_between_train_steps": 0.005095720291137695, "step": 118}
{"info/global_step": 119, "train_info/time_within_train_step": 24.83863091468811, "step": 119}
{"train_info/time_between_train_steps": 0.0051403045654296875, "step": 119}
{"info/global_step": 120, "train_info/time_within_train_step": 24.842710494995117, "step": 120}
{"train_info/time_between_train_steps": 0.005640506744384766, "step": 120}
{"info/global_step": 121, "train_info/time_within_train_step": 24.838252544403076, "step": 121}
{"train_info/time_between_train_steps": 0.009952545166015625, "step": 121}
{"info/global_step": 122, "train_info/time_within_train_step": 24.85964870452881, "step": 122}
{"train_info/time_between_train_steps": 0.008583784103393555, "step": 122}
{"info/global_step": 123, "train_info/time_within_train_step": 24.847113609313965, "step": 123}
{"train_info/time_between_train_steps": 0.005143404006958008, "step": 123}
{"info/global_step": 124, "train_info/time_within_train_step": 24.805502891540527, "step": 124}
{"train_info/time_between_train_steps": 0.005105495452880859, "step": 124}
{"info/global_step": 125, "train_info/time_within_train_step": 24.8937087059021, "step": 125}
{"train_info/time_between_train_steps": 0.005174160003662109, "step": 125}
{"info/global_step": 126, "train_info/time_within_train_step": 24.785630464553833, "step": 126}
{"train_info/time_between_train_steps": 0.005116939544677734, "step": 126}
{"info/global_step": 127, "train_info/time_within_train_step": 24.809425354003906, "step": 127}
{"train_info/time_between_train_steps": 0.005029201507568359, "step": 127}
{"info/global_step": 128, "train_info/time_within_train_step": 24.818108320236206, "step": 128}
{"train_info/time_between_train_steps": 0.005311489105224609, "step": 128}
{"info/global_step": 129, "train_info/time_within_train_step": 24.784713983535767, "step": 129}
{"train_info/time_between_train_steps": 0.009955167770385742, "step": 129}
{"info/global_step": 130, "train_info/time_within_train_step": 24.80552840232849, "step": 130}
{"train_info/time_between_train_steps": 0.005160808563232422, "step": 130}
{"info/global_step": 131, "train_info/time_within_train_step": 24.817366361618042, "step": 131}
{"train_info/time_between_train_steps": 0.0054624080657958984, "step": 131}
{"info/global_step": 132, "train_info/time_within_train_step": 24.816241979599, "step": 132}
{"train_info/time_between_train_steps": 0.010177373886108398, "step": 132}
{"info/global_step": 133, "train_info/time_within_train_step": 24.7843120098114, "step": 133}
{"train_info/time_between_train_steps": 0.005334138870239258, "step": 133}
{"info/global_step": 134, "train_info/time_within_train_step": 24.80145764350891, "step": 134}
{"train_info/time_between_train_steps": 0.0053255558013916016, "step": 134}
{"info/global_step": 135, "train_info/time_within_train_step": 24.83701729774475, "step": 135}
{"train_info/time_between_train_steps": 0.0059740543365478516, "step": 135}
{"info/global_step": 136, "train_info/time_within_train_step": 24.953816890716553, "step": 136}
{"train_info/time_between_train_steps": 0.00622868537902832, "step": 136}
{"train_info/time_between_train_steps": 5.063098669052124, "step": 136}
{"info/global_step": 137, "train_info/time_within_train_step": 24.81296706199646, "step": 137}
{"train_info/time_between_train_steps": 0.006559133529663086, "step": 137}
{"info/global_step": 138, "train_info/time_within_train_step": 24.949511766433716, "step": 138}
{"train_info/time_between_train_steps": 0.005316495895385742, "step": 138}
{"info/global_step": 139, "train_info/time_within_train_step": 24.821558952331543, "step": 139}
{"train_info/time_between_train_steps": 0.005319118499755859, "step": 139}
{"info/global_step": 140, "train_info/time_within_train_step": 24.96777057647705, "step": 140}
{"train_info/time_between_train_steps": 0.005365848541259766, "step": 140}
{"info/global_step": 141, "train_info/time_within_train_step": 24.911173105239868, "step": 141}
{"train_info/time_between_train_steps": 0.006280422210693359, "step": 141}
{"info/global_step": 142, "train_info/time_within_train_step": 24.930566787719727, "step": 142}
{"train_info/time_between_train_steps": 0.006249189376831055, "step": 142}
{"info/global_step": 143, "train_info/time_within_train_step": 24.82397961616516, "step": 143}
{"train_info/time_between_train_steps": 0.005417585372924805, "step": 143}
{"info/global_step": 144, "train_info/time_within_train_step": 24.982408046722412, "step": 144}
{"train_info/time_between_train_steps": 0.005280494689941406, "step": 144}
{"info/global_step": 145, "train_info/time_within_train_step": 24.794698238372803, "step": 145}
{"train_info/time_between_train_steps": 0.005131721496582031, "step": 145}
{"info/global_step": 146, "train_info/time_within_train_step": 24.912818908691406, "step": 146}
{"train_info/time_between_train_steps": 0.0052490234375, "step": 146}
{"info/global_step": 147, "train_info/time_within_train_step": 24.80975842475891, "step": 147}
{"train_info/time_between_train_steps": 0.005635738372802734, "step": 147}
{"info/global_step": 148, "train_info/time_within_train_step": 24.974666357040405, "step": 148}
{"train_info/time_between_train_steps": 0.005245685577392578, "step": 148}
{"info/global_step": 149, "train_info/time_within_train_step": 24.83226466178894, "step": 149}
{"train_info/time_between_train_steps": 0.00542449951171875, "step": 149}
{"info/global_step": 150, "train_info/time_within_train_step": 24.92183494567871, "step": 150}
{"train_info": {"train_info/memory_allocated": 1581.5546875, "train_info/memory_max_allocated": 18057.0224609375, "train_info/memory_reserved": 19104.0, "train_info/memory_max_reserved": 19104.0, "_timestamp": 1740923857, "_runtime": 3768}, "step": 150}
{"logs": {"train/loss": 4.5664, "train/learning_rate": 0.0005833333333333333, "train/epoch": 4.01, "_timestamp": 1740923857, "_runtime": 3768}, "step": 150}
{"train_info/time_between_train_steps": 0.009172439575195312, "step": 150}
{"info/global_step": 151, "train_info/time_within_train_step": 24.807873010635376, "step": 151}
{"train_info/time_between_train_steps": 0.004883527755737305, "step": 151}
{"info/global_step": 152, "train_info/time_within_train_step": 24.788182258605957, "step": 152}
{"train_info/time_between_train_steps": 0.0050792694091796875, "step": 152}
{"info/global_step": 153, "train_info/time_within_train_step": 24.815590620040894, "step": 153}
{"train_info/time_between_train_steps": 0.0050470829010009766, "step": 153}
{"info/global_step": 154, "train_info/time_within_train_step": 24.813863039016724, "step": 154}
{"train_info/time_between_train_steps": 0.00523829460144043, "step": 154}
{"info/global_step": 155, "train_info/time_within_train_step": 24.784559965133667, "step": 155}
{"train_info/time_between_train_steps": 0.009888410568237305, "step": 155}
{"info/global_step": 156, "train_info/time_within_train_step": 24.89781665802002, "step": 156}
{"train_info/time_between_train_steps": 0.005021095275878906, "step": 156}
{"info/global_step": 157, "train_info/time_within_train_step": 24.839410543441772, "step": 157}
{"train_info/time_between_train_steps": 0.005189180374145508, "step": 157}
{"info/global_step": 158, "train_info/time_within_train_step": 24.833443641662598, "step": 158}
{"train_info/time_between_train_steps": 0.005168437957763672, "step": 158}
{"info/global_step": 159, "train_info/time_within_train_step": 24.804860830307007, "step": 159}
{"train_info/time_between_train_steps": 0.005076169967651367, "step": 159}
{"info/global_step": 160, "train_info/time_within_train_step": 24.82519841194153, "step": 160}
{"train_info/time_between_train_steps": 0.005281925201416016, "step": 160}
{"info/global_step": 161, "train_info/time_within_train_step": 24.844583749771118, "step": 161}
{"train_info/time_between_train_steps": 0.005076169967651367, "step": 161}
{"info/global_step": 162, "train_info/time_within_train_step": 24.904642343521118, "step": 162}
{"train_info/time_between_train_steps": 0.010017871856689453, "step": 162}
{"info/global_step": 163, "train_info/time_within_train_step": 24.81181502342224, "step": 163}
{"train_info/time_between_train_steps": 0.005285501480102539, "step": 163}
{"info/global_step": 164, "train_info/time_within_train_step": 24.792205572128296, "step": 164}
{"train_info/time_between_train_steps": 0.0051767826080322266, "step": 164}
{"info/global_step": 165, "train_info/time_within_train_step": 24.794247150421143, "step": 165}
{"train_info/time_between_train_steps": 0.005123615264892578, "step": 165}
{"info/global_step": 166, "train_info/time_within_train_step": 24.776041746139526, "step": 166}
{"train_info/time_between_train_steps": 0.005133628845214844, "step": 166}
{"info/global_step": 167, "train_info/time_within_train_step": 24.75942301750183, "step": 167}
{"train_info/time_between_train_steps": 0.005021810531616211, "step": 167}
{"info/global_step": 168, "train_info/time_within_train_step": 24.758984327316284, "step": 168}
{"train_info/time_between_train_steps": 0.005272626876831055, "step": 168}
{"info/global_step": 169, "train_info/time_within_train_step": 24.779895305633545, "step": 169}
{"train_info/time_between_train_steps": 0.005660295486450195, "step": 169}
{"info/global_step": 170, "train_info/time_within_train_step": 24.800325870513916, "step": 170}
{"train_info/time_between_train_steps": 0.011174440383911133, "step": 170}
{"train_info/time_between_train_steps": 5.148841381072998, "step": 170}
{"info/global_step": 171, "train_info/time_within_train_step": 24.774402618408203, "step": 171}
{"train_info/time_between_train_steps": 0.005356550216674805, "step": 171}
{"info/global_step": 172, "train_info/time_within_train_step": 24.990087032318115, "step": 172}
{"train_info/time_between_train_steps": 0.005226612091064453, "step": 172}
{"info/global_step": 173, "train_info/time_within_train_step": 24.776130199432373, "step": 173}
{"train_info/time_between_train_steps": 0.005261898040771484, "step": 173}
{"info/global_step": 174, "train_info/time_within_train_step": 24.890624046325684, "step": 174}
{"train_info/time_between_train_steps": 0.010178804397583008, "step": 174}
{"info/global_step": 175, "train_info/time_within_train_step": 24.789061784744263, "step": 175}
{"train_info/time_between_train_steps": 0.010279417037963867, "step": 175}
{"info/global_step": 176, "train_info/time_within_train_step": 24.941460371017456, "step": 176}
{"train_info/time_between_train_steps": 0.005402088165283203, "step": 176}
{"info/global_step": 177, "train_info/time_within_train_step": 24.86020541191101, "step": 177}
{"train_info/time_between_train_steps": 0.005285739898681641, "step": 177}
{"info/global_step": 178, "train_info/time_within_train_step": 24.970403909683228, "step": 178}
{"train_info/time_between_train_steps": 0.0052797794342041016, "step": 178}
{"info/global_step": 179, "train_info/time_within_train_step": 24.78226661682129, "step": 179}
{"train_info/time_between_train_steps": 0.010419368743896484, "step": 179}
{"info/global_step": 180, "train_info/time_within_train_step": 24.894317626953125, "step": 180}
{"train_info/time_between_train_steps": 0.010095834732055664, "step": 180}
{"info/global_step": 181, "train_info/time_within_train_step": 24.787662982940674, "step": 181}
{"train_info/time_between_train_steps": 0.006641864776611328, "step": 181}
{"info/global_step": 182, "train_info/time_within_train_step": 24.903980016708374, "step": 182}
{"train_info/time_between_train_steps": 0.007647514343261719, "step": 182}
{"info/global_step": 183, "train_info/time_within_train_step": 24.7781183719635, "step": 183}
{"train_info/time_between_train_steps": 0.007536411285400391, "step": 183}
{"info/global_step": 184, "train_info/time_within_train_step": 24.846612215042114, "step": 184}
{"train_info/time_between_train_steps": 0.005488157272338867, "step": 184}
{"info/global_step": 185, "train_info/time_within_train_step": 24.78907561302185, "step": 185}
{"train_info/time_between_train_steps": 0.005101680755615234, "step": 185}
{"info/global_step": 186, "train_info/time_within_train_step": 24.75334668159485, "step": 186}
{"train_info/time_between_train_steps": 0.009692668914794922, "step": 186}
{"info/global_step": 187, "train_info/time_within_train_step": 24.761815309524536, "step": 187}
{"train_info/time_between_train_steps": 0.005024433135986328, "step": 187}
{"info/global_step": 188, "train_info/time_within_train_step": 24.866244792938232, "step": 188}
{"train_info/time_between_train_steps": 0.00614166259765625, "step": 188}
{"info/global_step": 189, "train_info/time_within_train_step": 24.761016845703125, "step": 189}
{"train_info/time_between_train_steps": 0.004978656768798828, "step": 189}
{"info/global_step": 190, "train_info/time_within_train_step": 24.75328016281128, "step": 190}
{"train_info/time_between_train_steps": 0.009829998016357422, "step": 190}
{"info/global_step": 191, "train_info/time_within_train_step": 24.775492906570435, "step": 191}
{"train_info/time_between_train_steps": 0.005139827728271484, "step": 191}
{"info/global_step": 192, "train_info/time_within_train_step": 24.753293991088867, "step": 192}
{"train_info/time_between_train_steps": 0.0052030086517333984, "step": 192}
{"info/global_step": 193, "train_info/time_within_train_step": 24.76779580116272, "step": 193}
{"train_info/time_between_train_steps": 0.005042314529418945, "step": 193}
{"info/global_step": 194, "train_info/time_within_train_step": 24.769363403320312, "step": 194}
{"train_info/time_between_train_steps": 0.005322933197021484, "step": 194}
{"info/global_step": 195, "train_info/time_within_train_step": 24.757111072540283, "step": 195}
{"train_info/time_between_train_steps": 0.005010843276977539, "step": 195}
{"info/global_step": 196, "train_info/time_within_train_step": 24.776809453964233, "step": 196}
{"train_info/time_between_train_steps": 0.004990816116333008, "step": 196}
{"info/global_step": 197, "train_info/time_within_train_step": 24.77900719642639, "step": 197}
{"train_info/time_between_train_steps": 0.005385875701904297, "step": 197}
{"info/global_step": 198, "train_info/time_within_train_step": 24.760115385055542, "step": 198}
{"train_info/time_between_train_steps": 0.0053005218505859375, "step": 198}
{"info/global_step": 199, "train_info/time_within_train_step": 24.785183429718018, "step": 199}
{"train_info/time_between_train_steps": 0.005195140838623047, "step": 199}
{"info/global_step": 200, "train_info/time_within_train_step": 24.802248239517212, "step": 200}
{"train_info": {"train_info/memory_allocated": 1581.5546875, "train_info/memory_max_allocated": 18057.0224609375, "train_info/memory_reserved": 19104.0, "train_info/memory_max_reserved": 19104.0, "_timestamp": 1740925104, "_runtime": 5015}, "step": 200}
{"logs": {"train/loss": 4.2636, "train/learning_rate": 0.0005555555555555556, "train/epoch": 5.03, "_timestamp": 1740925104, "_runtime": 5015}, "step": 200}
{"train_info/time_between_train_steps": 11.614535093307495, "step": 200}
{"info/global_step": 201, "train_info/time_within_train_step": 24.778773069381714, "step": 201}
{"train_info/time_between_train_steps": 0.005067110061645508, "step": 201}
{"info/global_step": 202, "train_info/time_within_train_step": 24.810627937316895, "step": 202}
{"train_info/time_between_train_steps": 0.005315065383911133, "step": 202}
{"info/global_step": 203, "train_info/time_within_train_step": 24.9086651802063, "step": 203}
{"train_info/time_between_train_steps": 0.005756378173828125, "step": 203}
{"info/global_step": 204, "train_info/time_within_train_step": 24.82077121734619, "step": 204}
{"train_info/time_between_train_steps": 0.005696296691894531, "step": 204}
{"train_info/time_between_train_steps": 5.286012649536133, "step": 204}
{"info/global_step": 205, "train_info/time_within_train_step": 24.762563943862915, "step": 205}
{"train_info/time_between_train_steps": 0.004950761795043945, "step": 205}
{"info/global_step": 206, "train_info/time_within_train_step": 24.907906770706177, "step": 206}
{"train_info/time_between_train_steps": 0.005145072937011719, "step": 206}
{"info/global_step": 207, "train_info/time_within_train_step": 24.779087781906128, "step": 207}
{"train_info/time_between_train_steps": 0.005232095718383789, "step": 207}
{"info/global_step": 208, "train_info/time_within_train_step": 24.878329038619995, "step": 208}
{"train_info/time_between_train_steps": 0.00531768798828125, "step": 208}
{"info/global_step": 209, "train_info/time_within_train_step": 24.774940729141235, "step": 209}
{"train_info/time_between_train_steps": 0.0053517818450927734, "step": 209}
{"info/global_step": 210, "train_info/time_within_train_step": 24.937156438827515, "step": 210}
{"train_info/time_between_train_steps": 0.005270481109619141, "step": 210}
{"info/global_step": 211, "train_info/time_within_train_step": 24.8417809009552, "step": 211}
{"train_info/time_between_train_steps": 0.0052182674407958984, "step": 211}
{"info/global_step": 212, "train_info/time_within_train_step": 24.971694231033325, "step": 212}
{"train_info/time_between_train_steps": 0.005316972732543945, "step": 212}
{"info/global_step": 213, "train_info/time_within_train_step": 24.796252965927124, "step": 213}
{"train_info/time_between_train_steps": 0.012216567993164062, "step": 213}
{"info/global_step": 214, "train_info/time_within_train_step": 24.995652198791504, "step": 214}
{"train_info/time_between_train_steps": 0.0051496028900146484, "step": 214}
{"info/global_step": 215, "train_info/time_within_train_step": 24.811171770095825, "step": 215}
{"train_info/time_between_train_steps": 0.005648374557495117, "step": 215}
{"info/global_step": 216, "train_info/time_within_train_step": 24.960816860198975, "step": 216}
{"train_info/time_between_train_steps": 0.005512237548828125, "step": 216}
{"info/global_step": 217, "train_info/time_within_train_step": 24.8075852394104, "step": 217}
{"train_info/time_between_train_steps": 0.0054280757904052734, "step": 217}
{"info/global_step": 218, "train_info/time_within_train_step": 24.87603521347046, "step": 218}
{"train_info/time_between_train_steps": 0.005456686019897461, "step": 218}
{"info/global_step": 219, "train_info/time_within_train_step": 24.90362524986267, "step": 219}
{"train_info/time_between_train_steps": 0.005010366439819336, "step": 219}
{"info/global_step": 220, "train_info/time_within_train_step": 24.78439474105835, "step": 220}
{"train_info/time_between_train_steps": 0.004978656768798828, "step": 220}
{"info/global_step": 221, "train_info/time_within_train_step": 24.771243572235107, "step": 221}
{"train_info/time_between_train_steps": 0.005027055740356445, "step": 221}
{"info/global_step": 222, "train_info/time_within_train_step": 24.768791675567627, "step": 222}
{"train_info/time_between_train_steps": 0.005189180374145508, "step": 222}
{"info/global_step": 223, "train_info/time_within_train_step": 24.764159202575684, "step": 223}
{"train_info/time_between_train_steps": 0.009792566299438477, "step": 223}
{"info/global_step": 224, "train_info/time_within_train_step": 24.760315656661987, "step": 224}
{"train_info/time_between_train_steps": 0.009952306747436523, "step": 224}
{"info/global_step": 225, "train_info/time_within_train_step": 24.759663581848145, "step": 225}
{"train_info/time_between_train_steps": 0.005639791488647461, "step": 225}
{"info/global_step": 226, "train_info/time_within_train_step": 24.77721905708313, "step": 226}
{"train_info/time_between_train_steps": 0.005178928375244141, "step": 226}
{"info/global_step": 227, "train_info/time_within_train_step": 24.817552089691162, "step": 227}
{"train_info/time_between_train_steps": 0.005104541778564453, "step": 227}
{"info/global_step": 228, "train_info/time_within_train_step": 24.78292417526245, "step": 228}
{"train_info/time_between_train_steps": 0.005346775054931641, "step": 228}
{"info/global_step": 229, "train_info/time_within_train_step": 24.781423330307007, "step": 229}
{"train_info/time_between_train_steps": 0.005193948745727539, "step": 229}
{"info/global_step": 230, "train_info/time_within_train_step": 24.775365352630615, "step": 230}
{"train_info/time_between_train_steps": 0.0050241947174072266, "step": 230}
{"info/global_step": 231, "train_info/time_within_train_step": 24.78489923477173, "step": 231}
{"train_info/time_between_train_steps": 0.005281925201416016, "step": 231}
{"info/global_step": 232, "train_info/time_within_train_step": 24.778449773788452, "step": 232}
{"train_info/time_between_train_steps": 0.005064725875854492, "step": 232}
{"info/global_step": 233, "train_info/time_within_train_step": 24.785383224487305, "step": 233}
{"train_info/time_between_train_steps": 0.005183696746826172, "step": 233}
{"info/global_step": 234, "train_info/time_within_train_step": 24.92452907562256, "step": 234}
{"train_info/time_between_train_steps": 0.005278348922729492, "step": 234}
{"info/global_step": 235, "train_info/time_within_train_step": 24.825998544692993, "step": 235}
{"train_info/time_between_train_steps": 0.0051097869873046875, "step": 235}
{"info/global_step": 236, "train_info/time_within_train_step": 24.794219493865967, "step": 236}
{"train_info/time_between_train_steps": 0.0053861141204833984, "step": 236}
{"info/global_step": 237, "train_info/time_within_train_step": 24.81600785255432, "step": 237}
{"train_info/time_between_train_steps": 0.006402730941772461, "step": 237}
{"info/global_step": 238, "train_info/time_within_train_step": 25.24498152732849, "step": 238}
{"train_info/time_between_train_steps": 0.010510683059692383, "step": 238}
{"train_info/time_between_train_steps": 5.078988075256348, "step": 238}
{"info/global_step": 239, "train_info/time_within_train_step": 24.803812980651855, "step": 239}
{"train_info/time_between_train_steps": 0.005156993865966797, "step": 239}
{"info/global_step": 240, "train_info/time_within_train_step": 24.952269315719604, "step": 240}
{"train_info/time_between_train_steps": 0.005309104919433594, "step": 240}
{"info/global_step": 241, "train_info/time_within_train_step": 24.796534061431885, "step": 241}
{"train_info/time_between_train_steps": 0.005333662033081055, "step": 241}
{"info/global_step": 242, "train_info/time_within_train_step": 24.900112628936768, "step": 242}
{"train_info/time_between_train_steps": 0.005220890045166016, "step": 242}
{"info/global_step": 243, "train_info/time_within_train_step": 24.810805082321167, "step": 243}
{"train_info/time_between_train_steps": 0.005476951599121094, "step": 243}
{"info/global_step": 244, "train_info/time_within_train_step": 24.94054388999939, "step": 244}
{"train_info/time_between_train_steps": 0.0054247379302978516, "step": 244}
{"info/global_step": 245, "train_info/time_within_train_step": 24.787834405899048, "step": 245}
{"train_info/time_between_train_steps": 0.005237102508544922, "step": 245}
{"info/global_step": 246, "train_info/time_within_train_step": 24.94779658317566, "step": 246}
{"train_info/time_between_train_steps": 0.005205869674682617, "step": 246}
{"info/global_step": 247, "train_info/time_within_train_step": 24.802738666534424, "step": 247}
{"train_info/time_between_train_steps": 0.005419492721557617, "step": 247}
{"info/global_step": 248, "train_info/time_within_train_step": 24.918033123016357, "step": 248}
{"train_info/time_between_train_steps": 0.005076169967651367, "step": 248}
{"info/global_step": 249, "train_info/time_within_train_step": 24.818042993545532, "step": 249}
{"train_info/time_between_train_steps": 0.005561351776123047, "step": 249}
{"info/global_step": 250, "train_info/time_within_train_step": 25.04455852508545, "step": 250}
{"train_info": {"train_info/memory_allocated": 1581.5546875, "train_info/memory_max_allocated": 18057.0224609375, "train_info/memory_reserved": 19104.0, "train_info/memory_max_reserved": 19104.0, "_timestamp": 1740926369, "_runtime": 6280}, "step": 250}
{"logs": {"train/loss": 4.1491, "train/learning_rate": 0.0005277777777777777, "train/epoch": 7.01, "_timestamp": 1740926369, "_runtime": 6280}, "step": 250}
{"train_info/time_between_train_steps": 0.014718055725097656, "step": 250}
{"info/global_step": 251, "train_info/time_within_train_step": 24.79257893562317, "step": 251}
{"train_info/time_between_train_steps": 0.005406618118286133, "step": 251}
{"info/global_step": 252, "train_info/time_within_train_step": 24.87458372116089, "step": 252}
{"train_info/time_between_train_steps": 0.005360126495361328, "step": 252}
{"info/global_step": 253, "train_info/time_within_train_step": 24.859344005584717, "step": 253}
{"train_info/time_between_train_steps": 0.005194187164306641, "step": 253}
{"info/global_step": 254, "train_info/time_within_train_step": 24.791179895401, "step": 254}
{"train_info/time_between_train_steps": 0.009947776794433594, "step": 254}
{"info/global_step": 255, "train_info/time_within_train_step": 24.804360389709473, "step": 255}
{"train_info/time_between_train_steps": 0.005054950714111328, "step": 255}
{"info/global_step": 256, "train_info/time_within_train_step": 24.78124737739563, "step": 256}
{"train_info/time_between_train_steps": 0.005391597747802734, "step": 256}
{"info/global_step": 257, "train_info/time_within_train_step": 24.85259175300598, "step": 257}
{"train_info/time_between_train_steps": 0.005046844482421875, "step": 257}
{"info/global_step": 258, "train_info/time_within_train_step": 24.78471803665161, "step": 258}
{"train_info/time_between_train_steps": 0.00508570671081543, "step": 258}
{"info/global_step": 259, "train_info/time_within_train_step": 24.780942678451538, "step": 259}
{"train_info/time_between_train_steps": 0.0052149295806884766, "step": 259}
{"info/global_step": 260, "train_info/time_within_train_step": 24.78369402885437, "step": 260}
{"train_info/time_between_train_steps": 0.005034923553466797, "step": 260}
{"info/global_step": 261, "train_info/time_within_train_step": 24.8039231300354, "step": 261}
{"train_info/time_between_train_steps": 0.0050048828125, "step": 261}
{"info/global_step": 262, "train_info/time_within_train_step": 24.777438402175903, "step": 262}
{"train_info/time_between_train_steps": 0.005343437194824219, "step": 262}
{"info/global_step": 263, "train_info/time_within_train_step": 24.773326873779297, "step": 263}
{"train_info/time_between_train_steps": 0.004964590072631836, "step": 263}
{"info/global_step": 264, "train_info/time_within_train_step": 24.77667498588562, "step": 264}
{"train_info/time_between_train_steps": 0.0049474239349365234, "step": 264}
{"info/global_step": 265, "train_info/time_within_train_step": 24.78695797920227, "step": 265}
{"train_info/time_between_train_steps": 0.005151987075805664, "step": 265}
{"info/global_step": 266, "train_info/time_within_train_step": 24.868593215942383, "step": 266}
{"train_info/time_between_train_steps": 0.005203962326049805, "step": 266}
{"info/global_step": 267, "train_info/time_within_train_step": 24.782606840133667, "step": 267}
{"train_info/time_between_train_steps": 0.0051116943359375, "step": 267}
{"info/global_step": 268, "train_info/time_within_train_step": 24.786333084106445, "step": 268}
{"train_info/time_between_train_steps": 0.005159616470336914, "step": 268}
{"info/global_step": 269, "train_info/time_within_train_step": 24.779988050460815, "step": 269}
{"train_info/time_between_train_steps": 0.005280971527099609, "step": 269}
{"info/global_step": 270, "train_info/time_within_train_step": 24.803112268447876, "step": 270}
{"train_info/time_between_train_steps": 0.005125522613525391, "step": 270}
{"info/global_step": 271, "train_info/time_within_train_step": 24.799468278884888, "step": 271}
{"train_info/time_between_train_steps": 0.0055925846099853516, "step": 271}
{"info/global_step": 272, "train_info/time_within_train_step": 24.829561948776245, "step": 272}
{"train_info/time_between_train_steps": 0.00601649284362793, "step": 272}
{"train_info/time_between_train_steps": 5.067803144454956, "step": 272}
{"info/global_step": 273, "train_info/time_within_train_step": 24.760622024536133, "step": 273}
{"train_info/time_between_train_steps": 0.007229328155517578, "step": 273}
{"info/global_step": 274, "train_info/time_within_train_step": 24.95095705986023, "step": 274}
{"train_info/time_between_train_steps": 0.005341768264770508, "step": 274}
{"info/global_step": 275, "train_info/time_within_train_step": 24.902547597885132, "step": 275}
{"train_info/time_between_train_steps": 0.005635976791381836, "step": 275}
{"info/global_step": 276, "train_info/time_within_train_step": 24.906595945358276, "step": 276}
{"train_info/time_between_train_steps": 0.007585048675537109, "step": 276}
{"info/global_step": 277, "train_info/time_within_train_step": 24.814988613128662, "step": 277}
{"train_info/time_between_train_steps": 0.0053212642669677734, "step": 277}
{"info/global_step": 278, "train_info/time_within_train_step": 25.012235164642334, "step": 278}
{"train_info/time_between_train_steps": 0.010373115539550781, "step": 278}
{"info/global_step": 279, "train_info/time_within_train_step": 24.807786226272583, "step": 279}
{"train_info/time_between_train_steps": 0.010143756866455078, "step": 279}
{"info/global_step": 280, "train_info/time_within_train_step": 24.943576097488403, "step": 280}
{"train_info/time_between_train_steps": 0.0053064823150634766, "step": 280}
{"info/global_step": 281, "train_info/time_within_train_step": 25.007651329040527, "step": 281}
{"train_info/time_between_train_steps": 0.005596637725830078, "step": 281}
{"info/global_step": 282, "train_info/time_within_train_step": 24.940649032592773, "step": 282}
{"train_info/time_between_train_steps": 0.005099773406982422, "step": 282}
{"info/global_step": 283, "train_info/time_within_train_step": 24.810191869735718, "step": 283}
{"train_info/time_between_train_steps": 0.00693058967590332, "step": 283}
{"info/global_step": 284, "train_info/time_within_train_step": 24.96360468864441, "step": 284}
{"train_info/time_between_train_steps": 0.0054187774658203125, "step": 284}
{"info/global_step": 285, "train_info/time_within_train_step": 24.81496286392212, "step": 285}
{"train_info/time_between_train_steps": 0.0053081512451171875, "step": 285}
{"info/global_step": 286, "train_info/time_within_train_step": 24.84802508354187, "step": 286}
{"train_info/time_between_train_steps": 0.0076618194580078125, "step": 286}
{"info/global_step": 287, "train_info/time_within_train_step": 24.791069507598877, "step": 287}
{"train_info/time_between_train_steps": 0.0054988861083984375, "step": 287}
{"info/global_step": 288, "train_info/time_within_train_step": 24.77535843849182, "step": 288}
{"train_info/time_between_train_steps": 0.005514621734619141, "step": 288}
{"info/global_step": 289, "train_info/time_within_train_step": 24.776819705963135, "step": 289}
{"train_info/time_between_train_steps": 0.005072832107543945, "step": 289}
{"info/global_step": 290, "train_info/time_within_train_step": 24.8103289604187, "step": 290}
{"train_info/time_between_train_steps": 0.005164623260498047, "step": 290}
{"info/global_step": 291, "train_info/time_within_train_step": 24.793518781661987, "step": 291}
{"train_info/time_between_train_steps": 0.005084037780761719, "step": 291}
{"info/global_step": 292, "train_info/time_within_train_step": 24.810068607330322, "step": 292}
{"train_info/time_between_train_steps": 0.005106449127197266, "step": 292}
{"info/global_step": 293, "train_info/time_within_train_step": 24.80709218978882, "step": 293}
{"train_info/time_between_train_steps": 0.00513458251953125, "step": 293}
{"info/global_step": 294, "train_info/time_within_train_step": 24.78920888900757, "step": 294}
{"train_info/time_between_train_steps": 0.005137205123901367, "step": 294}
{"info/global_step": 295, "train_info/time_within_train_step": 24.783164262771606, "step": 295}
{"train_info/time_between_train_steps": 0.00543665885925293, "step": 295}
{"info/global_step": 296, "train_info/time_within_train_step": 24.785433530807495, "step": 296}
{"train_info/time_between_train_steps": 0.0051381587982177734, "step": 296}
{"info/global_step": 297, "train_info/time_within_train_step": 24.922919511795044, "step": 297}
{"train_info/time_between_train_steps": 0.005098581314086914, "step": 297}
{"info/global_step": 298, "train_info/time_within_train_step": 24.781251907348633, "step": 298}
{"train_info/time_between_train_steps": 0.005133867263793945, "step": 298}
{"info/global_step": 299, "train_info/time_within_train_step": 24.79051446914673, "step": 299}
{"train_info/time_between_train_steps": 0.005152225494384766, "step": 299}
{"info/global_step": 300, "train_info/time_within_train_step": 24.814976453781128, "step": 300}
{"train_info": {"train_info/memory_allocated": 1581.5546875, "train_info/memory_max_allocated": 18057.0224609375, "train_info/memory_reserved": 19104.0, "train_info/memory_max_reserved": 19104.0, "_timestamp": 1740927616, "_runtime": 7527}, "step": 300}
{"logs": {"train/loss": 3.9977, "train/learning_rate": 0.0005, "train/epoch": 8.02, "_timestamp": 1740927616, "_runtime": 7527}, "step": 300}
{"train_info/time_between_train_steps": 10.933754444122314, "step": 300}
{"info/global_step": 301, "train_info/time_within_train_step": 24.765063524246216, "step": 301}
{"train_info/time_between_train_steps": 0.005074501037597656, "step": 301}
{"info/global_step": 302, "train_info/time_within_train_step": 24.80315113067627, "step": 302}
{"train_info/time_between_train_steps": 0.005259513854980469, "step": 302}
{"info/global_step": 303, "train_info/time_within_train_step": 24.767523527145386, "step": 303}
{"train_info/time_between_train_steps": 0.005304574966430664, "step": 303}
{"info/global_step": 304, "train_info/time_within_train_step": 24.77528667449951, "step": 304}
{"train_info/time_between_train_steps": 0.005243062973022461, "step": 304}
{"info/global_step": 305, "train_info/time_within_train_step": 24.817107439041138, "step": 305}
{"train_info/time_between_train_steps": 0.005651712417602539, "step": 305}
{"info/global_step": 306, "train_info/time_within_train_step": 24.811697959899902, "step": 306}
{"train_info/time_between_train_steps": 0.00621485710144043, "step": 306}
{"train_info/time_between_train_steps": 5.163711071014404, "step": 306}
{"info/global_step": 307, "train_info/time_within_train_step": 24.77231478691101, "step": 307}
{"train_info/time_between_train_steps": 0.004957914352416992, "step": 307}
{"info/global_step": 308, "train_info/time_within_train_step": 24.916396856307983, "step": 308}
{"train_info/time_between_train_steps": 0.005436897277832031, "step": 308}
{"info/global_step": 309, "train_info/time_within_train_step": 24.815910577774048, "step": 309}
{"train_info/time_between_train_steps": 0.01044321060180664, "step": 309}
{"info/global_step": 310, "train_info/time_within_train_step": 24.89259099960327, "step": 310}
{"train_info/time_between_train_steps": 0.01021575927734375, "step": 310}
{"info/global_step": 311, "train_info/time_within_train_step": 24.79747247695923, "step": 311}
{"train_info/time_between_train_steps": 0.0052928924560546875, "step": 311}
{"info/global_step": 312, "train_info/time_within_train_step": 25.01759433746338, "step": 312}
{"train_info/time_between_train_steps": 0.007417917251586914, "step": 312}
{"info/global_step": 313, "train_info/time_within_train_step": 24.793709993362427, "step": 313}
{"train_info/time_between_train_steps": 0.00759434700012207, "step": 313}
{"info/global_step": 314, "train_info/time_within_train_step": 25.027040004730225, "step": 314}
{"train_info/time_between_train_steps": 0.005245208740234375, "step": 314}
{"info/global_step": 315, "train_info/time_within_train_step": 24.78758692741394, "step": 315}
{"train_info/time_between_train_steps": 0.005715608596801758, "step": 315}
{"info/global_step": 316, "train_info/time_within_train_step": 24.962263345718384, "step": 316}
{"train_info/time_between_train_steps": 0.006265401840209961, "step": 316}
{"info/global_step": 317, "train_info/time_within_train_step": 24.80383276939392, "step": 317}
{"train_info/time_between_train_steps": 0.01044464111328125, "step": 317}
{"info/global_step": 318, "train_info/time_within_train_step": 24.96462631225586, "step": 318}
{"train_info/time_between_train_steps": 0.005627632141113281, "step": 318}
{"info/global_step": 319, "train_info/time_within_train_step": 24.8078134059906, "step": 319}
{"train_info/time_between_train_steps": 0.0062940120697021484, "step": 319}
{"info/global_step": 320, "train_info/time_within_train_step": 24.891763925552368, "step": 320}
{"train_info/time_between_train_steps": 0.005314350128173828, "step": 320}
{"info/global_step": 321, "train_info/time_within_train_step": 24.820425510406494, "step": 321}
{"train_info/time_between_train_steps": 0.005212545394897461, "step": 321}
{"info/global_step": 322, "train_info/time_within_train_step": 24.78352689743042, "step": 322}
{"train_info/time_between_train_steps": 0.00502467155456543, "step": 322}
{"info/global_step": 323, "train_info/time_within_train_step": 24.81717801094055, "step": 323}
{"train_info/time_between_train_steps": 0.005151510238647461, "step": 323}
{"info/global_step": 324, "train_info/time_within_train_step": 24.823650598526, "step": 324}
{"train_info/time_between_train_steps": 0.005204916000366211, "step": 324}
{"info/global_step": 325, "train_info/time_within_train_step": 24.78371500968933, "step": 325}
{"train_info/time_between_train_steps": 0.004984140396118164, "step": 325}
{"info/global_step": 326, "train_info/time_within_train_step": 24.781360626220703, "step": 326}
{"train_info/time_between_train_steps": 0.009865522384643555, "step": 326}
{"info/global_step": 327, "train_info/time_within_train_step": 24.777124166488647, "step": 327}
{"train_info/time_between_train_steps": 0.005213737487792969, "step": 327}
{"info/global_step": 328, "train_info/time_within_train_step": 24.88957691192627, "step": 328}
{"train_info/time_between_train_steps": 0.0060367584228515625, "step": 328}
{"info/global_step": 329, "train_info/time_within_train_step": 24.780477046966553, "step": 329}
{"train_info/time_between_train_steps": 0.0050389766693115234, "step": 329}
{"info/global_step": 330, "train_info/time_within_train_step": 24.789347887039185, "step": 330}
{"train_info/time_between_train_steps": 0.006169795989990234, "step": 330}
{"info/global_step": 331, "train_info/time_within_train_step": 24.77304220199585, "step": 331}
{"train_info/time_between_train_steps": 0.005167722702026367, "step": 331}
{"info/global_step": 332, "train_info/time_within_train_step": 24.78642749786377, "step": 332}
{"train_info/time_between_train_steps": 0.009940385818481445, "step": 332}
{"info/global_step": 333, "train_info/time_within_train_step": 24.806387901306152, "step": 333}
{"train_info/time_between_train_steps": 0.005073070526123047, "step": 333}
{"info/global_step": 334, "train_info/time_within_train_step": 24.800675630569458, "step": 334}
{"train_info/time_between_train_steps": 0.006314277648925781, "step": 334}
{"info/global_step": 335, "train_info/time_within_train_step": 24.784570693969727, "step": 335}
{"train_info/time_between_train_steps": 0.005192279815673828, "step": 335}
{"info/global_step": 336, "train_info/time_within_train_step": 24.79302740097046, "step": 336}
{"train_info/time_between_train_steps": 0.005144596099853516, "step": 336}
{"info/global_step": 337, "train_info/time_within_train_step": 24.857619047164917, "step": 337}
{"train_info/time_between_train_steps": 0.009546756744384766, "step": 337}
{"info/global_step": 338, "train_info/time_within_train_step": 24.81925630569458, "step": 338}
{"train_info/time_between_train_steps": 0.006640195846557617, "step": 338}
{"info/global_step": 339, "train_info/time_within_train_step": 24.91418480873108, "step": 339}
{"train_info/time_between_train_steps": 0.005690336227416992, "step": 339}
{"info/global_step": 340, "train_info/time_within_train_step": 24.825390338897705, "step": 340}
{"train_info/time_between_train_steps": 0.006498098373413086, "step": 340}
{"train_info/time_between_train_steps": 5.33832573890686, "step": 340}
{"info/global_step": 341, "train_info/time_within_train_step": 24.77650260925293, "step": 341}
{"train_info/time_between_train_steps": 0.00496220588684082, "step": 341}
{"info/global_step": 342, "train_info/time_within_train_step": 24.924341678619385, "step": 342}
{"train_info/time_between_train_steps": 0.005264997482299805, "step": 342}
{"info/global_step": 343, "train_info/time_within_train_step": 24.873985052108765, "step": 343}
{"train_info/time_between_train_steps": 0.005262851715087891, "step": 343}
{"info/global_step": 344, "train_info/time_within_train_step": 24.904863595962524, "step": 344}
{"train_info/time_between_train_steps": 0.005248069763183594, "step": 344}
{"info/global_step": 345, "train_info/time_within_train_step": 24.79253125190735, "step": 345}
{"train_info/time_between_train_steps": 0.005388736724853516, "step": 345}
{"info/global_step": 346, "train_info/time_within_train_step": 24.963209867477417, "step": 346}
{"train_info/time_between_train_steps": 0.0054514408111572266, "step": 346}
{"info/global_step": 347, "train_info/time_within_train_step": 24.818541288375854, "step": 347}
{"train_info/time_between_train_steps": 0.00512242317199707, "step": 347}
{"info/global_step": 348, "train_info/time_within_train_step": 24.946448802947998, "step": 348}
{"train_info/time_between_train_steps": 0.005311250686645508, "step": 348}
{"info/global_step": 349, "train_info/time_within_train_step": 24.775137662887573, "step": 349}
{"train_info/time_between_train_steps": 0.005247354507446289, "step": 349}
{"info/global_step": 350, "train_info/time_within_train_step": 24.89706540107727, "step": 350}
{"train_info": {"train_info/memory_allocated": 1581.5546875, "train_info/memory_max_allocated": 18057.0224609375, "train_info/memory_reserved": 19104.0, "train_info/memory_max_reserved": 19104.0, "_timestamp": 1740928880, "_runtime": 8791}, "step": 350}
{"logs": {"train/loss": 3.8366, "train/learning_rate": 0.00047222222222222224, "train/epoch": 10.01, "_timestamp": 1740928880, "_runtime": 8791}, "step": 350}
{"train_info/time_between_train_steps": 0.008573293685913086, "step": 350}
{"info/global_step": 351, "train_info/time_within_train_step": 24.778045892715454, "step": 351}
{"train_info/time_between_train_steps": 0.0065042972564697266, "step": 351}
{"info/global_step": 352, "train_info/time_within_train_step": 24.923688173294067, "step": 352}
{"train_info/time_between_train_steps": 0.0053789615631103516, "step": 352}
{"info/global_step": 353, "train_info/time_within_train_step": 24.942675590515137, "step": 353}
{"train_info/time_between_train_steps": 0.00513458251953125, "step": 353}
{"info/global_step": 354, "train_info/time_within_train_step": 24.849465370178223, "step": 354}
{"train_info/time_between_train_steps": 0.005452394485473633, "step": 354}
{"info/global_step": 355, "train_info/time_within_train_step": 24.795753955841064, "step": 355}
{"train_info/time_between_train_steps": 0.0050351619720458984, "step": 355}
{"info/global_step": 356, "train_info/time_within_train_step": 24.766928911209106, "step": 356}
{"train_info/time_between_train_steps": 0.010047197341918945, "step": 356}
{"info/global_step": 357, "train_info/time_within_train_step": 24.748886346817017, "step": 357}
{"train_info/time_between_train_steps": 0.009888410568237305, "step": 357}
{"info/global_step": 358, "train_info/time_within_train_step": 24.76164150238037, "step": 358}
{"train_info/time_between_train_steps": 0.005264997482299805, "step": 358}
{"info/global_step": 359, "train_info/time_within_train_step": 24.850462436676025, "step": 359}
{"train_info/time_between_train_steps": 0.00500798225402832, "step": 359}
{"info/global_step": 360, "train_info/time_within_train_step": 24.78079891204834, "step": 360}
{"train_info/time_between_train_steps": 0.005026102066040039, "step": 360}
{"info/global_step": 361, "train_info/time_within_train_step": 24.771502017974854, "step": 361}
{"train_info/time_between_train_steps": 0.005356311798095703, "step": 361}
{"info/global_step": 362, "train_info/time_within_train_step": 24.776998281478882, "step": 362}
{"train_info/time_between_train_steps": 0.00504302978515625, "step": 362}
{"info/global_step": 363, "train_info/time_within_train_step": 24.77822256088257, "step": 363}
{"train_info/time_between_train_steps": 0.00507354736328125, "step": 363}
{"info/global_step": 364, "train_info/time_within_train_step": 24.79934334754944, "step": 364}
{"train_info/time_between_train_steps": 0.005343198776245117, "step": 364}
{"info/global_step": 365, "train_info/time_within_train_step": 24.804238080978394, "step": 365}
{"train_info/time_between_train_steps": 0.005114078521728516, "step": 365}
{"info/global_step": 366, "train_info/time_within_train_step": 24.80504536628723, "step": 366}
{"train_info/time_between_train_steps": 0.005128383636474609, "step": 366}
{"info/global_step": 367, "train_info/time_within_train_step": 24.802382469177246, "step": 367}
{"train_info/time_between_train_steps": 0.0051076412200927734, "step": 367}
{"info/global_step": 368, "train_info/time_within_train_step": 24.784708261489868, "step": 368}
{"train_info/time_between_train_steps": 0.010445594787597656, "step": 368}
{"info/global_step": 369, "train_info/time_within_train_step": 24.802082777023315, "step": 369}
{"train_info/time_between_train_steps": 0.005181789398193359, "step": 369}
{"info/global_step": 370, "train_info/time_within_train_step": 24.79573106765747, "step": 370}
{"train_info/time_between_train_steps": 0.005149126052856445, "step": 370}
{"info/global_step": 371, "train_info/time_within_train_step": 24.790525197982788, "step": 371}
{"train_info/time_between_train_steps": 0.0054302215576171875, "step": 371}
{"info/global_step": 372, "train_info/time_within_train_step": 24.807286739349365, "step": 372}
{"train_info/time_between_train_steps": 0.0052263736724853516, "step": 372}
{"info/global_step": 373, "train_info/time_within_train_step": 24.830692291259766, "step": 373}
{"train_info/time_between_train_steps": 0.005610942840576172, "step": 373}
{"info/global_step": 374, "train_info/time_within_train_step": 24.909169912338257, "step": 374}
{"train_info/time_between_train_steps": 0.010457992553710938, "step": 374}
{"train_info/time_between_train_steps": 4.9893128871917725, "step": 374}
{"info/global_step": 375, "train_info/time_within_train_step": 24.964081048965454, "step": 375}
{"train_info/time_between_train_steps": 0.00506138801574707, "step": 375}
{"info/global_step": 376, "train_info/time_within_train_step": 24.95251727104187, "step": 376}
{"train_info/time_between_train_steps": 0.005346059799194336, "step": 376}
{"info/global_step": 377, "train_info/time_within_train_step": 24.9051673412323, "step": 377}
{"train_info/time_between_train_steps": 0.005581378936767578, "step": 377}
{"info/global_step": 378, "train_info/time_within_train_step": 24.915474891662598, "step": 378}
{"train_info/time_between_train_steps": 0.005319118499755859, "step": 378}
{"info/global_step": 379, "train_info/time_within_train_step": 24.81519079208374, "step": 379}
{"train_info/time_between_train_steps": 0.005273342132568359, "step": 379}
{"info/global_step": 380, "train_info/time_within_train_step": 24.970443964004517, "step": 380}
{"train_info/time_between_train_steps": 0.0054056644439697266, "step": 380}
{"info/global_step": 381, "train_info/time_within_train_step": 24.825338125228882, "step": 381}
{"train_info/time_between_train_steps": 0.00531458854675293, "step": 381}
{"info/global_step": 382, "train_info/time_within_train_step": 24.972851037979126, "step": 382}
{"train_info/time_between_train_steps": 0.005262613296508789, "step": 382}
{"info/global_step": 383, "train_info/time_within_train_step": 24.8069007396698, "step": 383}
{"train_info/time_between_train_steps": 0.005461931228637695, "step": 383}
{"info/global_step": 384, "train_info/time_within_train_step": 24.96416425704956, "step": 384}
{"train_info/time_between_train_steps": 0.005216121673583984, "step": 384}
{"info/global_step": 385, "train_info/time_within_train_step": 24.794286727905273, "step": 385}
{"train_info/time_between_train_steps": 0.005330562591552734, "step": 385}
{"info/global_step": 386, "train_info/time_within_train_step": 24.92258310317993, "step": 386}
{"train_info/time_between_train_steps": 0.005496501922607422, "step": 386}
{"info/global_step": 387, "train_info/time_within_train_step": 24.833847284317017, "step": 387}
{"train_info/time_between_train_steps": 0.005650043487548828, "step": 387}
{"info/global_step": 388, "train_info/time_within_train_step": 24.894766569137573, "step": 388}
{"train_info/time_between_train_steps": 0.005393028259277344, "step": 388}
{"info/global_step": 389, "train_info/time_within_train_step": 24.847748279571533, "step": 389}
{"train_info/time_between_train_steps": 0.00510406494140625, "step": 389}
{"info/global_step": 390, "train_info/time_within_train_step": 24.89688467979431, "step": 390}
{"train_info/time_between_train_steps": 0.005256175994873047, "step": 390}
{"info/global_step": 391, "train_info/time_within_train_step": 24.792823314666748, "step": 391}
{"train_info/time_between_train_steps": 0.005090951919555664, "step": 391}
{"info/global_step": 392, "train_info/time_within_train_step": 24.80779457092285, "step": 392}
{"train_info/time_between_train_steps": 0.009867191314697266, "step": 392}
{"info/global_step": 393, "train_info/time_within_train_step": 24.805888652801514, "step": 393}
{"train_info/time_between_train_steps": 0.005103588104248047, "step": 393}
{"info/global_step": 394, "train_info/time_within_train_step": 24.800689935684204, "step": 394}
{"train_info/time_between_train_steps": 0.005031108856201172, "step": 394}
{"info/global_step": 395, "train_info/time_within_train_step": 24.789403200149536, "step": 395}
{"train_info/time_between_train_steps": 0.0050640106201171875, "step": 395}
{"info/global_step": 396, "train_info/time_within_train_step": 24.798469066619873, "step": 396}
{"train_info/time_between_train_steps": 0.005300760269165039, "step": 396}
{"info/global_step": 397, "train_info/time_within_train_step": 24.770126342773438, "step": 397}
{"train_info/time_between_train_steps": 0.008365631103515625, "step": 397}
{"info/global_step": 398, "train_info/time_within_train_step": 24.771175146102905, "step": 398}
{"train_info/time_between_train_steps": 0.005239963531494141, "step": 398}
{"info/global_step": 399, "train_info/time_within_train_step": 24.780751943588257, "step": 399}
{"train_info/time_between_train_steps": 0.005281209945678711, "step": 399}
{"info/global_step": 400, "train_info/time_within_train_step": 24.813451766967773, "step": 400}
{"train_info": {"train_info/memory_allocated": 1581.5546875, "train_info/memory_max_allocated": 18057.0224609375, "train_info/memory_reserved": 19104.0, "train_info/memory_max_reserved": 19104.0, "_timestamp": 1740930127, "_runtime": 10038}, "step": 400}
{"logs": {"train/loss": 3.6473, "train/learning_rate": 0.00044444444444444436, "train/epoch": 11.02, "_timestamp": 1740930127, "_runtime": 10038}, "step": 400}
{"train_info/time_between_train_steps": 11.137678623199463, "step": 400}
{"info/global_step": 401, "train_info/time_within_train_step": 24.78366231918335, "step": 401}
{"train_info/time_between_train_steps": 0.00490570068359375, "step": 401}
{"info/global_step": 402, "train_info/time_within_train_step": 24.788341522216797, "step": 402}
{"train_info/time_between_train_steps": 0.005354881286621094, "step": 402}
{"info/global_step": 403, "train_info/time_within_train_step": 24.785059452056885, "step": 403}
{"train_info/time_between_train_steps": 0.0051021575927734375, "step": 403}
{"info/global_step": 404, "train_info/time_within_train_step": 24.775449514389038, "step": 404}
{"train_info/time_between_train_steps": 0.005113840103149414, "step": 404}
{"info/global_step": 405, "train_info/time_within_train_step": 24.822643041610718, "step": 405}
{"train_info/time_between_train_steps": 0.005402565002441406, "step": 405}
{"info/global_step": 406, "train_info/time_within_train_step": 24.879587650299072, "step": 406}
{"train_info/time_between_train_steps": 0.005223751068115234, "step": 406}
{"info/global_step": 407, "train_info/time_within_train_step": 24.815365314483643, "step": 407}
{"train_info/time_between_train_steps": 0.005711555480957031, "step": 407}
{"info/global_step": 408, "train_info/time_within_train_step": 24.884169101715088, "step": 408}
{"train_info/time_between_train_steps": 0.00611567497253418, "step": 408}
{"train_info/time_between_train_steps": 5.239779710769653, "step": 408}
{"info/global_step": 409, "train_info/time_within_train_step": 24.792282581329346, "step": 409}
{"train_info/time_between_train_steps": 0.0049648284912109375, "step": 409}
{"info/global_step": 410, "train_info/time_within_train_step": 24.9403133392334, "step": 410}
{"train_info/time_between_train_steps": 0.0052144527435302734, "step": 410}
{"info/global_step": 411, "train_info/time_within_train_step": 24.81127119064331, "step": 411}
{"train_info/time_between_train_steps": 0.005258321762084961, "step": 411}
{"info/global_step": 412, "train_info/time_within_train_step": 24.936562299728394, "step": 412}
{"train_info/time_between_train_steps": 0.006247758865356445, "step": 412}
{"info/global_step": 413, "train_info/time_within_train_step": 24.813117265701294, "step": 413}
{"train_info/time_between_train_steps": 0.005248069763183594, "step": 413}
{"info/global_step": 414, "train_info/time_within_train_step": 24.981440782546997, "step": 414}
{"train_info/time_between_train_steps": 0.005357980728149414, "step": 414}
{"info/global_step": 415, "train_info/time_within_train_step": 24.829511642456055, "step": 415}
{"train_info/time_between_train_steps": 0.005358695983886719, "step": 415}
{"info/global_step": 416, "train_info/time_within_train_step": 24.93358588218689, "step": 416}
{"train_info/time_between_train_steps": 0.005255699157714844, "step": 416}
{"info/global_step": 417, "train_info/time_within_train_step": 24.817995309829712, "step": 417}
{"train_info/time_between_train_steps": 0.005614280700683594, "step": 417}
{"info/global_step": 418, "train_info/time_within_train_step": 25.101074695587158, "step": 418}
{"train_info/time_between_train_steps": 0.0062503814697265625, "step": 418}
{"info/global_step": 419, "train_info/time_within_train_step": 24.787944316864014, "step": 419}
{"train_info/time_between_train_steps": 0.00511479377746582, "step": 419}
{"info/global_step": 420, "train_info/time_within_train_step": 24.98177981376648, "step": 420}
{"train_info/time_between_train_steps": 0.005344390869140625, "step": 420}
{"info/global_step": 421, "train_info/time_within_train_step": 24.909952640533447, "step": 421}
{"train_info/time_between_train_steps": 0.005440711975097656, "step": 421}
{"info/global_step": 422, "train_info/time_within_train_step": 24.928460359573364, "step": 422}
{"train_info/time_between_train_steps": 0.005300998687744141, "step": 422}
{"info/global_step": 423, "train_info/time_within_train_step": 24.817472219467163, "step": 423}
{"train_info/time_between_train_steps": 0.010044574737548828, "step": 423}
{"info/global_step": 424, "train_info/time_within_train_step": 24.81159281730652, "step": 424}
{"train_info/time_between_train_steps": 0.005955934524536133, "step": 424}
{"info/global_step": 425, "train_info/time_within_train_step": 24.786867141723633, "step": 425}
{"train_info/time_between_train_steps": 0.004973173141479492, "step": 425}
{"info/global_step": 426, "train_info/time_within_train_step": 24.77848982810974, "step": 426}
{"train_info/time_between_train_steps": 0.005137920379638672, "step": 426}
{"info/global_step": 427, "train_info/time_within_train_step": 24.793366193771362, "step": 427}
{"train_info/time_between_train_steps": 0.005142688751220703, "step": 427}
{"info/global_step": 428, "train_info/time_within_train_step": 24.78955864906311, "step": 428}
{"train_info/time_between_train_steps": 0.005045413970947266, "step": 428}
{"info/global_step": 429, "train_info/time_within_train_step": 24.800957441329956, "step": 429}
{"train_info/time_between_train_steps": 0.005088090896606445, "step": 429}
{"info/global_step": 430, "train_info/time_within_train_step": 24.79424500465393, "step": 430}
{"train_info/time_between_train_steps": 0.0051877498626708984, "step": 430}
{"info/global_step": 431, "train_info/time_within_train_step": 24.80604338645935, "step": 431}
{"train_info/time_between_train_steps": 0.005141496658325195, "step": 431}
{"info/global_step": 432, "train_info/time_within_train_step": 24.81227684020996, "step": 432}
{"train_info/time_between_train_steps": 0.005308866500854492, "step": 432}
{"info/global_step": 433, "train_info/time_within_train_step": 24.84263300895691, "step": 433}
{"train_info/time_between_train_steps": 0.005182504653930664, "step": 433}
{"info/global_step": 434, "train_info/time_within_train_step": 24.807866096496582, "step": 434}
{"train_info/time_between_train_steps": 0.005132436752319336, "step": 434}
{"info/global_step": 435, "train_info/time_within_train_step": 24.804181337356567, "step": 435}
{"train_info/time_between_train_steps": 0.0051577091217041016, "step": 435}
{"info/global_step": 436, "train_info/time_within_train_step": 24.797430992126465, "step": 436}
{"train_info/time_between_train_steps": 0.0053560733795166016, "step": 436}
{"info/global_step": 437, "train_info/time_within_train_step": 24.892083168029785, "step": 437}
{"train_info/time_between_train_steps": 0.005127429962158203, "step": 437}
{"info/global_step": 438, "train_info/time_within_train_step": 24.806618213653564, "step": 438}
{"train_info/time_between_train_steps": 0.00525665283203125, "step": 438}
{"info/global_step": 439, "train_info/time_within_train_step": 24.82013964653015, "step": 439}
{"train_info/time_between_train_steps": 0.005313396453857422, "step": 439}
{"info/global_step": 440, "train_info/time_within_train_step": 24.816996812820435, "step": 440}
{"train_info/time_between_train_steps": 0.0053827762603759766, "step": 440}
{"info/global_step": 441, "train_info/time_within_train_step": 24.814340353012085, "step": 441}
{"train_info/time_between_train_steps": 0.005658626556396484, "step": 441}
{"info/global_step": 442, "train_info/time_within_train_step": 24.846220016479492, "step": 442}
{"train_info/time_between_train_steps": 0.011626243591308594, "step": 442}
{"train_info/time_between_train_steps": 5.414006233215332, "step": 442}
{"info/global_step": 443, "train_info/time_within_train_step": 24.82495951652527, "step": 443}
{"train_info/time_between_train_steps": 0.004820823669433594, "step": 443}
{"info/global_step": 444, "train_info/time_within_train_step": 24.834421396255493, "step": 444}
{"train_info/time_between_train_steps": 0.009674310684204102, "step": 444}
{"info/global_step": 445, "train_info/time_within_train_step": 24.739858865737915, "step": 445}
{"train_info/time_between_train_steps": 0.0052564144134521484, "step": 445}
{"info/global_step": 446, "train_info/time_within_train_step": 24.86435317993164, "step": 446}
{"train_info/time_between_train_steps": 0.010225534439086914, "step": 446}
{"info/global_step": 447, "train_info/time_within_train_step": 24.735960483551025, "step": 447}
{"train_info/time_between_train_steps": 0.00515294075012207, "step": 447}
{"info/global_step": 448, "train_info/time_within_train_step": 24.87696361541748, "step": 448}
{"train_info/time_between_train_steps": 0.005387067794799805, "step": 448}
{"info/global_step": 449, "train_info/time_within_train_step": 24.74665641784668, "step": 449}
{"train_info/time_between_train_steps": 0.0053369998931884766, "step": 449}
{"info/global_step": 450, "train_info/time_within_train_step": 24.846734762191772, "step": 450}
{"train_info": {"train_info/memory_allocated": 1581.5546875, "train_info/memory_max_allocated": 18057.0224609375, "train_info/memory_reserved": 19104.0, "train_info/memory_max_reserved": 19104.0, "_timestamp": 1740931391, "_runtime": 11302}, "step": 450}
{"logs": {"train/loss": 3.5171, "train/learning_rate": 0.00041666666666666664, "train/epoch": 13.01, "_timestamp": 1740931391, "_runtime": 11302}, "step": 450}
{"train_info/time_between_train_steps": 0.008594512939453125, "step": 450}
{"info/global_step": 451, "train_info/time_within_train_step": 24.74860143661499, "step": 451}
{"train_info/time_between_train_steps": 0.005511760711669922, "step": 451}
{"info/global_step": 452, "train_info/time_within_train_step": 24.888253927230835, "step": 452}
{"train_info/time_between_train_steps": 0.005250453948974609, "step": 452}
{"info/global_step": 453, "train_info/time_within_train_step": 24.82557964324951, "step": 453}
{"train_info/time_between_train_steps": 0.005226612091064453, "step": 453}
{"info/global_step": 454, "train_info/time_within_train_step": 24.893208742141724, "step": 454}
{"train_info/time_between_train_steps": 0.00529932975769043, "step": 454}
{"info/global_step": 455, "train_info/time_within_train_step": 24.753715753555298, "step": 455}
{"train_info/time_between_train_steps": 0.005387306213378906, "step": 455}
{"info/global_step": 456, "train_info/time_within_train_step": 24.807571172714233, "step": 456}
{"train_info/time_between_train_steps": 0.005719423294067383, "step": 456}
{"info/global_step": 457, "train_info/time_within_train_step": 24.745986700057983, "step": 457}
{"train_info/time_between_train_steps": 0.004956245422363281, "step": 457}
{"info/global_step": 458, "train_info/time_within_train_step": 24.730358600616455, "step": 458}
{"train_info/time_between_train_steps": 0.0050237178802490234, "step": 458}
{"info/global_step": 459, "train_info/time_within_train_step": 24.73230791091919, "step": 459}
{"train_info/time_between_train_steps": 0.004865884780883789, "step": 459}
{"info/global_step": 460, "train_info/time_within_train_step": 24.72532606124878, "step": 460}
{"train_info/time_between_train_steps": 0.0050203800201416016, "step": 460}
{"info/global_step": 461, "train_info/time_within_train_step": 24.734665632247925, "step": 461}
{"train_info/time_between_train_steps": 0.005057811737060547, "step": 461}
{"info/global_step": 462, "train_info/time_within_train_step": 24.728516340255737, "step": 462}
{"train_info/time_between_train_steps": 0.004925727844238281, "step": 462}
{"info/global_step": 463, "train_info/time_within_train_step": 24.729544401168823, "step": 463}
{"train_info/time_between_train_steps": 0.004983425140380859, "step": 463}
{"info/global_step": 464, "train_info/time_within_train_step": 24.731744050979614, "step": 464}
{"train_info/time_between_train_steps": 0.005100727081298828, "step": 464}
{"info/global_step": 465, "train_info/time_within_train_step": 24.73421335220337, "step": 465}
{"train_info/time_between_train_steps": 0.004979372024536133, "step": 465}
{"info/global_step": 466, "train_info/time_within_train_step": 24.747792959213257, "step": 466}
{"train_info/time_between_train_steps": 0.00509953498840332, "step": 466}
{"info/global_step": 467, "train_info/time_within_train_step": 24.74287438392639, "step": 467}
{"train_info/time_between_train_steps": 0.00507807731628418, "step": 467}
{"info/global_step": 468, "train_info/time_within_train_step": 24.828445196151733, "step": 468}
{"train_info/time_between_train_steps": 0.004930019378662109, "step": 468}
{"info/global_step": 469, "train_info/time_within_train_step": 24.738059282302856, "step": 469}
{"train_info/time_between_train_steps": 0.005066871643066406, "step": 469}
{"info/global_step": 470, "train_info/time_within_train_step": 24.75226354598999, "step": 470}
{"train_info/time_between_train_steps": 0.005162239074707031, "step": 470}
{"info/global_step": 471, "train_info/time_within_train_step": 24.73556637763977, "step": 471}
{"train_info/time_between_train_steps": 0.0049703121185302734, "step": 471}
{"info/global_step": 472, "train_info/time_within_train_step": 24.750807762145996, "step": 472}
{"train_info/time_between_train_steps": 0.004983663558959961, "step": 472}
{"info/global_step": 473, "train_info/time_within_train_step": 24.74091148376465, "step": 473}
{"train_info/time_between_train_steps": 0.005080699920654297, "step": 473}
{"info/global_step": 474, "train_info/time_within_train_step": 24.744964838027954, "step": 474}
{"train_info/time_between_train_steps": 0.005034923553466797, "step": 474}
{"info/global_step": 475, "train_info/time_within_train_step": 24.752630472183228, "step": 475}
{"train_info/time_between_train_steps": 0.005707740783691406, "step": 475}
{"info/global_step": 476, "train_info/time_within_train_step": 24.784889459609985, "step": 476}
{"train_info/time_between_train_steps": 0.006243467330932617, "step": 476}
{"train_info/time_between_train_steps": 5.032876014709473, "step": 476}
{"info/global_step": 477, "train_info/time_within_train_step": 24.730415105819702, "step": 477}
{"train_info/time_between_train_steps": 0.0048367977142333984, "step": 477}
{"info/global_step": 478, "train_info/time_within_train_step": 24.83672857284546, "step": 478}
{"train_info/time_between_train_steps": 0.005320072174072266, "step": 478}
{"info/global_step": 479, "train_info/time_within_train_step": 24.86903715133667, "step": 479}
{"train_info/time_between_train_steps": 0.00531005859375, "step": 479}
{"info/global_step": 480, "train_info/time_within_train_step": 24.886587619781494, "step": 480}
{"train_info/time_between_train_steps": 0.0052525997161865234, "step": 480}
{"info/global_step": 481, "train_info/time_within_train_step": 24.742173433303833, "step": 481}
{"train_info/time_between_train_steps": 0.005126237869262695, "step": 481}
{"info/global_step": 482, "train_info/time_within_train_step": 24.87625813484192, "step": 482}
{"train_info/time_between_train_steps": 0.00510859489440918, "step": 482}
{"info/global_step": 483, "train_info/time_within_train_step": 24.76005983352661, "step": 483}
{"train_info/time_between_train_steps": 0.005323171615600586, "step": 483}
{"info/global_step": 484, "train_info/time_within_train_step": 24.947060346603394, "step": 484}
{"train_info/time_between_train_steps": 0.005007743835449219, "step": 484}
{"info/global_step": 485, "train_info/time_within_train_step": 24.746174812316895, "step": 485}
{"train_info/time_between_train_steps": 0.005268573760986328, "step": 485}
{"info/global_step": 486, "train_info/time_within_train_step": 24.908496856689453, "step": 486}
{"train_info/time_between_train_steps": 0.007180929183959961, "step": 486}
{"info/global_step": 487, "train_info/time_within_train_step": 24.74640917778015, "step": 487}
{"train_info/time_between_train_steps": 0.006108999252319336, "step": 487}
{"info/global_step": 488, "train_info/time_within_train_step": 24.86616849899292, "step": 488}
{"train_info/time_between_train_steps": 0.008221864700317383, "step": 488}
{"info/global_step": 489, "train_info/time_within_train_step": 24.753028392791748, "step": 489}
{"train_info/time_between_train_steps": 0.00577092170715332, "step": 489}
{"info/global_step": 490, "train_info/time_within_train_step": 24.81719422340393, "step": 490}
{"train_info/time_between_train_steps": 0.005046844482421875, "step": 490}
{"info/global_step": 491, "train_info/time_within_train_step": 24.739073753356934, "step": 491}
{"train_info/time_between_train_steps": 0.004851341247558594, "step": 491}
{"info/global_step": 492, "train_info/time_within_train_step": 24.733224391937256, "step": 492}
{"train_info/time_between_train_steps": 0.005156517028808594, "step": 492}
{"info/global_step": 493, "train_info/time_within_train_step": 24.723057985305786, "step": 493}
{"train_info/time_between_train_steps": 0.004927635192871094, "step": 493}
{"info/global_step": 494, "train_info/time_within_train_step": 24.72390913963318, "step": 494}
{"train_info/time_between_train_steps": 0.004976749420166016, "step": 494}
{"info/global_step": 495, "train_info/time_within_train_step": 24.725364923477173, "step": 495}
{"train_info/time_between_train_steps": 0.0050852298736572266, "step": 495}
{"info/global_step": 496, "train_info/time_within_train_step": 24.72523546218872, "step": 496}
{"train_info/time_between_train_steps": 0.0051250457763671875, "step": 496}
{"info/global_step": 497, "train_info/time_within_train_step": 24.72676658630371, "step": 497}
{"train_info/time_between_train_steps": 0.005067348480224609, "step": 497}
{"info/global_step": 498, "train_info/time_within_train_step": 24.72576117515564, "step": 498}
{"train_info/time_between_train_steps": 0.005059242248535156, "step": 498}
{"info/global_step": 499, "train_info/time_within_train_step": 24.81786346435547, "step": 499}
{"train_info/time_between_train_steps": 0.005185842514038086, "step": 499}
{"info/global_step": 500, "train_info/time_within_train_step": 24.72909951210022, "step": 500}
{"train_info": {"train_info/memory_allocated": 1581.5546875, "train_info/memory_max_allocated": 18057.0224609375, "train_info/memory_reserved": 19104.0, "train_info/memory_max_reserved": 19104.0, "_timestamp": 1740932635, "_runtime": 12546}, "step": 500}
{"logs": {"train/loss": 3.4001, "train/learning_rate": 0.00038888888888888887, "train/epoch": 14.02, "_timestamp": 1740932635, "_runtime": 12546}, "step": 500}
{"train_info/time_between_train_steps": 11.050783395767212, "step": 500}
{"info/global_step": 501, "train_info/time_within_train_step": 24.735695362091064, "step": 501}
{"train_info/time_between_train_steps": 0.005060911178588867, "step": 501}
{"info/global_step": 502, "train_info/time_within_train_step": 24.73281216621399, "step": 502}
{"train_info/time_between_train_steps": 0.006168842315673828, "step": 502}
{"info/global_step": 503, "train_info/time_within_train_step": 24.72135639190674, "step": 503}
{"train_info/time_between_train_steps": 0.004900932312011719, "step": 503}
{"info/global_step": 504, "train_info/time_within_train_step": 24.735851287841797, "step": 504}
{"train_info/time_between_train_steps": 0.005036354064941406, "step": 504}
{"info/global_step": 505, "train_info/time_within_train_step": 24.74500799179077, "step": 505}
{"train_info/time_between_train_steps": 0.005158185958862305, "step": 505}
{"info/global_step": 506, "train_info/time_within_train_step": 24.729644775390625, "step": 506}
{"train_info/time_between_train_steps": 0.004931449890136719, "step": 506}
{"info/global_step": 507, "train_info/time_within_train_step": 24.73720645904541, "step": 507}
{"train_info/time_between_train_steps": 0.0050885677337646484, "step": 507}
{"info/global_step": 508, "train_info/time_within_train_step": 24.74003005027771, "step": 508}
{"train_info/time_between_train_steps": 0.005272865295410156, "step": 508}
{"info/global_step": 509, "train_info/time_within_train_step": 24.74204134941101, "step": 509}
{"train_info/time_between_train_steps": 0.006211519241333008, "step": 509}
{"info/global_step": 510, "train_info/time_within_train_step": 24.766363620758057, "step": 510}
{"train_info/time_between_train_steps": 0.005719184875488281, "step": 510}
{"train_info/time_between_train_steps": 5.07897162437439, "step": 510}
{"info/global_step": 511, "train_info/time_within_train_step": 24.722623825073242, "step": 511}
{"train_info/time_between_train_steps": 0.004917144775390625, "step": 511}
{"info/global_step": 512, "train_info/time_within_train_step": 24.82223153114319, "step": 512}
{"train_info/time_between_train_steps": 0.0048296451568603516, "step": 512}
{"info/global_step": 513, "train_info/time_within_train_step": 24.718576908111572, "step": 513}
{"train_info/time_between_train_steps": 0.004772186279296875, "step": 513}
{"info/global_step": 514, "train_info/time_within_train_step": 24.89417576789856, "step": 514}
{"train_info/time_between_train_steps": 0.0051615238189697266, "step": 514}
{"info/global_step": 515, "train_info/time_within_train_step": 24.82546329498291, "step": 515}
{"train_info/time_between_train_steps": 0.0051708221435546875, "step": 515}
{"info/global_step": 516, "train_info/time_within_train_step": 24.856436252593994, "step": 516}
{"train_info/time_between_train_steps": 0.0050334930419921875, "step": 516}
{"info/global_step": 517, "train_info/time_within_train_step": 24.73845148086548, "step": 517}
{"train_info/time_between_train_steps": 0.0053348541259765625, "step": 517}
{"info/global_step": 518, "train_info/time_within_train_step": 24.8877112865448, "step": 518}
{"train_info/time_between_train_steps": 0.005236387252807617, "step": 518}
{"info/global_step": 519, "train_info/time_within_train_step": 24.733855724334717, "step": 519}
{"train_info/time_between_train_steps": 0.005118846893310547, "step": 519}
{"info/global_step": 520, "train_info/time_within_train_step": 24.880034923553467, "step": 520}
{"train_info/time_between_train_steps": 0.004969358444213867, "step": 520}
{"info/global_step": 521, "train_info/time_within_train_step": 24.736340522766113, "step": 521}
{"train_info/time_between_train_steps": 0.005265235900878906, "step": 521}
{"info/global_step": 522, "train_info/time_within_train_step": 24.97746515274048, "step": 522}
{"train_info/time_between_train_steps": 0.005113840103149414, "step": 522}
{"info/global_step": 523, "train_info/time_within_train_step": 24.733543395996094, "step": 523}
{"train_info/time_between_train_steps": 0.010438919067382812, "step": 523}
{"info/global_step": 524, "train_info/time_within_train_step": 24.815750122070312, "step": 524}
{"train_info/time_between_train_steps": 0.005214691162109375, "step": 524}
{"info/global_step": 525, "train_info/time_within_train_step": 24.73849391937256, "step": 525}
{"train_info/time_between_train_steps": 0.004815816879272461, "step": 525}
{"info/global_step": 526, "train_info/time_within_train_step": 24.732134342193604, "step": 526}
{"train_info/time_between_train_steps": 0.004904747009277344, "step": 526}
{"info/global_step": 527, "train_info/time_within_train_step": 24.729625701904297, "step": 527}
{"train_info/time_between_train_steps": 0.005032539367675781, "step": 527}
{"info/global_step": 528, "train_info/time_within_train_step": 24.729934453964233, "step": 528}
{"train_info/time_between_train_steps": 0.0051097869873046875, "step": 528}
{"info/global_step": 529, "train_info/time_within_train_step": 24.726181507110596, "step": 529}
{"train_info/time_between_train_steps": 0.0049893856048583984, "step": 529}
{"info/global_step": 530, "train_info/time_within_train_step": 24.73071265220642, "step": 530}
{"train_info/time_between_train_steps": 0.005387544631958008, "step": 530}
{"info/global_step": 531, "train_info/time_within_train_step": 24.815383911132812, "step": 531}
{"train_info/time_between_train_steps": 0.005011796951293945, "step": 531}
{"info/global_step": 532, "train_info/time_within_train_step": 24.73110270500183, "step": 532}
{"train_info/time_between_train_steps": 0.0050182342529296875, "step": 532}
{"info/global_step": 533, "train_info/time_within_train_step": 24.732877016067505, "step": 533}
{"train_info/time_between_train_steps": 0.0051648616790771484, "step": 533}
{"info/global_step": 534, "train_info/time_within_train_step": 24.729100942611694, "step": 534}
{"train_info/time_between_train_steps": 0.005078792572021484, "step": 534}
{"info/global_step": 535, "train_info/time_within_train_step": 24.735610008239746, "step": 535}
{"train_info/time_between_train_steps": 0.0050258636474609375, "step": 535}
{"info/global_step": 536, "train_info/time_within_train_step": 24.736294507980347, "step": 536}
{"train_info/time_between_train_steps": 0.005025148391723633, "step": 536}
{"info/global_step": 537, "train_info/time_within_train_step": 24.7318913936615, "step": 537}
{"train_info/time_between_train_steps": 0.005086660385131836, "step": 537}
{"info/global_step": 538, "train_info/time_within_train_step": 24.745845079421997, "step": 538}
{"train_info/time_between_train_steps": 0.005172252655029297, "step": 538}
{"info/global_step": 539, "train_info/time_within_train_step": 24.736580848693848, "step": 539}
{"train_info/time_between_train_steps": 0.005148172378540039, "step": 539}
{"info/global_step": 540, "train_info/time_within_train_step": 24.73138666152954, "step": 540}
{"train_info/time_between_train_steps": 0.005141258239746094, "step": 540}
{"info/global_step": 541, "train_info/time_within_train_step": 24.75002408027649, "step": 541}
{"train_info/time_between_train_steps": 0.005777597427368164, "step": 541}
{"info/global_step": 542, "train_info/time_within_train_step": 24.761563539505005, "step": 542}
{"train_info/time_between_train_steps": 0.005411386489868164, "step": 542}
{"info/global_step": 543, "train_info/time_within_train_step": 24.75631833076477, "step": 543}
{"train_info/time_between_train_steps": 0.0055522918701171875, "step": 543}
{"info/global_step": 544, "train_info/time_within_train_step": 24.827905893325806, "step": 544}
{"train_info/time_between_train_steps": 0.005743265151977539, "step": 544}
{"train_info/time_between_train_steps": 5.1736085414886475, "step": 544}
{"info/global_step": 545, "train_info/time_within_train_step": 24.74317741394043, "step": 545}
{"train_info/time_between_train_steps": 0.005538463592529297, "step": 545}
{"info/global_step": 546, "train_info/time_within_train_step": 24.952776670455933, "step": 546}
{"train_info/time_between_train_steps": 0.00516200065612793, "step": 546}
{"info/global_step": 547, "train_info/time_within_train_step": 24.739448308944702, "step": 547}
{"train_info/time_between_train_steps": 0.00526881217956543, "step": 547}
{"info/global_step": 548, "train_info/time_within_train_step": 24.97725772857666, "step": 548}
{"train_info/time_between_train_steps": 0.005197763442993164, "step": 548}
{"info/global_step": 549, "train_info/time_within_train_step": 24.751278400421143, "step": 549}
{"train_info/time_between_train_steps": 0.005230426788330078, "step": 549}
{"info/global_step": 550, "train_info/time_within_train_step": 24.860200881958008, "step": 550}
{"train_info": {"train_info/memory_allocated": 1581.5546875, "train_info/memory_max_allocated": 18057.0224609375, "train_info/memory_reserved": 19104.0, "train_info/memory_max_reserved": 19104.0, "_timestamp": 1740933896, "_runtime": 13807}, "step": 550}
{"logs": {"train/loss": 3.3159, "train/learning_rate": 0.0003611111111111111, "train/epoch": 16.0, "_timestamp": 1740933896, "_runtime": 13807}, "step": 550}
{"train_info/time_between_train_steps": 0.008715152740478516, "step": 550}
{"info/global_step": 551, "train_info/time_within_train_step": 24.746137380599976, "step": 551}
{"train_info/time_between_train_steps": 0.010048389434814453, "step": 551}
{"info/global_step": 552, "train_info/time_within_train_step": 24.895694732666016, "step": 552}
{"train_info/time_between_train_steps": 0.0052068233489990234, "step": 552}
{"info/global_step": 553, "train_info/time_within_train_step": 24.739177942276, "step": 553}
{"train_info/time_between_train_steps": 0.0049800872802734375, "step": 553}
{"info/global_step": 554, "train_info/time_within_train_step": 24.86281442642212, "step": 554}
{"train_info/time_between_train_steps": 0.00501561164855957, "step": 554}
{"info/global_step": 555, "train_info/time_within_train_step": 24.763758420944214, "step": 555}
{"train_info/time_between_train_steps": 0.0064544677734375, "step": 555}
{"info/global_step": 556, "train_info/time_within_train_step": 24.861016273498535, "step": 556}
{"train_info/time_between_train_steps": 0.0051801204681396484, "step": 556}
{"info/global_step": 557, "train_info/time_within_train_step": 24.745590209960938, "step": 557}
{"train_info/time_between_train_steps": 0.005272388458251953, "step": 557}
{"info/global_step": 558, "train_info/time_within_train_step": 24.840539932250977, "step": 558}
{"train_info/time_between_train_steps": 0.005283832550048828, "step": 558}
{"info/global_step": 559, "train_info/time_within_train_step": 24.749847173690796, "step": 559}
{"train_info/time_between_train_steps": 0.004862308502197266, "step": 559}
{"info/global_step": 560, "train_info/time_within_train_step": 24.730200052261353, "step": 560}
{"train_info/time_between_train_steps": 0.005843639373779297, "step": 560}
{"info/global_step": 561, "train_info/time_within_train_step": 24.726398229599, "step": 561}
{"train_info/time_between_train_steps": 0.005164384841918945, "step": 561}
{"info/global_step": 562, "train_info/time_within_train_step": 24.81541156768799, "step": 562}
{"train_info/time_between_train_steps": 0.005097866058349609, "step": 562}
{"info/global_step": 563, "train_info/time_within_train_step": 24.72533893585205, "step": 563}
{"train_info/time_between_train_steps": 0.005089998245239258, "step": 563}
{"info/global_step": 564, "train_info/time_within_train_step": 24.726505994796753, "step": 564}
{"train_info/time_between_train_steps": 0.00515294075012207, "step": 564}
{"info/global_step": 565, "train_info/time_within_train_step": 24.735878467559814, "step": 565}
{"train_info/time_between_train_steps": 0.004971027374267578, "step": 565}
{"info/global_step": 566, "train_info/time_within_train_step": 24.7444326877594, "step": 566}
{"train_info/time_between_train_steps": 0.005130290985107422, "step": 566}
{"info/global_step": 567, "train_info/time_within_train_step": 24.731431245803833, "step": 567}
{"train_info/time_between_train_steps": 0.005333900451660156, "step": 567}
{"info/global_step": 568, "train_info/time_within_train_step": 24.732009887695312, "step": 568}
{"train_info/time_between_train_steps": 0.004997968673706055, "step": 568}
{"info/global_step": 569, "train_info/time_within_train_step": 24.73505926132202, "step": 569}
{"train_info/time_between_train_steps": 0.00491786003112793, "step": 569}
{"info/global_step": 570, "train_info/time_within_train_step": 24.72515344619751, "step": 570}
{"train_info/time_between_train_steps": 0.004885673522949219, "step": 570}
{"info/global_step": 571, "train_info/time_within_train_step": 24.732109785079956, "step": 571}
{"train_info/time_between_train_steps": 0.005010843276977539, "step": 571}
{"info/global_step": 572, "train_info/time_within_train_step": 24.735713005065918, "step": 572}
{"train_info/time_between_train_steps": 0.004961490631103516, "step": 572}
{"info/global_step": 573, "train_info/time_within_train_step": 24.741560220718384, "step": 573}
{"train_info/time_between_train_steps": 0.0049746036529541016, "step": 573}
{"info/global_step": 574, "train_info/time_within_train_step": 24.74082660675049, "step": 574}
{"train_info/time_between_train_steps": 0.005098104476928711, "step": 574}
{"info/global_step": 575, "train_info/time_within_train_step": 24.738784313201904, "step": 575}
{"train_info/time_between_train_steps": 0.005237102508544922, "step": 575}
{"info/global_step": 576, "train_info/time_within_train_step": 24.74478507041931, "step": 576}
{"train_info/time_between_train_steps": 0.005376100540161133, "step": 576}
{"info/global_step": 577, "train_info/time_within_train_step": 24.84718132019043, "step": 577}
{"train_info/time_between_train_steps": 0.005530357360839844, "step": 577}
{"info/global_step": 578, "train_info/time_within_train_step": 24.765311002731323, "step": 578}
{"train_info/time_between_train_steps": 0.00567936897277832, "step": 578}
{"train_info/time_between_train_steps": 4.9355857372283936, "step": 578}
{"info/global_step": 579, "train_info/time_within_train_step": 24.737181425094604, "step": 579}
{"train_info/time_between_train_steps": 0.0052661895751953125, "step": 579}
{"info/global_step": 580, "train_info/time_within_train_step": 24.884490489959717, "step": 580}
{"train_info/time_between_train_steps": 0.00521397590637207, "step": 580}
{"info/global_step": 581, "train_info/time_within_train_step": 24.738383531570435, "step": 581}
{"train_info/time_between_train_steps": 0.004940986633300781, "step": 581}
{"info/global_step": 582, "train_info/time_within_train_step": 24.864378452301025, "step": 582}
{"train_info/time_between_train_steps": 0.00521087646484375, "step": 582}
{"info/global_step": 583, "train_info/time_within_train_step": 24.750944137573242, "step": 583}
{"train_info/time_between_train_steps": 0.005465507507324219, "step": 583}
{"info/global_step": 584, "train_info/time_within_train_step": 24.864943981170654, "step": 584}
{"train_info/time_between_train_steps": 0.005135297775268555, "step": 584}
{"info/global_step": 585, "train_info/time_within_train_step": 24.73339295387268, "step": 585}
{"train_info/time_between_train_steps": 0.00512242317199707, "step": 585}
{"info/global_step": 586, "train_info/time_within_train_step": 24.901312112808228, "step": 586}
{"train_info/time_between_train_steps": 0.005237102508544922, "step": 586}
{"info/global_step": 587, "train_info/time_within_train_step": 24.736732482910156, "step": 587}
{"train_info/time_between_train_steps": 0.005091190338134766, "step": 587}
{"info/global_step": 588, "train_info/time_within_train_step": 24.854686498641968, "step": 588}
{"train_info/time_between_train_steps": 0.005001068115234375, "step": 588}
{"info/global_step": 589, "train_info/time_within_train_step": 24.744218349456787, "step": 589}
{"train_info/time_between_train_steps": 0.0054934024810791016, "step": 589}
{"info/global_step": 590, "train_info/time_within_train_step": 24.88955068588257, "step": 590}
{"train_info/time_between_train_steps": 0.005377769470214844, "step": 590}
{"info/global_step": 591, "train_info/time_within_train_step": 24.735609531402588, "step": 591}
{"train_info/time_between_train_steps": 0.005264997482299805, "step": 591}
{"info/global_step": 592, "train_info/time_within_train_step": 24.829589128494263, "step": 592}
{"train_info/time_between_train_steps": 0.005313396453857422, "step": 592}
{"info/global_step": 593, "train_info/time_within_train_step": 24.84942126274109, "step": 593}
{"train_info/time_between_train_steps": 0.004991769790649414, "step": 593}
{"info/global_step": 594, "train_info/time_within_train_step": 24.731983184814453, "step": 594}
{"train_info/time_between_train_steps": 0.004934549331665039, "step": 594}
{"info/global_step": 595, "train_info/time_within_train_step": 24.738008975982666, "step": 595}
{"train_info/time_between_train_steps": 0.005101919174194336, "step": 595}
{"info/global_step": 596, "train_info/time_within_train_step": 24.737871885299683, "step": 596}
{"train_info/time_between_train_steps": 0.005181312561035156, "step": 596}
{"info/global_step": 597, "train_info/time_within_train_step": 24.7321035861969, "step": 597}
{"train_info/time_between_train_steps": 0.005018472671508789, "step": 597}
{"info/global_step": 598, "train_info/time_within_train_step": 24.73089599609375, "step": 598}
{"train_info/time_between_train_steps": 0.005121469497680664, "step": 598}
{"info/global_step": 599, "train_info/time_within_train_step": 24.727961540222168, "step": 599}
{"train_info/time_between_train_steps": 0.005048274993896484, "step": 599}
{"info/global_step": 600, "train_info/time_within_train_step": 24.724239587783813, "step": 600}
{"train_info": {"train_info/memory_allocated": 1581.5546875, "train_info/memory_max_allocated": 18057.0224609375, "train_info/memory_reserved": 19104.0, "train_info/memory_max_reserved": 19104.0, "_timestamp": 1740935140, "_runtime": 15051}, "step": 600}
{"logs": {"train/loss": 3.2335, "train/learning_rate": 0.0003333333333333333, "train/epoch": 17.02, "_timestamp": 1740935140, "_runtime": 15051}, "step": 600}
{"train_info/time_between_train_steps": 11.08275842666626, "step": 600}
{"info/global_step": 601, "train_info/time_within_train_step": 24.715240478515625, "step": 601}
{"train_info/time_between_train_steps": 0.004802703857421875, "step": 601}
{"info/global_step": 602, "train_info/time_within_train_step": 24.727694272994995, "step": 602}
{"train_info/time_between_train_steps": 0.005124330520629883, "step": 602}
{"info/global_step": 603, "train_info/time_within_train_step": 24.731356620788574, "step": 603}
{"train_info/time_between_train_steps": 0.004884481430053711, "step": 603}
{"info/global_step": 604, "train_info/time_within_train_step": 24.731972217559814, "step": 604}
{"train_info/time_between_train_steps": 0.0049364566802978516, "step": 604}
{"info/global_step": 605, "train_info/time_within_train_step": 24.732810497283936, "step": 605}
{"train_info/time_between_train_steps": 0.010215282440185547, "step": 605}
{"info/global_step": 606, "train_info/time_within_train_step": 24.728954076766968, "step": 606}
{"train_info/time_between_train_steps": 0.005003213882446289, "step": 606}
{"info/global_step": 607, "train_info/time_within_train_step": 24.73045015335083, "step": 607}
{"train_info/time_between_train_steps": 0.004958152770996094, "step": 607}
{"info/global_step": 608, "train_info/time_within_train_step": 24.740942001342773, "step": 608}
{"train_info/time_between_train_steps": 0.006539821624755859, "step": 608}
{"info/global_step": 609, "train_info/time_within_train_step": 24.836398601531982, "step": 609}
{"train_info/time_between_train_steps": 0.0050182342529296875, "step": 609}
{"info/global_step": 610, "train_info/time_within_train_step": 24.747387647628784, "step": 610}
{"train_info/time_between_train_steps": 0.005198240280151367, "step": 610}
{"info/global_step": 611, "train_info/time_within_train_step": 24.754991054534912, "step": 611}
{"train_info/time_between_train_steps": 0.005590915679931641, "step": 611}
{"info/global_step": 612, "train_info/time_within_train_step": 24.764228582382202, "step": 612}
{"train_info/time_between_train_steps": 0.005788326263427734, "step": 612}
{"train_info/time_between_train_steps": 5.048306465148926, "step": 612}
{"info/global_step": 613, "train_info/time_within_train_step": 24.727211236953735, "step": 613}
{"train_info/time_between_train_steps": 0.004836082458496094, "step": 613}
{"info/global_step": 614, "train_info/time_within_train_step": 24.87230086326599, "step": 614}
{"train_info/time_between_train_steps": 0.005124092102050781, "step": 614}
{"info/global_step": 615, "train_info/time_within_train_step": 24.73614263534546, "step": 615}
{"train_info/time_between_train_steps": 0.005196809768676758, "step": 615}
{"info/global_step": 616, "train_info/time_within_train_step": 24.84704828262329, "step": 616}
{"train_info/time_between_train_steps": 0.0052967071533203125, "step": 616}
{"info/global_step": 617, "train_info/time_within_train_step": 24.74289083480835, "step": 617}
{"train_info/time_between_train_steps": 0.0053272247314453125, "step": 617}
{"info/global_step": 618, "train_info/time_within_train_step": 24.88630437850952, "step": 618}
{"train_info/time_between_train_steps": 0.0052242279052734375, "step": 618}
{"info/global_step": 619, "train_info/time_within_train_step": 24.74566102027893, "step": 619}
{"train_info/time_between_train_steps": 0.0050542354583740234, "step": 619}
{"info/global_step": 620, "train_info/time_within_train_step": 24.88273787498474, "step": 620}
{"train_info/time_between_train_steps": 0.005126476287841797, "step": 620}
{"info/global_step": 621, "train_info/time_within_train_step": 24.739728450775146, "step": 621}
{"train_info/time_between_train_steps": 0.005227804183959961, "step": 621}
{"info/global_step": 622, "train_info/time_within_train_step": 24.845060348510742, "step": 622}
{"train_info/time_between_train_steps": 0.0050814151763916016, "step": 622}
{"info/global_step": 623, "train_info/time_within_train_step": 24.735315561294556, "step": 623}
{"train_info/time_between_train_steps": 0.0053958892822265625, "step": 623}
{"info/global_step": 624, "train_info/time_within_train_step": 25.127198934555054, "step": 624}
{"train_info/time_between_train_steps": 0.0051572322845458984, "step": 624}
{"info/global_step": 625, "train_info/time_within_train_step": 24.729559898376465, "step": 625}
{"train_info/time_between_train_steps": 0.0051152706146240234, "step": 625}
{"info/global_step": 626, "train_info/time_within_train_step": 24.800490617752075, "step": 626}
{"train_info/time_between_train_steps": 0.0051496028900146484, "step": 626}
{"info/global_step": 627, "train_info/time_within_train_step": 24.75983476638794, "step": 627}
{"train_info/time_between_train_steps": 0.005038738250732422, "step": 627}
{"info/global_step": 628, "train_info/time_within_train_step": 24.728253602981567, "step": 628}
{"train_info/time_between_train_steps": 0.005323648452758789, "step": 628}
{"info/global_step": 629, "train_info/time_within_train_step": 24.723386764526367, "step": 629}
{"train_info/time_between_train_steps": 0.0053806304931640625, "step": 629}
{"info/global_step": 630, "train_info/time_within_train_step": 24.725805521011353, "step": 630}
{"train_info/time_between_train_steps": 0.005182981491088867, "step": 630}
{"info/global_step": 631, "train_info/time_within_train_step": 24.72704005241394, "step": 631}
{"train_info/time_between_train_steps": 0.0052869319915771484, "step": 631}
{"info/global_step": 632, "train_info/time_within_train_step": 24.723095417022705, "step": 632}
{"train_info/time_between_train_steps": 0.004937887191772461, "step": 632}
{"info/global_step": 633, "train_info/time_within_train_step": 24.734808444976807, "step": 633}
{"train_info/time_between_train_steps": 0.0051233768463134766, "step": 633}
{"info/global_step": 634, "train_info/time_within_train_step": 24.73098397254944, "step": 634}
{"train_info/time_between_train_steps": 0.004950523376464844, "step": 634}
{"info/global_step": 635, "train_info/time_within_train_step": 24.72571563720703, "step": 635}
{"train_info/time_between_train_steps": 0.00503087043762207, "step": 635}
{"info/global_step": 636, "train_info/time_within_train_step": 24.73618483543396, "step": 636}
{"train_info/time_between_train_steps": 0.005286216735839844, "step": 636}
{"info/global_step": 637, "train_info/time_within_train_step": 24.72663140296936, "step": 637}
{"train_info/time_between_train_steps": 0.004950523376464844, "step": 637}
{"info/global_step": 638, "train_info/time_within_train_step": 24.726420164108276, "step": 638}
{"train_info/time_between_train_steps": 0.005018472671508789, "step": 638}
{"info/global_step": 639, "train_info/time_within_train_step": 24.731470823287964, "step": 639}
{"train_info/time_between_train_steps": 0.005130767822265625, "step": 639}
{"info/global_step": 640, "train_info/time_within_train_step": 24.813066005706787, "step": 640}
{"train_info/time_between_train_steps": 0.004995584487915039, "step": 640}
{"info/global_step": 641, "train_info/time_within_train_step": 24.732569932937622, "step": 641}
{"train_info/time_between_train_steps": 0.005119800567626953, "step": 641}
{"info/global_step": 642, "train_info/time_within_train_step": 24.727071285247803, "step": 642}
{"train_info/time_between_train_steps": 0.0050508975982666016, "step": 642}
{"info/global_step": 643, "train_info/time_within_train_step": 24.97421908378601, "step": 643}
{"train_info/time_between_train_steps": 0.005093812942504883, "step": 643}
{"info/global_step": 644, "train_info/time_within_train_step": 24.74173092842102, "step": 644}
{"train_info/time_between_train_steps": 0.005177736282348633, "step": 644}
{"info/global_step": 645, "train_info/time_within_train_step": 24.747119903564453, "step": 645}
{"train_info/time_between_train_steps": 0.005548715591430664, "step": 645}
{"info/global_step": 646, "train_info/time_within_train_step": 24.77852964401245, "step": 646}
{"train_info/time_between_train_steps": 0.0066950321197509766, "step": 646}
{"train_info/time_between_train_steps": 5.197583436965942, "step": 646}
{"info/global_step": 647, "train_info/time_within_train_step": 24.73292875289917, "step": 647}
{"train_info/time_between_train_steps": 0.004796504974365234, "step": 647}
{"info/global_step": 648, "train_info/time_within_train_step": 24.890491724014282, "step": 648}
{"train_info/time_between_train_steps": 0.0051920413970947266, "step": 648}
{"info/global_step": 649, "train_info/time_within_train_step": 24.73512315750122, "step": 649}
{"train_info/time_between_train_steps": 0.00524592399597168, "step": 649}
{"info/global_step": 650, "train_info/time_within_train_step": 24.846534967422485, "step": 650}
{"train_info": {"train_info/memory_allocated": 1581.5546875, "train_info/memory_max_allocated": 18057.0224609375, "train_info/memory_reserved": 19104.0, "train_info/memory_max_reserved": 19104.0, "_timestamp": 1740936400, "_runtime": 16311}, "step": 650}
{"logs": {"train/loss": 3.1697, "train/learning_rate": 0.00030555555555555555, "train/epoch": 19.0, "_timestamp": 1740936400, "_runtime": 16311}, "step": 650}
{"train_info/time_between_train_steps": 0.008714914321899414, "step": 650}
{"info/global_step": 651, "train_info/time_within_train_step": 24.7390296459198, "step": 651}
{"train_info/time_between_train_steps": 0.005209684371948242, "step": 651}
{"info/global_step": 652, "train_info/time_within_train_step": 24.881788969039917, "step": 652}
{"train_info/time_between_train_steps": 0.007405281066894531, "step": 652}
{"info/global_step": 653, "train_info/time_within_train_step": 24.740134716033936, "step": 653}
{"train_info/time_between_train_steps": 0.0050296783447265625, "step": 653}
{"info/global_step": 654, "train_info/time_within_train_step": 24.85319995880127, "step": 654}
{"train_info/time_between_train_steps": 0.0051059722900390625, "step": 654}
{"info/global_step": 655, "train_info/time_within_train_step": 24.83401870727539, "step": 655}
{"train_info/time_between_train_steps": 0.005487918853759766, "step": 655}
{"info/global_step": 656, "train_info/time_within_train_step": 24.86409282684326, "step": 656}
{"train_info/time_between_train_steps": 0.007323026657104492, "step": 656}
{"info/global_step": 657, "train_info/time_within_train_step": 24.7379252910614, "step": 657}
{"train_info/time_between_train_steps": 0.008162736892700195, "step": 657}
{"info/global_step": 658, "train_info/time_within_train_step": 24.883450269699097, "step": 658}
{"train_info/time_between_train_steps": 0.00525212287902832, "step": 658}
{"info/global_step": 659, "train_info/time_within_train_step": 24.751392602920532, "step": 659}
{"train_info/time_between_train_steps": 0.0052700042724609375, "step": 659}
{"info/global_step": 660, "train_info/time_within_train_step": 24.79580330848694, "step": 660}
{"train_info/time_between_train_steps": 0.0050580501556396484, "step": 660}
{"info/global_step": 661, "train_info/time_within_train_step": 24.74029803276062, "step": 661}
{"train_info/time_between_train_steps": 0.00479435920715332, "step": 661}
{"info/global_step": 662, "train_info/time_within_train_step": 24.723132133483887, "step": 662}
{"train_info/time_between_train_steps": 0.0052280426025390625, "step": 662}
{"info/global_step": 663, "train_info/time_within_train_step": 24.722511291503906, "step": 663}
{"train_info/time_between_train_steps": 0.005105018615722656, "step": 663}
{"info/global_step": 664, "train_info/time_within_train_step": 24.73542308807373, "step": 664}
{"train_info/time_between_train_steps": 0.00502324104309082, "step": 664}
{"info/global_step": 665, "train_info/time_within_train_step": 24.726361751556396, "step": 665}
{"train_info/time_between_train_steps": 0.005097866058349609, "step": 665}
{"info/global_step": 666, "train_info/time_within_train_step": 24.726837158203125, "step": 666}
{"train_info/time_between_train_steps": 0.004942417144775391, "step": 666}
{"info/global_step": 667, "train_info/time_within_train_step": 24.728418588638306, "step": 667}
{"train_info/time_between_train_steps": 0.0049533843994140625, "step": 667}
{"info/global_step": 668, "train_info/time_within_train_step": 24.748389720916748, "step": 668}
{"train_info/time_between_train_steps": 0.0050640106201171875, "step": 668}
{"info/global_step": 669, "train_info/time_within_train_step": 24.725419998168945, "step": 669}
{"train_info/time_between_train_steps": 0.006926536560058594, "step": 669}
{"info/global_step": 670, "train_info/time_within_train_step": 24.73281693458557, "step": 670}
{"train_info/time_between_train_steps": 0.005042552947998047, "step": 670}
{"info/global_step": 671, "train_info/time_within_train_step": 24.823866367340088, "step": 671}
{"train_info/time_between_train_steps": 0.005037069320678711, "step": 671}
{"info/global_step": 672, "train_info/time_within_train_step": 24.74393916130066, "step": 672}
{"train_info/time_between_train_steps": 0.00486445426940918, "step": 672}
{"info/global_step": 673, "train_info/time_within_train_step": 24.73993706703186, "step": 673}
{"train_info/time_between_train_steps": 0.005001544952392578, "step": 673}
{"info/global_step": 674, "train_info/time_within_train_step": 24.735979795455933, "step": 674}
{"train_info/time_between_train_steps": 0.005127429962158203, "step": 674}
{"info/global_step": 675, "train_info/time_within_train_step": 24.727715492248535, "step": 675}
{"train_info/time_between_train_steps": 0.0050771236419677734, "step": 675}
{"info/global_step": 676, "train_info/time_within_train_step": 24.728034019470215, "step": 676}
{"train_info/time_between_train_steps": 0.0050923824310302734, "step": 676}
{"info/global_step": 677, "train_info/time_within_train_step": 24.735392570495605, "step": 677}
{"train_info/time_between_train_steps": 0.00525212287902832, "step": 677}
{"info/global_step": 678, "train_info/time_within_train_step": 24.81847643852234, "step": 678}
{"train_info/time_between_train_steps": 0.006196260452270508, "step": 678}
{"info/global_step": 679, "train_info/time_within_train_step": 24.768595218658447, "step": 679}
{"train_info/time_between_train_steps": 0.00540471076965332, "step": 679}
{"info/global_step": 680, "train_info/time_within_train_step": 24.769683361053467, "step": 680}
{"train_info/time_between_train_steps": 0.0057871341705322266, "step": 680}
{"train_info/time_between_train_steps": 4.9380857944488525, "step": 680}
{"info/global_step": 681, "train_info/time_within_train_step": 24.95992684364319, "step": 681}
{"train_info/time_between_train_steps": 0.004792928695678711, "step": 681}
{"info/global_step": 682, "train_info/time_within_train_step": 24.83500075340271, "step": 682}
{"train_info/time_between_train_steps": 0.004853487014770508, "step": 682}
{"info/global_step": 683, "train_info/time_within_train_step": 24.74006414413452, "step": 683}
{"train_info/time_between_train_steps": 0.0049440860748291016, "step": 683}
{"info/global_step": 684, "train_info/time_within_train_step": 24.875264406204224, "step": 684}
{"train_info/time_between_train_steps": 0.0052258968353271484, "step": 684}
{"info/global_step": 685, "train_info/time_within_train_step": 24.73749542236328, "step": 685}
{"train_info/time_between_train_steps": 0.005120754241943359, "step": 685}
{"info/global_step": 686, "train_info/time_within_train_step": 24.980714082717896, "step": 686}
{"train_info/time_between_train_steps": 0.005347013473510742, "step": 686}
{"info/global_step": 687, "train_info/time_within_train_step": 24.743270874023438, "step": 687}
{"train_info/time_between_train_steps": 0.005151033401489258, "step": 687}
{"info/global_step": 688, "train_info/time_within_train_step": 24.864202976226807, "step": 688}
{"train_info/time_between_train_steps": 0.005190134048461914, "step": 688}
{"info/global_step": 689, "train_info/time_within_train_step": 24.834689378738403, "step": 689}
{"train_info/time_between_train_steps": 0.005424022674560547, "step": 689}
{"info/global_step": 690, "train_info/time_within_train_step": 24.944427251815796, "step": 690}
{"train_info/time_between_train_steps": 0.01311182975769043, "step": 690}
{"info/global_step": 691, "train_info/time_within_train_step": 24.80128240585327, "step": 691}
{"train_info/time_between_train_steps": 0.005400180816650391, "step": 691}
{"info/global_step": 692, "train_info/time_within_train_step": 24.887605667114258, "step": 692}
{"train_info/time_between_train_steps": 0.005341053009033203, "step": 692}
{"info/global_step": 693, "train_info/time_within_train_step": 24.874348640441895, "step": 693}
{"train_info/time_between_train_steps": 0.005349636077880859, "step": 693}
{"info/global_step": 694, "train_info/time_within_train_step": 24.812662363052368, "step": 694}
{"train_info/time_between_train_steps": 0.005167484283447266, "step": 694}
{"info/global_step": 695, "train_info/time_within_train_step": 24.75482487678528, "step": 695}
{"train_info/time_between_train_steps": 0.004935264587402344, "step": 695}
{"info/global_step": 696, "train_info/time_within_train_step": 24.899678230285645, "step": 696}
{"train_info/time_between_train_steps": 0.005248308181762695, "step": 696}
{"info/global_step": 697, "train_info/time_within_train_step": 24.770766019821167, "step": 697}
{"train_info/time_between_train_steps": 0.005003452301025391, "step": 697}
{"info/global_step": 698, "train_info/time_within_train_step": 24.75543999671936, "step": 698}
{"train_info/time_between_train_steps": 0.005144834518432617, "step": 698}
{"info/global_step": 699, "train_info/time_within_train_step": 24.754274129867554, "step": 699}
{"train_info/time_between_train_steps": 0.005117893218994141, "step": 699}
{"info/global_step": 700, "train_info/time_within_train_step": 24.751561880111694, "step": 700}
{"train_info": {"train_info/memory_allocated": 1581.5546875, "train_info/memory_max_allocated": 18057.0224609375, "train_info/memory_reserved": 19104.0, "train_info/memory_max_reserved": 19104.0, "_timestamp": 1740937645, "_runtime": 17556}, "step": 700}
{"logs": {"train/loss": 3.1058, "train/learning_rate": 0.0002777777777777778, "train/epoch": 20.02, "_timestamp": 1740937645, "_runtime": 17556}, "step": 700}
{"train_info/time_between_train_steps": 11.20994520187378, "step": 700}
{"info/global_step": 701, "train_info/time_within_train_step": 24.749574184417725, "step": 701}
{"train_info/time_between_train_steps": 0.00485682487487793, "step": 701}
{"info/global_step": 702, "train_info/time_within_train_step": 24.82718539237976, "step": 702}
{"train_info/time_between_train_steps": 0.00525212287902832, "step": 702}
{"info/global_step": 703, "train_info/time_within_train_step": 24.737187147140503, "step": 703}
{"train_info/time_between_train_steps": 0.005021572113037109, "step": 703}
{"info/global_step": 704, "train_info/time_within_train_step": 24.73868227005005, "step": 704}
{"train_info/time_between_train_steps": 0.010044574737548828, "step": 704}
{"info/global_step": 705, "train_info/time_within_train_step": 24.739320039749146, "step": 705}
{"train_info/time_between_train_steps": 0.010071039199829102, "step": 705}
{"info/global_step": 706, "train_info/time_within_train_step": 24.740936040878296, "step": 706}
{"train_info/time_between_train_steps": 0.004952192306518555, "step": 706}
{"info/global_step": 707, "train_info/time_within_train_step": 24.74279522895813, "step": 707}
{"train_info/time_between_train_steps": 0.004996538162231445, "step": 707}
{"info/global_step": 708, "train_info/time_within_train_step": 24.73941135406494, "step": 708}
{"train_info/time_between_train_steps": 0.005243062973022461, "step": 708}
{"info/global_step": 709, "train_info/time_within_train_step": 24.74150061607361, "step": 709}
{"train_info/time_between_train_steps": 0.005129098892211914, "step": 709}
{"info/global_step": 710, "train_info/time_within_train_step": 24.745847463607788, "step": 710}
{"train_info/time_between_train_steps": 0.005075931549072266, "step": 710}
{"info/global_step": 711, "train_info/time_within_train_step": 24.751298189163208, "step": 711}
{"train_info/time_between_train_steps": 0.005132913589477539, "step": 711}
{"info/global_step": 712, "train_info/time_within_train_step": 24.755124807357788, "step": 712}
{"train_info/time_between_train_steps": 0.0052394866943359375, "step": 712}
{"info/global_step": 713, "train_info/time_within_train_step": 24.75218629837036, "step": 713}
{"train_info/time_between_train_steps": 0.0054547786712646484, "step": 713}
{"info/global_step": 714, "train_info/time_within_train_step": 24.7899067401886, "step": 714}
{"train_info/time_between_train_steps": 0.005962371826171875, "step": 714}
{"train_info/time_between_train_steps": 4.98201584815979, "step": 714}
{"info/global_step": 715, "train_info/time_within_train_step": 24.80935049057007, "step": 715}
{"train_info/time_between_train_steps": 0.009064674377441406, "step": 715}
{"info/global_step": 716, "train_info/time_within_train_step": 25.15603280067444, "step": 716}
{"train_info/time_between_train_steps": 0.004938602447509766, "step": 716}
{"info/global_step": 717, "train_info/time_within_train_step": 24.742401361465454, "step": 717}
{"train_info/time_between_train_steps": 0.005400657653808594, "step": 717}
{"info/global_step": 718, "train_info/time_within_train_step": 24.979378938674927, "step": 718}
{"train_info/time_between_train_steps": 0.005305051803588867, "step": 718}
{"info/global_step": 719, "train_info/time_within_train_step": 24.752899646759033, "step": 719}
{"train_info/time_between_train_steps": 0.0060291290283203125, "step": 719}
{"info/global_step": 720, "train_info/time_within_train_step": 24.8845112323761, "step": 720}
{"train_info/time_between_train_steps": 0.005286455154418945, "step": 720}
{"info/global_step": 721, "train_info/time_within_train_step": 24.760260343551636, "step": 721}
{"train_info/time_between_train_steps": 0.005463600158691406, "step": 721}
{"info/global_step": 722, "train_info/time_within_train_step": 24.865023374557495, "step": 722}
{"train_info/time_between_train_steps": 0.005161762237548828, "step": 722}
{"info/global_step": 723, "train_info/time_within_train_step": 24.74947190284729, "step": 723}
{"train_info/time_between_train_steps": 0.005259275436401367, "step": 723}
{"info/global_step": 724, "train_info/time_within_train_step": 24.9113712310791, "step": 724}
{"train_info/time_between_train_steps": 0.0052030086517333984, "step": 724}
{"info/global_step": 725, "train_info/time_within_train_step": 24.74404740333557, "step": 725}
{"train_info/time_between_train_steps": 0.005252361297607422, "step": 725}
{"info/global_step": 726, "train_info/time_within_train_step": 24.874088287353516, "step": 726}
{"train_info/time_between_train_steps": 0.005372047424316406, "step": 726}
{"info/global_step": 727, "train_info/time_within_train_step": 24.75866985321045, "step": 727}
{"train_info/time_between_train_steps": 0.005509853363037109, "step": 727}
{"info/global_step": 728, "train_info/time_within_train_step": 24.813669204711914, "step": 728}
{"train_info/time_between_train_steps": 0.005172014236450195, "step": 728}
{"info/global_step": 729, "train_info/time_within_train_step": 24.752926111221313, "step": 729}
{"train_info/time_between_train_steps": 0.004983425140380859, "step": 729}
{"info/global_step": 730, "train_info/time_within_train_step": 24.733726501464844, "step": 730}
{"train_info/time_between_train_steps": 0.0051271915435791016, "step": 730}
{"info/global_step": 731, "train_info/time_within_train_step": 24.73005986213684, "step": 731}
{"train_info/time_between_train_steps": 0.004929542541503906, "step": 731}
{"info/global_step": 732, "train_info/time_within_train_step": 24.733740091323853, "step": 732}
{"train_info/time_between_train_steps": 0.0050771236419677734, "step": 732}
{"info/global_step": 733, "train_info/time_within_train_step": 24.826823949813843, "step": 733}
{"train_info/time_between_train_steps": 0.005082368850708008, "step": 733}
{"info/global_step": 734, "train_info/time_within_train_step": 24.73387885093689, "step": 734}
{"train_info/time_between_train_steps": 0.004941701889038086, "step": 734}
{"info/global_step": 735, "train_info/time_within_train_step": 24.744832754135132, "step": 735}
{"train_info/time_between_train_steps": 0.0049932003021240234, "step": 735}
{"info/global_step": 736, "train_info/time_within_train_step": 24.879199981689453, "step": 736}
{"train_info/time_between_train_steps": 0.012064218521118164, "step": 736}
{"info/global_step": 737, "train_info/time_within_train_step": 24.76779556274414, "step": 737}
{"train_info/time_between_train_steps": 0.005033016204833984, "step": 737}
{"info/global_step": 738, "train_info/time_within_train_step": 24.737034559249878, "step": 738}
{"train_info/time_between_train_steps": 0.005115985870361328, "step": 738}
{"info/global_step": 739, "train_info/time_within_train_step": 24.7369704246521, "step": 739}
{"train_info/time_between_train_steps": 0.005086660385131836, "step": 739}
{"info/global_step": 740, "train_info/time_within_train_step": 24.732747554779053, "step": 740}
{"train_info/time_between_train_steps": 0.010358333587646484, "step": 740}
{"info/global_step": 741, "train_info/time_within_train_step": 24.737417459487915, "step": 741}
{"train_info/time_between_train_steps": 0.009983301162719727, "step": 741}
{"info/global_step": 742, "train_info/time_within_train_step": 24.741610527038574, "step": 742}
{"train_info/time_between_train_steps": 0.005204439163208008, "step": 742}
{"info/global_step": 743, "train_info/time_within_train_step": 24.734590530395508, "step": 743}
{"train_info/time_between_train_steps": 0.010019063949584961, "step": 743}
{"info/global_step": 744, "train_info/time_within_train_step": 24.752122402191162, "step": 744}
{"train_info/time_between_train_steps": 0.006413698196411133, "step": 744}
{"info/global_step": 745, "train_info/time_within_train_step": 24.905717372894287, "step": 745}
{"train_info/time_between_train_steps": 0.01024007797241211, "step": 745}
{"info/global_step": 746, "train_info/time_within_train_step": 24.745100498199463, "step": 746}
{"train_info/time_between_train_steps": 0.005181312561035156, "step": 746}
{"info/global_step": 747, "train_info/time_within_train_step": 24.751347541809082, "step": 747}
{"train_info/time_between_train_steps": 0.005353212356567383, "step": 747}
{"info/global_step": 748, "train_info/time_within_train_step": 24.77718758583069, "step": 748}
{"train_info/time_between_train_steps": 0.011250495910644531, "step": 748}
{"train_info/time_between_train_steps": 5.472787618637085, "step": 748}
{"info/global_step": 749, "train_info/time_within_train_step": 24.82198166847229, "step": 749}
{"train_info/time_between_train_steps": 0.004773139953613281, "step": 749}
{"info/global_step": 750, "train_info/time_within_train_step": 24.8321692943573, "step": 750}
{"train_info": {"train_info/memory_allocated": 1581.5546875, "train_info/memory_max_allocated": 18057.0224609375, "train_info/memory_reserved": 19104.0, "train_info/memory_max_reserved": 19104.0, "_timestamp": 1740938907, "_runtime": 18818}, "step": 750}
{"logs": {"train/loss": 3.0578, "train/learning_rate": 0.00025, "train/epoch": 22.0, "_timestamp": 1740938907, "_runtime": 18818}, "step": 750}
{"train_info/time_between_train_steps": 0.008776187896728516, "step": 750}
{"info/global_step": 751, "train_info/time_within_train_step": 24.755528450012207, "step": 751}
{"train_info/time_between_train_steps": 0.005280971527099609, "step": 751}
{"info/global_step": 752, "train_info/time_within_train_step": 24.867413997650146, "step": 752}
{"train_info/time_between_train_steps": 0.005277156829833984, "step": 752}
{"info/global_step": 753, "train_info/time_within_train_step": 24.737590312957764, "step": 753}
{"train_info/time_between_train_steps": 0.005195140838623047, "step": 753}
{"info/global_step": 754, "train_info/time_within_train_step": 24.89277744293213, "step": 754}
{"train_info/time_between_train_steps": 0.005280494689941406, "step": 754}
{"info/global_step": 755, "train_info/time_within_train_step": 24.95790719985962, "step": 755}
{"train_info/time_between_train_steps": 0.005296230316162109, "step": 755}
{"info/global_step": 756, "train_info/time_within_train_step": 24.85051417350769, "step": 756}
{"train_info/time_between_train_steps": 0.005139827728271484, "step": 756}
{"info/global_step": 757, "train_info/time_within_train_step": 24.742788314819336, "step": 757}
{"train_info/time_between_train_steps": 0.005423069000244141, "step": 757}
{"info/global_step": 758, "train_info/time_within_train_step": 24.898043394088745, "step": 758}
{"train_info/time_between_train_steps": 0.005173683166503906, "step": 758}
{"info/global_step": 759, "train_info/time_within_train_step": 24.74614143371582, "step": 759}
{"train_info/time_between_train_steps": 0.005247592926025391, "step": 759}
{"info/global_step": 760, "train_info/time_within_train_step": 24.92180371284485, "step": 760}
{"train_info/time_between_train_steps": 0.005242347717285156, "step": 760}
{"info/global_step": 761, "train_info/time_within_train_step": 24.763720273971558, "step": 761}
{"train_info/time_between_train_steps": 0.005437612533569336, "step": 761}
{"info/global_step": 762, "train_info/time_within_train_step": 25.008288383483887, "step": 762}
{"train_info/time_between_train_steps": 0.005025625228881836, "step": 762}
{"info/global_step": 763, "train_info/time_within_train_step": 24.74237322807312, "step": 763}
{"train_info/time_between_train_steps": 0.0047454833984375, "step": 763}
{"info/global_step": 764, "train_info/time_within_train_step": 24.820007801055908, "step": 764}
{"train_info/time_between_train_steps": 0.005259275436401367, "step": 764}
{"info/global_step": 765, "train_info/time_within_train_step": 24.738297939300537, "step": 765}
{"train_info/time_between_train_steps": 0.004977703094482422, "step": 765}
{"info/global_step": 766, "train_info/time_within_train_step": 24.793734550476074, "step": 766}
{"train_info/time_between_train_steps": 0.005055665969848633, "step": 766}
{"info/global_step": 767, "train_info/time_within_train_step": 24.752402782440186, "step": 767}
{"train_info/time_between_train_steps": 0.005106210708618164, "step": 767}
{"info/global_step": 768, "train_info/time_within_train_step": 24.858275413513184, "step": 768}
{"train_info/time_between_train_steps": 0.005039691925048828, "step": 768}
{"info/global_step": 769, "train_info/time_within_train_step": 24.753454446792603, "step": 769}
{"train_info/time_between_train_steps": 0.0049173831939697266, "step": 769}
{"info/global_step": 770, "train_info/time_within_train_step": 24.74566912651062, "step": 770}
{"train_info/time_between_train_steps": 0.005206584930419922, "step": 770}
{"info/global_step": 771, "train_info/time_within_train_step": 24.74493408203125, "step": 771}
{"train_info/time_between_train_steps": 0.004995107650756836, "step": 771}
{"info/global_step": 772, "train_info/time_within_train_step": 24.738011360168457, "step": 772}
{"train_info/time_between_train_steps": 0.0050313472747802734, "step": 772}
{"info/global_step": 773, "train_info/time_within_train_step": 24.751749992370605, "step": 773}
{"train_info/time_between_train_steps": 0.0051462650299072266, "step": 773}
{"info/global_step": 774, "train_info/time_within_train_step": 24.742607831954956, "step": 774}
{"train_info/time_between_train_steps": 0.004952430725097656, "step": 774}
{"info/global_step": 775, "train_info/time_within_train_step": 24.741764783859253, "step": 775}
{"train_info/time_between_train_steps": 0.004922389984130859, "step": 775}
{"info/global_step": 776, "train_info/time_within_train_step": 24.7490496635437, "step": 776}
{"train_info/time_between_train_steps": 0.005152702331542969, "step": 776}
{"info/global_step": 777, "train_info/time_within_train_step": 24.747233152389526, "step": 777}
{"train_info/time_between_train_steps": 0.006063222885131836, "step": 777}
{"info/global_step": 778, "train_info/time_within_train_step": 24.747913122177124, "step": 778}
{"train_info/time_between_train_steps": 0.005078554153442383, "step": 778}
{"info/global_step": 779, "train_info/time_within_train_step": 24.75284194946289, "step": 779}
{"train_info/time_between_train_steps": 0.0058515071868896484, "step": 779}
{"info/global_step": 780, "train_info/time_within_train_step": 24.85191512107849, "step": 780}
{"train_info/time_between_train_steps": 0.005152702331542969, "step": 780}
{"info/global_step": 781, "train_info/time_within_train_step": 24.768505096435547, "step": 781}
{"train_info/time_between_train_steps": 0.005488395690917969, "step": 781}
{"info/global_step": 782, "train_info/time_within_train_step": 24.82995367050171, "step": 782}
{"train_info/time_between_train_steps": 0.0057256221771240234, "step": 782}
{"train_info/time_between_train_steps": 5.257819414138794, "step": 782}
{"info/global_step": 783, "train_info/time_within_train_step": 24.723772287368774, "step": 783}
{"train_info/time_between_train_steps": 0.004758596420288086, "step": 783}
{"info/global_step": 784, "train_info/time_within_train_step": 24.848224878311157, "step": 784}
{"train_info/time_between_train_steps": 0.004960536956787109, "step": 784}
{"info/global_step": 785, "train_info/time_within_train_step": 24.759700298309326, "step": 785}
{"train_info/time_between_train_steps": 0.005326032638549805, "step": 785}
{"info/global_step": 786, "train_info/time_within_train_step": 24.856507301330566, "step": 786}
{"train_info/time_between_train_steps": 0.005248308181762695, "step": 786}
{"info/global_step": 787, "train_info/time_within_train_step": 24.737996578216553, "step": 787}
{"train_info/time_between_train_steps": 0.005274295806884766, "step": 787}
{"info/global_step": 788, "train_info/time_within_train_step": 24.893155097961426, "step": 788}
{"train_info/time_between_train_steps": 0.005234479904174805, "step": 788}
{"info/global_step": 789, "train_info/time_within_train_step": 24.761844635009766, "step": 789}
{"train_info/time_between_train_steps": 0.005157947540283203, "step": 789}
{"info/global_step": 790, "train_info/time_within_train_step": 24.8480167388916, "step": 790}
{"train_info/time_between_train_steps": 0.00511932373046875, "step": 790}
{"info/global_step": 791, "train_info/time_within_train_step": 24.75035834312439, "step": 791}
{"train_info/time_between_train_steps": 0.005151271820068359, "step": 791}
{"info/global_step": 792, "train_info/time_within_train_step": 24.90314292907715, "step": 792}
{"train_info/time_between_train_steps": 0.005326986312866211, "step": 792}
{"info/global_step": 793, "train_info/time_within_train_step": 24.74224853515625, "step": 793}
{"train_info/time_between_train_steps": 0.0051937103271484375, "step": 793}
{"info/global_step": 794, "train_info/time_within_train_step": 24.874485731124878, "step": 794}
{"train_info/time_between_train_steps": 0.005301475524902344, "step": 794}
{"info/global_step": 795, "train_info/time_within_train_step": 24.753337860107422, "step": 795}
{"train_info/time_between_train_steps": 0.005477190017700195, "step": 795}
{"info/global_step": 796, "train_info/time_within_train_step": 24.898807048797607, "step": 796}
{"train_info/time_between_train_steps": 0.007394552230834961, "step": 796}
{"info/global_step": 797, "train_info/time_within_train_step": 24.751851320266724, "step": 797}
{"train_info/time_between_train_steps": 0.004951953887939453, "step": 797}
{"info/global_step": 798, "train_info/time_within_train_step": 24.756577491760254, "step": 798}
{"train_info/time_between_train_steps": 0.00529932975769043, "step": 798}
{"info/global_step": 799, "train_info/time_within_train_step": 24.739588499069214, "step": 799}
{"train_info/time_between_train_steps": 0.0049877166748046875, "step": 799}
{"info/global_step": 800, "train_info/time_within_train_step": 24.735326766967773, "step": 800}
{"train_info": {"train_info/memory_allocated": 1581.5546875, "train_info/memory_max_allocated": 18057.0224609375, "train_info/memory_reserved": 19104.0, "train_info/memory_max_reserved": 19104.0, "_timestamp": 1740940152, "_runtime": 20063}, "step": 800}
{"logs": {"train/loss": 3.0036, "train/learning_rate": 0.00022222222222222218, "train/epoch": 23.02, "_timestamp": 1740940152, "_runtime": 20063}, "step": 800}
{"train_info/time_between_train_steps": 34.4662926197052, "step": 800}
{"info/global_step": 801, "train_info/time_within_train_step": 24.732064247131348, "step": 801}
{"train_info/time_between_train_steps": 0.004930973052978516, "step": 801}
{"info/global_step": 802, "train_info/time_within_train_step": 24.72780466079712, "step": 802}
{"train_info/time_between_train_steps": 0.008847236633300781, "step": 802}
{"info/global_step": 803, "train_info/time_within_train_step": 24.749732971191406, "step": 803}
{"train_info/time_between_train_steps": 0.004995107650756836, "step": 803}
{"info/global_step": 804, "train_info/time_within_train_step": 24.743443965911865, "step": 804}
{"train_info/time_between_train_steps": 0.0052220821380615234, "step": 804}
{"info/global_step": 805, "train_info/time_within_train_step": 24.740224599838257, "step": 805}
{"train_info/time_between_train_steps": 0.005149126052856445, "step": 805}
{"info/global_step": 806, "train_info/time_within_train_step": 24.739359378814697, "step": 806}
{"train_info/time_between_train_steps": 0.0050394535064697266, "step": 806}
{"info/global_step": 807, "train_info/time_within_train_step": 24.72994327545166, "step": 807}
{"train_info/time_between_train_steps": 0.010020256042480469, "step": 807}
{"info/global_step": 808, "train_info/time_within_train_step": 24.737224102020264, "step": 808}
{"train_info/time_between_train_steps": 0.005071878433227539, "step": 808}
{"info/global_step": 809, "train_info/time_within_train_step": 24.74551224708557, "step": 809}
{"train_info/time_between_train_steps": 0.004957437515258789, "step": 809}
{"info/global_step": 810, "train_info/time_within_train_step": 24.741072177886963, "step": 810}
{"train_info/time_between_train_steps": 0.005044460296630859, "step": 810}
{"info/global_step": 811, "train_info/time_within_train_step": 24.829742670059204, "step": 811}
{"train_info/time_between_train_steps": 0.005208253860473633, "step": 811}
{"info/global_step": 812, "train_info/time_within_train_step": 24.73840880393982, "step": 812}
{"train_info/time_between_train_steps": 0.005026578903198242, "step": 812}
{"info/global_step": 813, "train_info/time_within_train_step": 24.938704252243042, "step": 813}
{"train_info/time_between_train_steps": 0.005175352096557617, "step": 813}
{"info/global_step": 814, "train_info/time_within_train_step": 24.75017786026001, "step": 814}
{"train_info/time_between_train_steps": 0.005396604537963867, "step": 814}
{"info/global_step": 815, "train_info/time_within_train_step": 24.760598182678223, "step": 815}
{"train_info/time_between_train_steps": 0.005458354949951172, "step": 815}
{"info/global_step": 816, "train_info/time_within_train_step": 24.772044897079468, "step": 816}
{"train_info/time_between_train_steps": 0.005902528762817383, "step": 816}
{"train_info/time_between_train_steps": 4.9356536865234375, "step": 816}
{"info/global_step": 817, "train_info/time_within_train_step": 24.742335319519043, "step": 817}
{"train_info/time_between_train_steps": 0.004971027374267578, "step": 817}
{"info/global_step": 818, "train_info/time_within_train_step": 24.829982042312622, "step": 818}
{"train_info/time_between_train_steps": 0.004862308502197266, "step": 818}
{"info/global_step": 819, "train_info/time_within_train_step": 24.735510110855103, "step": 819}
{"train_info/time_between_train_steps": 0.004849910736083984, "step": 819}
{"info/global_step": 820, "train_info/time_within_train_step": 24.911346435546875, "step": 820}
{"train_info/time_between_train_steps": 0.0052106380462646484, "step": 820}
{"info/global_step": 821, "train_info/time_within_train_step": 24.74760127067566, "step": 821}
{"train_info/time_between_train_steps": 0.005301475524902344, "step": 821}
{"info/global_step": 822, "train_info/time_within_train_step": 24.86005449295044, "step": 822}
{"train_info/time_between_train_steps": 0.005182027816772461, "step": 822}
{"info/global_step": 823, "train_info/time_within_train_step": 24.744521856307983, "step": 823}
{"train_info/time_between_train_steps": 0.005341529846191406, "step": 823}
{"info/global_step": 824, "train_info/time_within_train_step": 24.902036905288696, "step": 824}
{"train_info/time_between_train_steps": 0.006738424301147461, "step": 824}
{"info/global_step": 825, "train_info/time_within_train_step": 24.75586175918579, "step": 825}
{"train_info/time_between_train_steps": 0.005066633224487305, "step": 825}
{"info/global_step": 826, "train_info/time_within_train_step": 24.860939502716064, "step": 826}
{"train_info/time_between_train_steps": 0.005079746246337891, "step": 826}
{"info/global_step": 827, "train_info/time_within_train_step": 24.861515998840332, "step": 827}
{"train_info/time_between_train_steps": 0.005597114562988281, "step": 827}
{"info/global_step": 828, "train_info/time_within_train_step": 24.883466958999634, "step": 828}
{"train_info/time_between_train_steps": 0.005150318145751953, "step": 828}
{"info/global_step": 829, "train_info/time_within_train_step": 24.8375027179718, "step": 829}
{"train_info/time_between_train_steps": 0.005352973937988281, "step": 829}
{"info/global_step": 830, "train_info/time_within_train_step": 24.84249234199524, "step": 830}
{"train_info/time_between_train_steps": 0.005217790603637695, "step": 830}
{"info/global_step": 831, "train_info/time_within_train_step": 24.758928298950195, "step": 831}
{"train_info/time_between_train_steps": 0.005034208297729492, "step": 831}
{"info/global_step": 832, "train_info/time_within_train_step": 24.83785104751587, "step": 832}
{"train_info/time_between_train_steps": 0.004988193511962891, "step": 832}
{"info/global_step": 833, "train_info/time_within_train_step": 24.753377437591553, "step": 833}
{"train_info/time_between_train_steps": 0.0049893856048583984, "step": 833}
{"info/global_step": 834, "train_info/time_within_train_step": 24.83100700378418, "step": 834}
{"train_info/time_between_train_steps": 0.005498647689819336, "step": 834}
{"info/global_step": 835, "train_info/time_within_train_step": 24.761279582977295, "step": 835}
{"train_info/time_between_train_steps": 0.005319356918334961, "step": 835}
{"info/global_step": 836, "train_info/time_within_train_step": 24.84245491027832, "step": 836}
{"train_info/time_between_train_steps": 0.005326509475708008, "step": 836}
{"info/global_step": 837, "train_info/time_within_train_step": 24.869540452957153, "step": 837}
{"train_info/time_between_train_steps": 0.0054705142974853516, "step": 837}
{"info/global_step": 838, "train_info/time_within_train_step": 24.78451371192932, "step": 838}
{"train_info/time_between_train_steps": 0.006028413772583008, "step": 838}
{"info/global_step": 839, "train_info/time_within_train_step": 24.904507637023926, "step": 839}
{"train_info/time_between_train_steps": 0.005055904388427734, "step": 839}
{"info/global_step": 840, "train_info/time_within_train_step": 24.818346738815308, "step": 840}
{"train_info/time_between_train_steps": 0.005303382873535156, "step": 840}
{"info/global_step": 841, "train_info/time_within_train_step": 24.775971174240112, "step": 841}
{"train_info/time_between_train_steps": 0.0052607059478759766, "step": 841}
{"info/global_step": 842, "train_info/time_within_train_step": 24.82200813293457, "step": 842}
{"train_info/time_between_train_steps": 0.005008697509765625, "step": 842}
{"info/global_step": 843, "train_info/time_within_train_step": 24.75094747543335, "step": 843}
{"train_info/time_between_train_steps": 0.010254144668579102, "step": 843}
{"info/global_step": 844, "train_info/time_within_train_step": 24.740201473236084, "step": 844}
{"train_info/time_between_train_steps": 0.010092735290527344, "step": 844}
{"info/global_step": 845, "train_info/time_within_train_step": 24.966997623443604, "step": 845}
{"train_info/time_between_train_steps": 0.014285564422607422, "step": 845}
{"info/global_step": 846, "train_info/time_within_train_step": 25.07261037826538, "step": 846}
{"train_info/time_between_train_steps": 0.012580394744873047, "step": 846}
{"info/global_step": 847, "train_info/time_within_train_step": 24.794183254241943, "step": 847}
{"train_info/time_between_train_steps": 0.010268449783325195, "step": 847}
{"info/global_step": 848, "train_info/time_within_train_step": 24.747262716293335, "step": 848}
{"train_info/time_between_train_steps": 0.005089759826660156, "step": 848}
{"info/global_step": 849, "train_info/time_within_train_step": 24.752334594726562, "step": 849}
{"train_info/time_between_train_steps": 0.006290912628173828, "step": 849}
{"info/global_step": 850, "train_info/time_within_train_step": 24.774523735046387, "step": 850}
{"train_info": {"train_info/memory_allocated": 1581.5546875, "train_info/memory_max_allocated": 18057.0224609375, "train_info/memory_reserved": 19104.0, "train_info/memory_max_reserved": 19104.0, "_timestamp": 1740941432, "_runtime": 21343}, "step": 850}
{"logs": {"train/loss": 2.961, "train/learning_rate": 0.00019444444444444443, "train/epoch": 24.03, "_timestamp": 1740941432, "_runtime": 21343}, "step": 850}
{"train_info/time_between_train_steps": 0.013668298721313477, "step": 850}
{"train_info/time_between_train_steps": 5.106842756271362, "step": 850}
{"info/global_step": 851, "train_info/time_within_train_step": 24.733670711517334, "step": 851}
{"train_info/time_between_train_steps": 0.005094051361083984, "step": 851}
{"info/global_step": 852, "train_info/time_within_train_step": 24.886136293411255, "step": 852}
{"train_info/time_between_train_steps": 0.0051538944244384766, "step": 852}
{"info/global_step": 853, "train_info/time_within_train_step": 24.744484424591064, "step": 853}
{"train_info/time_between_train_steps": 0.005243539810180664, "step": 853}
{"info/global_step": 854, "train_info/time_within_train_step": 24.85015082359314, "step": 854}
{"train_info/time_between_train_steps": 0.005160331726074219, "step": 854}
{"info/global_step": 855, "train_info/time_within_train_step": 24.740307569503784, "step": 855}
{"train_info/time_between_train_steps": 0.005196094512939453, "step": 855}
{"info/global_step": 856, "train_info/time_within_train_step": 24.904690504074097, "step": 856}
{"train_info/time_between_train_steps": 0.005273103713989258, "step": 856}
{"info/global_step": 857, "train_info/time_within_train_step": 24.743293523788452, "step": 857}
{"train_info/time_between_train_steps": 0.0052525997161865234, "step": 857}
{"info/global_step": 858, "train_info/time_within_train_step": 24.94609832763672, "step": 858}
{"train_info/time_between_train_steps": 0.005135297775268555, "step": 858}
{"info/global_step": 859, "train_info/time_within_train_step": 24.754475355148315, "step": 859}
{"train_info/time_between_train_steps": 0.005431413650512695, "step": 859}
{"info/global_step": 860, "train_info/time_within_train_step": 24.8814594745636, "step": 860}
{"train_info/time_between_train_steps": 0.005242109298706055, "step": 860}
{"info/global_step": 861, "train_info/time_within_train_step": 24.75252079963684, "step": 861}
{"train_info/time_between_train_steps": 0.010424137115478516, "step": 861}
{"info/global_step": 862, "train_info/time_within_train_step": 24.87264919281006, "step": 862}
{"train_info/time_between_train_steps": 0.005294322967529297, "step": 862}
{"info/global_step": 863, "train_info/time_within_train_step": 24.7731192111969, "step": 863}
{"train_info/time_between_train_steps": 0.005620002746582031, "step": 863}
{"info/global_step": 864, "train_info/time_within_train_step": 24.819195985794067, "step": 864}
{"train_info/time_between_train_steps": 0.005087375640869141, "step": 864}
{"info/global_step": 865, "train_info/time_within_train_step": 24.75111174583435, "step": 865}
{"train_info/time_between_train_steps": 0.0048847198486328125, "step": 865}
{"info/global_step": 866, "train_info/time_within_train_step": 24.732815742492676, "step": 866}
{"train_info/time_between_train_steps": 0.0051670074462890625, "step": 866}
{"info/global_step": 867, "train_info/time_within_train_step": 24.735766172409058, "step": 867}
{"train_info/time_between_train_steps": 0.010064125061035156, "step": 867}
{"info/global_step": 868, "train_info/time_within_train_step": 24.75270962715149, "step": 868}
{"train_info/time_between_train_steps": 0.010151863098144531, "step": 868}
{"info/global_step": 869, "train_info/time_within_train_step": 24.745765924453735, "step": 869}
{"train_info/time_between_train_steps": 0.005154132843017578, "step": 869}
{"info/global_step": 870, "train_info/time_within_train_step": 24.73708176612854, "step": 870}
{"train_info/time_between_train_steps": 0.009881019592285156, "step": 870}
{"info/global_step": 871, "train_info/time_within_train_step": 24.75837278366089, "step": 871}
{"train_info/time_between_train_steps": 0.009990930557250977, "step": 871}
{"info/global_step": 872, "train_info/time_within_train_step": 24.743107318878174, "step": 872}
{"train_info/time_between_train_steps": 0.010080337524414062, "step": 872}
{"info/global_step": 873, "train_info/time_within_train_step": 24.742371559143066, "step": 873}
{"train_info/time_between_train_steps": 0.004992008209228516, "step": 873}
{"info/global_step": 874, "train_info/time_within_train_step": 24.82385230064392, "step": 874}
{"train_info/time_between_train_steps": 0.005116939544677734, "step": 874}
{"info/global_step": 875, "train_info/time_within_train_step": 24.74836492538452, "step": 875}
{"train_info/time_between_train_steps": 0.0051686763763427734, "step": 875}
{"info/global_step": 876, "train_info/time_within_train_step": 24.738882541656494, "step": 876}
{"train_info/time_between_train_steps": 0.004912614822387695, "step": 876}
{"info/global_step": 877, "train_info/time_within_train_step": 24.745928525924683, "step": 877}
{"train_info/time_between_train_steps": 0.005099058151245117, "step": 877}
{"info/global_step": 878, "train_info/time_within_train_step": 24.739187479019165, "step": 878}
{"train_info/time_between_train_steps": 0.005151987075805664, "step": 878}
{"info/global_step": 879, "train_info/time_within_train_step": 24.73366928100586, "step": 879}
{"train_info/time_between_train_steps": 0.005076408386230469, "step": 879}
{"info/global_step": 880, "train_info/time_within_train_step": 24.7330641746521, "step": 880}
{"train_info/time_between_train_steps": 0.005020618438720703, "step": 880}
{"info/global_step": 881, "train_info/time_within_train_step": 24.748188018798828, "step": 881}
{"train_info/time_between_train_steps": 0.005357265472412109, "step": 881}
{"info/global_step": 882, "train_info/time_within_train_step": 24.748573303222656, "step": 882}
{"train_info/time_between_train_steps": 0.005173683166503906, "step": 882}
{"info/global_step": 883, "train_info/time_within_train_step": 24.755971908569336, "step": 883}
{"train_info/time_between_train_steps": 0.010692358016967773, "step": 883}
{"info/global_step": 884, "train_info/time_within_train_step": 24.77951145172119, "step": 884}
{"train_info/time_between_train_steps": 0.006517648696899414, "step": 884}
{"train_info/time_between_train_steps": 5.1995930671691895, "step": 884}
{"info/global_step": 885, "train_info/time_within_train_step": 24.721521377563477, "step": 885}
{"train_info/time_between_train_steps": 0.004874229431152344, "step": 885}
{"info/global_step": 886, "train_info/time_within_train_step": 24.836138010025024, "step": 886}
{"train_info/time_between_train_steps": 0.005028486251831055, "step": 886}
{"info/global_step": 887, "train_info/time_within_train_step": 24.745968341827393, "step": 887}
{"train_info/time_between_train_steps": 0.005333900451660156, "step": 887}
{"info/global_step": 888, "train_info/time_within_train_step": 24.855433464050293, "step": 888}
{"train_info/time_between_train_steps": 0.005362510681152344, "step": 888}
{"info/global_step": 889, "train_info/time_within_train_step": 24.82427215576172, "step": 889}
{"train_info/time_between_train_steps": 0.005102396011352539, "step": 889}
{"info/global_step": 890, "train_info/time_within_train_step": 24.896050453186035, "step": 890}
{"train_info/time_between_train_steps": 0.005311727523803711, "step": 890}
{"info/global_step": 891, "train_info/time_within_train_step": 24.74709677696228, "step": 891}
{"train_info/time_between_train_steps": 0.005227565765380859, "step": 891}
{"info/global_step": 892, "train_info/time_within_train_step": 24.847925186157227, "step": 892}
{"train_info/time_between_train_steps": 0.010123729705810547, "step": 892}
{"info/global_step": 893, "train_info/time_within_train_step": 24.747163772583008, "step": 893}
{"train_info/time_between_train_steps": 0.008237600326538086, "step": 893}
{"info/global_step": 894, "train_info/time_within_train_step": 24.889220476150513, "step": 894}
{"train_info/time_between_train_steps": 0.005917787551879883, "step": 894}
{"info/global_step": 895, "train_info/time_within_train_step": 24.742790937423706, "step": 895}
{"train_info/time_between_train_steps": 0.010251998901367188, "step": 895}
{"info/global_step": 896, "train_info/time_within_train_step": 24.87823224067688, "step": 896}
{"train_info/time_between_train_steps": 0.0105438232421875, "step": 896}
{"info/global_step": 897, "train_info/time_within_train_step": 24.842561960220337, "step": 897}
{"train_info/time_between_train_steps": 0.005578279495239258, "step": 897}
{"info/global_step": 898, "train_info/time_within_train_step": 24.80878186225891, "step": 898}
{"train_info/time_between_train_steps": 0.007184267044067383, "step": 898}
{"info/global_step": 899, "train_info/time_within_train_step": 24.76058316230774, "step": 899}
{"train_info/time_between_train_steps": 0.004893302917480469, "step": 899}
{"info/global_step": 900, "train_info/time_within_train_step": 24.736268281936646, "step": 900}
{"train_info": {"train_info/memory_allocated": 1581.5546875, "train_info/memory_max_allocated": 18057.0224609375, "train_info/memory_reserved": 19104.0, "train_info/memory_max_reserved": 19104.0, "_timestamp": 1740942682, "_runtime": 22593}, "step": 900}
{"logs": {"train/loss": 2.9245, "train/learning_rate": 0.00016666666666666666, "train/epoch": 26.01, "_timestamp": 1740942682, "_runtime": 22593}, "step": 900}
{"train_info/time_between_train_steps": 18.293416023254395, "step": 900}
{"info/global_step": 901, "train_info/time_within_train_step": 24.737264156341553, "step": 901}
{"train_info/time_between_train_steps": 0.0050046443939208984, "step": 901}
{"info/global_step": 902, "train_info/time_within_train_step": 24.73079228401184, "step": 902}
{"train_info/time_between_train_steps": 0.005228757858276367, "step": 902}
{"info/global_step": 903, "train_info/time_within_train_step": 24.73400640487671, "step": 903}
{"train_info/time_between_train_steps": 0.005161762237548828, "step": 903}
{"info/global_step": 904, "train_info/time_within_train_step": 24.730623483657837, "step": 904}
{"train_info/time_between_train_steps": 0.00503849983215332, "step": 904}
{"info/global_step": 905, "train_info/time_within_train_step": 24.831061124801636, "step": 905}
{"train_info/time_between_train_steps": 0.004949808120727539, "step": 905}
{"info/global_step": 906, "train_info/time_within_train_step": 24.734426498413086, "step": 906}
{"train_info/time_between_train_steps": 0.005193471908569336, "step": 906}
{"info/global_step": 907, "train_info/time_within_train_step": 24.733107089996338, "step": 907}
{"train_info/time_between_train_steps": 0.005086183547973633, "step": 907}
{"info/global_step": 908, "train_info/time_within_train_step": 24.733511447906494, "step": 908}
{"train_info/time_between_train_steps": 0.0051479339599609375, "step": 908}
{"info/global_step": 909, "train_info/time_within_train_step": 24.742443084716797, "step": 909}
{"train_info/time_between_train_steps": 0.005185842514038086, "step": 909}
{"info/global_step": 910, "train_info/time_within_train_step": 24.735383987426758, "step": 910}
{"train_info/time_between_train_steps": 0.005086421966552734, "step": 910}
{"info/global_step": 911, "train_info/time_within_train_step": 24.735469818115234, "step": 911}
{"train_info/time_between_train_steps": 0.005087614059448242, "step": 911}
{"info/global_step": 912, "train_info/time_within_train_step": 24.737317085266113, "step": 912}
{"train_info/time_between_train_steps": 0.005307674407958984, "step": 912}
{"info/global_step": 913, "train_info/time_within_train_step": 24.741678476333618, "step": 913}
{"train_info/time_between_train_steps": 0.0051004886627197266, "step": 913}
{"info/global_step": 914, "train_info/time_within_train_step": 24.735703945159912, "step": 914}
{"train_info/time_between_train_steps": 0.005128383636474609, "step": 914}
{"info/global_step": 915, "train_info/time_within_train_step": 24.74292254447937, "step": 915}
{"train_info/time_between_train_steps": 0.005288362503051758, "step": 915}
{"info/global_step": 916, "train_info/time_within_train_step": 24.745091676712036, "step": 916}
{"train_info/time_between_train_steps": 0.005156040191650391, "step": 916}
{"info/global_step": 917, "train_info/time_within_train_step": 24.752007961273193, "step": 917}
{"train_info/time_between_train_steps": 0.005522012710571289, "step": 917}
{"info/global_step": 918, "train_info/time_within_train_step": 24.77823781967163, "step": 918}
{"train_info/time_between_train_steps": 0.006041765213012695, "step": 918}
{"train_info/time_between_train_steps": 4.94118070602417, "step": 918}
{"info/global_step": 919, "train_info/time_within_train_step": 24.72512912750244, "step": 919}
{"train_info/time_between_train_steps": 0.004786491394042969, "step": 919}
{"info/global_step": 920, "train_info/time_within_train_step": 24.953460931777954, "step": 920}
{"train_info/time_between_train_steps": 0.0050241947174072266, "step": 920}
{"info/global_step": 921, "train_info/time_within_train_step": 24.747750282287598, "step": 921}
{"train_info/time_between_train_steps": 0.0052661895751953125, "step": 921}
{"info/global_step": 922, "train_info/time_within_train_step": 24.87618327140808, "step": 922}
{"train_info/time_between_train_steps": 0.010436296463012695, "step": 922}
{"info/global_step": 923, "train_info/time_within_train_step": 24.73814296722412, "step": 923}
{"train_info/time_between_train_steps": 0.005182504653930664, "step": 923}
{"info/global_step": 924, "train_info/time_within_train_step": 24.89376425743103, "step": 924}
{"train_info/time_between_train_steps": 0.005335807800292969, "step": 924}
{"info/global_step": 925, "train_info/time_within_train_step": 24.75312066078186, "step": 925}
{"train_info/time_between_train_steps": 0.005314350128173828, "step": 925}
{"info/global_step": 926, "train_info/time_within_train_step": 24.854260206222534, "step": 926}
{"train_info/time_between_train_steps": 0.010001420974731445, "step": 926}
{"info/global_step": 927, "train_info/time_within_train_step": 24.747204542160034, "step": 927}
{"train_info/time_between_train_steps": 0.005349636077880859, "step": 927}
{"info/global_step": 928, "train_info/time_within_train_step": 24.913373470306396, "step": 928}
{"train_info/time_between_train_steps": 0.0052525997161865234, "step": 928}
{"info/global_step": 929, "train_info/time_within_train_step": 24.749176502227783, "step": 929}
{"train_info/time_between_train_steps": 0.005312681198120117, "step": 929}
{"info/global_step": 930, "train_info/time_within_train_step": 24.86114811897278, "step": 930}
{"train_info/time_between_train_steps": 0.005297660827636719, "step": 930}
{"info/global_step": 931, "train_info/time_within_train_step": 24.75690507888794, "step": 931}
{"train_info/time_between_train_steps": 0.005556344985961914, "step": 931}
{"info/global_step": 932, "train_info/time_within_train_step": 24.82136344909668, "step": 932}
{"train_info/time_between_train_steps": 0.0052449703216552734, "step": 932}
{"info/global_step": 933, "train_info/time_within_train_step": 24.750139713287354, "step": 933}
{"train_info/time_between_train_steps": 0.005005359649658203, "step": 933}
{"info/global_step": 934, "train_info/time_within_train_step": 24.73408794403076, "step": 934}
{"train_info/time_between_train_steps": 0.005325794219970703, "step": 934}
{"info/global_step": 935, "train_info/time_within_train_step": 24.734386444091797, "step": 935}
{"train_info/time_between_train_steps": 0.004972934722900391, "step": 935}
{"info/global_step": 936, "train_info/time_within_train_step": 24.819382667541504, "step": 936}
{"train_info/time_between_train_steps": 0.005007743835449219, "step": 936}
{"info/global_step": 937, "train_info/time_within_train_step": 24.73298454284668, "step": 937}
{"train_info/time_between_train_steps": 0.005028724670410156, "step": 937}
{"info/global_step": 938, "train_info/time_within_train_step": 24.729300022125244, "step": 938}
{"train_info/time_between_train_steps": 0.0050160884857177734, "step": 938}
{"info/global_step": 939, "train_info/time_within_train_step": 24.738168478012085, "step": 939}
{"train_info/time_between_train_steps": 0.009977579116821289, "step": 939}
{"info/global_step": 940, "train_info/time_within_train_step": 24.73225212097168, "step": 940}
{"train_info/time_between_train_steps": 0.010007381439208984, "step": 940}
{"info/global_step": 941, "train_info/time_within_train_step": 24.73315930366516, "step": 941}
{"train_info/time_between_train_steps": 0.009805440902709961, "step": 941}
{"info/global_step": 942, "train_info/time_within_train_step": 24.74220585823059, "step": 942}
{"train_info/time_between_train_steps": 0.01015329360961914, "step": 942}
{"info/global_step": 943, "train_info/time_within_train_step": 24.740252017974854, "step": 943}
{"train_info/time_between_train_steps": 0.005257129669189453, "step": 943}
{"info/global_step": 944, "train_info/time_within_train_step": 24.74307656288147, "step": 944}
{"train_info/time_between_train_steps": 0.004919767379760742, "step": 944}
{"info/global_step": 945, "train_info/time_within_train_step": 24.965453147888184, "step": 945}
{"train_info/time_between_train_steps": 0.005287885665893555, "step": 945}
{"info/global_step": 946, "train_info/time_within_train_step": 24.777655601501465, "step": 946}
{"train_info/time_between_train_steps": 0.007153511047363281, "step": 946}
{"info/global_step": 947, "train_info/time_within_train_step": 24.7368426322937, "step": 947}
{"train_info/time_between_train_steps": 0.005065441131591797, "step": 947}
{"info/global_step": 948, "train_info/time_within_train_step": 24.739182233810425, "step": 948}
{"train_info/time_between_train_steps": 0.005160808563232422, "step": 948}
{"info/global_step": 949, "train_info/time_within_train_step": 24.742422819137573, "step": 949}
{"train_info/time_between_train_steps": 0.00533747673034668, "step": 949}
{"info/global_step": 950, "train_info/time_within_train_step": 24.74461793899536, "step": 950}
{"train_info": {"train_info/memory_allocated": 1581.5546875, "train_info/memory_max_allocated": 18057.0224609375, "train_info/memory_reserved": 19104.0, "train_info/memory_max_reserved": 19104.0, "_timestamp": 1740943945, "_runtime": 23856}, "step": 950}
{"logs": {"train/loss": 2.8828, "train/learning_rate": 0.0001388888888888889, "train/epoch": 27.03, "_timestamp": 1740943945, "_runtime": 23856}, "step": 950}
{"train_info/time_between_train_steps": 0.015385866165161133, "step": 950}
{"info/global_step": 951, "train_info/time_within_train_step": 24.765313148498535, "step": 951}
{"train_info/time_between_train_steps": 0.0056304931640625, "step": 951}
{"info/global_step": 952, "train_info/time_within_train_step": 24.872532844543457, "step": 952}
{"train_info/time_between_train_steps": 0.00567317008972168, "step": 952}
{"train_info/time_between_train_steps": 5.1262171268463135, "step": 952}
{"info/global_step": 953, "train_info/time_within_train_step": 24.740983247756958, "step": 953}
{"train_info/time_between_train_steps": 0.004983425140380859, "step": 953}
{"info/global_step": 954, "train_info/time_within_train_step": 24.892764806747437, "step": 954}
{"train_info/time_between_train_steps": 0.005164623260498047, "step": 954}
{"info/global_step": 955, "train_info/time_within_train_step": 24.749382495880127, "step": 955}
{"train_info/time_between_train_steps": 0.005257606506347656, "step": 955}
{"info/global_step": 956, "train_info/time_within_train_step": 24.879669427871704, "step": 956}
{"train_info/time_between_train_steps": 0.006251335144042969, "step": 956}
{"info/global_step": 957, "train_info/time_within_train_step": 24.7354416847229, "step": 957}
{"train_info/time_between_train_steps": 0.0051190853118896484, "step": 957}
{"info/global_step": 958, "train_info/time_within_train_step": 24.901258945465088, "step": 958}
{"train_info/time_between_train_steps": 0.005556821823120117, "step": 958}
{"info/global_step": 959, "train_info/time_within_train_step": 24.742106199264526, "step": 959}
{"train_info/time_between_train_steps": 0.005210399627685547, "step": 959}
{"info/global_step": 960, "train_info/time_within_train_step": 24.8530695438385, "step": 960}
{"train_info/time_between_train_steps": 0.005095243453979492, "step": 960}
{"info/global_step": 961, "train_info/time_within_train_step": 24.76705503463745, "step": 961}
{"train_info/time_between_train_steps": 0.005578041076660156, "step": 961}
{"info/global_step": 962, "train_info/time_within_train_step": 24.883227348327637, "step": 962}
{"train_info/time_between_train_steps": 0.005196809768676758, "step": 962}
{"info/global_step": 963, "train_info/time_within_train_step": 24.752398014068604, "step": 963}
{"train_info/time_between_train_steps": 0.0053098201751708984, "step": 963}
{"info/global_step": 964, "train_info/time_within_train_step": 24.89039444923401, "step": 964}
{"train_info/time_between_train_steps": 0.006713151931762695, "step": 964}
{"info/global_step": 965, "train_info/time_within_train_step": 24.768248081207275, "step": 965}
{"train_info/time_between_train_steps": 0.00540614128112793, "step": 965}
{"info/global_step": 966, "train_info/time_within_train_step": 24.814319610595703, "step": 966}
{"train_info/time_between_train_steps": 0.005273580551147461, "step": 966}
{"info/global_step": 967, "train_info/time_within_train_step": 24.853972911834717, "step": 967}
{"train_info/time_between_train_steps": 0.0050013065338134766, "step": 967}
{"info/global_step": 968, "train_info/time_within_train_step": 24.74630117416382, "step": 968}
{"train_info/time_between_train_steps": 0.009910345077514648, "step": 968}
{"info/global_step": 969, "train_info/time_within_train_step": 24.750214338302612, "step": 969}
{"train_info/time_between_train_steps": 0.004916191101074219, "step": 969}
{"info/global_step": 970, "train_info/time_within_train_step": 24.73115372657776, "step": 970}
{"train_info/time_between_train_steps": 0.005056858062744141, "step": 970}
{"info/global_step": 971, "train_info/time_within_train_step": 24.732321739196777, "step": 971}
{"train_info/time_between_train_steps": 0.005111217498779297, "step": 971}
{"info/global_step": 972, "train_info/time_within_train_step": 24.72966694831848, "step": 972}
{"train_info/time_between_train_steps": 0.004984140396118164, "step": 972}
{"info/global_step": 973, "train_info/time_within_train_step": 24.75279474258423, "step": 973}
{"train_info/time_between_train_steps": 0.005015373229980469, "step": 973}
{"info/global_step": 974, "train_info/time_within_train_step": 24.741918563842773, "step": 974}
{"train_info/time_between_train_steps": 0.0060520172119140625, "step": 974}
{"info/global_step": 975, "train_info/time_within_train_step": 24.748592376708984, "step": 975}
{"train_info/time_between_train_steps": 0.0049855709075927734, "step": 975}
{"info/global_step": 976, "train_info/time_within_train_step": 24.74134922027588, "step": 976}
{"train_info/time_between_train_steps": 0.005114078521728516, "step": 976}
{"info/global_step": 977, "train_info/time_within_train_step": 24.744691848754883, "step": 977}
{"train_info/time_between_train_steps": 0.005071163177490234, "step": 977}
{"info/global_step": 978, "train_info/time_within_train_step": 24.73592519760132, "step": 978}
{"train_info/time_between_train_steps": 0.0050525665283203125, "step": 978}
{"info/global_step": 979, "train_info/time_within_train_step": 24.73751735687256, "step": 979}
{"train_info/time_between_train_steps": 0.0050923824310302734, "step": 979}
{"info/global_step": 980, "train_info/time_within_train_step": 24.734169483184814, "step": 980}
{"train_info/time_between_train_steps": 0.005124807357788086, "step": 980}
{"info/global_step": 981, "train_info/time_within_train_step": 24.733536958694458, "step": 981}
{"train_info/time_between_train_steps": 0.00503993034362793, "step": 981}
{"info/global_step": 982, "train_info/time_within_train_step": 24.74267268180847, "step": 982}
{"train_info/time_between_train_steps": 0.005045175552368164, "step": 982}
{"info/global_step": 983, "train_info/time_within_train_step": 24.833707332611084, "step": 983}
{"train_info/time_between_train_steps": 0.0062236785888671875, "step": 983}
{"info/global_step": 984, "train_info/time_within_train_step": 24.75015115737915, "step": 984}
{"train_info/time_between_train_steps": 0.005378246307373047, "step": 984}
{"info/global_step": 985, "train_info/time_within_train_step": 24.770047187805176, "step": 985}
{"train_info/time_between_train_steps": 0.009067058563232422, "step": 985}
{"info/global_step": 986, "train_info/time_within_train_step": 24.792525053024292, "step": 986}
{"train_info/time_between_train_steps": 0.0057830810546875, "step": 986}
{"train_info/time_between_train_steps": 5.2486748695373535, "step": 986}
{"info/global_step": 987, "train_info/time_within_train_step": 24.73691177368164, "step": 987}
{"train_info/time_between_train_steps": 0.0047607421875, "step": 987}
{"info/global_step": 988, "train_info/time_within_train_step": 24.871479749679565, "step": 988}
{"train_info/time_between_train_steps": 0.009413957595825195, "step": 988}
{"info/global_step": 989, "train_info/time_within_train_step": 24.748512268066406, "step": 989}
{"train_info/time_between_train_steps": 0.005238056182861328, "step": 989}
{"info/global_step": 990, "train_info/time_within_train_step": 24.85158371925354, "step": 990}
{"train_info/time_between_train_steps": 0.00524592399597168, "step": 990}
{"info/global_step": 991, "train_info/time_within_train_step": 24.74134111404419, "step": 991}
{"train_info/time_between_train_steps": 0.00918126106262207, "step": 991}
{"info/global_step": 992, "train_info/time_within_train_step": 24.891923189163208, "step": 992}
{"train_info/time_between_train_steps": 0.0052716732025146484, "step": 992}
{"info/global_step": 993, "train_info/time_within_train_step": 24.740737676620483, "step": 993}
{"train_info/time_between_train_steps": 0.005361795425415039, "step": 993}
{"info/global_step": 994, "train_info/time_within_train_step": 24.853770971298218, "step": 994}
{"train_info/time_between_train_steps": 0.005171775817871094, "step": 994}
{"info/global_step": 995, "train_info/time_within_train_step": 24.74477791786194, "step": 995}
{"train_info/time_between_train_steps": 0.005322694778442383, "step": 995}
{"info/global_step": 996, "train_info/time_within_train_step": 24.885828018188477, "step": 996}
{"train_info/time_between_train_steps": 0.005210399627685547, "step": 996}
{"info/global_step": 997, "train_info/time_within_train_step": 24.73964834213257, "step": 997}
{"train_info/time_between_train_steps": 0.005158901214599609, "step": 997}
{"info/global_step": 998, "train_info/time_within_train_step": 24.972063064575195, "step": 998}
{"train_info/time_between_train_steps": 0.005331516265869141, "step": 998}
{"info/global_step": 999, "train_info/time_within_train_step": 24.75139284133911, "step": 999}
{"train_info/time_between_train_steps": 0.005383491516113281, "step": 999}
{"info/global_step": 1000, "train_info/time_within_train_step": 24.80208921432495, "step": 1000}
{"train_info": {"train_info/memory_allocated": 1581.5546875, "train_info/memory_max_allocated": 18057.0224609375, "train_info/memory_reserved": 19104.0, "train_info/memory_max_reserved": 19104.0, "_timestamp": 1740945195, "_runtime": 25106}, "step": 1000}
{"logs": {"train/loss": 2.8517, "train/learning_rate": 0.00011111111111111109, "train/epoch": 29.01, "_timestamp": 1740945195, "_runtime": 25106}, "step": 1000}
{"train_info": {"train_info/memory_allocated": 1581.5546875, "train_info/memory_max_allocated": 18057.0224609375, "train_info/memory_reserved": 21960.0, "train_info/memory_max_reserved": 21960.0, "_timestamp": 1740945198, "_runtime": 25109}, "step": 1000}
{"logs": {"eval/loss": 3.6034152507781982, "eval/runtime": 2.188, "eval/samples_per_second": 57.129, "eval/steps_per_second": 3.656, "train/epoch": 29.01, "_timestamp": 1740945198, "_runtime": 25109}, "step": 1000}
{"train_info": {"train_info/memory_allocated": 1581.5546875, "train_info/memory_max_allocated": 18057.0224609375, "train_info/memory_reserved": 21960.0, "train_info/memory_max_reserved": 21960.0, "_timestamp": 1740945198, "_runtime": 25109}, "step": 1000}
{"logs": {"eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_loss": 3.6034152507781982, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_ppl": 36.723440275299986, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_runtime": 2.188, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_samples_per_second": 57.129, "train/epoch": 29.01, "_timestamp": 1740945198, "_runtime": 25109}, "step": 1000}
{"train_info/time_between_train_steps": 16.75835418701172, "step": 1000}
{"info/global_step": 1001, "train_info/time_within_train_step": 24.78515124320984, "step": 1001}
{"train_info/time_between_train_steps": 0.0051343441009521484, "step": 1001}
{"info/global_step": 1002, "train_info/time_within_train_step": 24.735469102859497, "step": 1002}
{"train_info/time_between_train_steps": 0.009742021560668945, "step": 1002}
{"info/global_step": 1003, "train_info/time_within_train_step": 24.729798078536987, "step": 1003}
{"train_info/time_between_train_steps": 0.009601831436157227, "step": 1003}
{"info/global_step": 1004, "train_info/time_within_train_step": 24.73819923400879, "step": 1004}
{"train_info/time_between_train_steps": 0.005195140838623047, "step": 1004}
{"info/global_step": 1005, "train_info/time_within_train_step": 24.73814344406128, "step": 1005}
{"train_info/time_between_train_steps": 0.004896879196166992, "step": 1005}
{"info/global_step": 1006, "train_info/time_within_train_step": 24.73424243927002, "step": 1006}
{"train_info/time_between_train_steps": 0.005862236022949219, "step": 1006}
{"info/global_step": 1007, "train_info/time_within_train_step": 24.7495858669281, "step": 1007}
{"train_info/time_between_train_steps": 0.005125761032104492, "step": 1007}
{"info/global_step": 1008, "train_info/time_within_train_step": 24.736500024795532, "step": 1008}
{"train_info/time_between_train_steps": 0.004954338073730469, "step": 1008}
{"info/global_step": 1009, "train_info/time_within_train_step": 24.735714435577393, "step": 1009}
{"train_info/time_between_train_steps": 0.005006551742553711, "step": 1009}
{"info/global_step": 1010, "train_info/time_within_train_step": 24.73499822616577, "step": 1010}
{"train_info/time_between_train_steps": 0.006016731262207031, "step": 1010}
{"info/global_step": 1011, "train_info/time_within_train_step": 24.732688665390015, "step": 1011}
{"train_info/time_between_train_steps": 0.005049467086791992, "step": 1011}
{"info/global_step": 1012, "train_info/time_within_train_step": 24.734997034072876, "step": 1012}
{"train_info/time_between_train_steps": 0.005003213882446289, "step": 1012}
{"info/global_step": 1013, "train_info/time_within_train_step": 24.74205708503723, "step": 1013}
{"train_info/time_between_train_steps": 0.0051419734954833984, "step": 1013}
{"info/global_step": 1014, "train_info/time_within_train_step": 24.825170755386353, "step": 1014}
{"train_info/time_between_train_steps": 0.005179166793823242, "step": 1014}
{"info/global_step": 1015, "train_info/time_within_train_step": 24.74096393585205, "step": 1015}
{"train_info/time_between_train_steps": 0.00501704216003418, "step": 1015}
{"info/global_step": 1016, "train_info/time_within_train_step": 24.744569778442383, "step": 1016}
{"train_info/time_between_train_steps": 0.004985332489013672, "step": 1016}
{"info/global_step": 1017, "train_info/time_within_train_step": 24.7456374168396, "step": 1017}
{"train_info/time_between_train_steps": 0.0052394866943359375, "step": 1017}
{"info/global_step": 1018, "train_info/time_within_train_step": 24.75002431869507, "step": 1018}
{"train_info/time_between_train_steps": 0.010416507720947266, "step": 1018}
{"info/global_step": 1019, "train_info/time_within_train_step": 24.762285470962524, "step": 1019}
{"train_info/time_between_train_steps": 0.005587339401245117, "step": 1019}
{"info/global_step": 1020, "train_info/time_within_train_step": 24.784470081329346, "step": 1020}
{"train_info/time_between_train_steps": 0.0067980289459228516, "step": 1020}
{"train_info/time_between_train_steps": 5.007440805435181, "step": 1020}
{"info/global_step": 1021, "train_info/time_within_train_step": 24.974412202835083, "step": 1021}
{"train_info/time_between_train_steps": 0.004863262176513672, "step": 1021}
{"info/global_step": 1022, "train_info/time_within_train_step": 24.885623693466187, "step": 1022}
{"train_info/time_between_train_steps": 0.004993915557861328, "step": 1022}
{"info/global_step": 1023, "train_info/time_within_train_step": 24.752718448638916, "step": 1023}
{"train_info/time_between_train_steps": 0.005161762237548828, "step": 1023}
{"info/global_step": 1024, "train_info/time_within_train_step": 24.849137544631958, "step": 1024}
{"train_info/time_between_train_steps": 0.005136728286743164, "step": 1024}
{"info/global_step": 1025, "train_info/time_within_train_step": 24.737316370010376, "step": 1025}
{"train_info/time_between_train_steps": 0.005131244659423828, "step": 1025}
{"info/global_step": 1026, "train_info/time_within_train_step": 24.904560565948486, "step": 1026}
{"train_info/time_between_train_steps": 0.0058481693267822266, "step": 1026}
{"info/global_step": 1027, "train_info/time_within_train_step": 24.739434719085693, "step": 1027}
{"train_info/time_between_train_steps": 0.00504755973815918, "step": 1027}
{"info/global_step": 1028, "train_info/time_within_train_step": 24.8510639667511, "step": 1028}
{"train_info/time_between_train_steps": 0.005042552947998047, "step": 1028}
{"info/global_step": 1029, "train_info/time_within_train_step": 24.83392906188965, "step": 1029}
{"train_info/time_between_train_steps": 0.005414724349975586, "step": 1029}
{"info/global_step": 1030, "train_info/time_within_train_step": 24.863687992095947, "step": 1030}
{"train_info/time_between_train_steps": 0.005276679992675781, "step": 1030}
{"info/global_step": 1031, "train_info/time_within_train_step": 24.73900008201599, "step": 1031}
{"train_info/time_between_train_steps": 0.00525975227355957, "step": 1031}
{"info/global_step": 1032, "train_info/time_within_train_step": 24.88993501663208, "step": 1032}
{"train_info/time_between_train_steps": 0.005285501480102539, "step": 1032}
{"info/global_step": 1033, "train_info/time_within_train_step": 24.755873680114746, "step": 1033}
{"train_info/time_between_train_steps": 0.0052525997161865234, "step": 1033}
{"info/global_step": 1034, "train_info/time_within_train_step": 24.813108921051025, "step": 1034}
{"train_info/time_between_train_steps": 0.005141496658325195, "step": 1034}
{"info/global_step": 1035, "train_info/time_within_train_step": 24.7487051486969, "step": 1035}
{"train_info/time_between_train_steps": 0.004907131195068359, "step": 1035}
{"info/global_step": 1036, "train_info/time_within_train_step": 24.733892679214478, "step": 1036}
{"train_info/time_between_train_steps": 0.005087137222290039, "step": 1036}
{"info/global_step": 1037, "train_info/time_within_train_step": 24.727938890457153, "step": 1037}
{"train_info/time_between_train_steps": 0.004950523376464844, "step": 1037}
{"info/global_step": 1038, "train_info/time_within_train_step": 24.7278790473938, "step": 1038}
{"train_info/time_between_train_steps": 0.005023479461669922, "step": 1038}
{"info/global_step": 1039, "train_info/time_within_train_step": 24.74013376235962, "step": 1039}
{"train_info/time_between_train_steps": 0.005067586898803711, "step": 1039}
{"info/global_step": 1040, "train_info/time_within_train_step": 24.740692138671875, "step": 1040}
{"train_info/time_between_train_steps": 0.005016803741455078, "step": 1040}
{"info/global_step": 1041, "train_info/time_within_train_step": 24.745171546936035, "step": 1041}
{"train_info/time_between_train_steps": 0.005042076110839844, "step": 1041}
{"info/global_step": 1042, "train_info/time_within_train_step": 24.749491453170776, "step": 1042}
{"train_info/time_between_train_steps": 0.005198240280151367, "step": 1042}
{"info/global_step": 1043, "train_info/time_within_train_step": 24.74141836166382, "step": 1043}
{"train_info/time_between_train_steps": 0.005973339080810547, "step": 1043}
{"info/global_step": 1044, "train_info/time_within_train_step": 24.732882499694824, "step": 1044}
{"train_info/time_between_train_steps": 0.005227804183959961, "step": 1044}
{"info/global_step": 1045, "train_info/time_within_train_step": 24.825211763381958, "step": 1045}
{"train_info/time_between_train_steps": 0.010250329971313477, "step": 1045}
{"info/global_step": 1046, "train_info/time_within_train_step": 24.736858367919922, "step": 1046}
{"train_info/time_between_train_steps": 0.005014896392822266, "step": 1046}
{"info/global_step": 1047, "train_info/time_within_train_step": 24.755456686019897, "step": 1047}
{"train_info/time_between_train_steps": 0.005540609359741211, "step": 1047}
{"info/global_step": 1048, "train_info/time_within_train_step": 24.887818574905396, "step": 1048}
{"train_info/time_between_train_steps": 0.005234718322753906, "step": 1048}
{"info/global_step": 1049, "train_info/time_within_train_step": 24.736143350601196, "step": 1049}
{"train_info/time_between_train_steps": 0.004995584487915039, "step": 1049}
{"info/global_step": 1050, "train_info/time_within_train_step": 24.732226371765137, "step": 1050}
{"train_info": {"train_info/memory_allocated": 1581.5546875, "train_info/memory_max_allocated": 18057.0224609375, "train_info/memory_reserved": 21960.0, "train_info/memory_max_reserved": 21960.0, "_timestamp": 1740946456, "_runtime": 26367}, "step": 1050}
{"logs": {"train/loss": 2.8153, "train/learning_rate": 8.333333333333333e-05, "train/epoch": 30.02, "_timestamp": 1740946456, "_runtime": 26367}, "step": 1050}
{"train_info/time_between_train_steps": 0.008616447448730469, "step": 1050}
{"info/global_step": 1051, "train_info/time_within_train_step": 24.73636531829834, "step": 1051}
{"train_info/time_between_train_steps": 0.0051727294921875, "step": 1051}
{"info/global_step": 1052, "train_info/time_within_train_step": 24.751734018325806, "step": 1052}
{"train_info/time_between_train_steps": 0.005186319351196289, "step": 1052}
{"info/global_step": 1053, "train_info/time_within_train_step": 24.75111699104309, "step": 1053}
{"train_info/time_between_train_steps": 0.005530357360839844, "step": 1053}
{"info/global_step": 1054, "train_info/time_within_train_step": 24.91477370262146, "step": 1054}
{"train_info/time_between_train_steps": 0.006164073944091797, "step": 1054}
{"train_info/time_between_train_steps": 4.988671779632568, "step": 1054}
{"info/global_step": 1055, "train_info/time_within_train_step": 24.730581045150757, "step": 1055}
{"train_info/time_between_train_steps": 0.004843950271606445, "step": 1055}
{"info/global_step": 1056, "train_info/time_within_train_step": 24.834989309310913, "step": 1056}
{"train_info/time_between_train_steps": 0.004963874816894531, "step": 1056}
{"info/global_step": 1057, "train_info/time_within_train_step": 24.741113662719727, "step": 1057}
{"train_info/time_between_train_steps": 0.005429983139038086, "step": 1057}
{"info/global_step": 1058, "train_info/time_within_train_step": 24.896669387817383, "step": 1058}
{"train_info/time_between_train_steps": 0.005417346954345703, "step": 1058}
{"info/global_step": 1059, "train_info/time_within_train_step": 24.748435258865356, "step": 1059}
{"train_info/time_between_train_steps": 0.0050830841064453125, "step": 1059}
{"info/global_step": 1060, "train_info/time_within_train_step": 24.880038499832153, "step": 1060}
{"train_info/time_between_train_steps": 0.005263328552246094, "step": 1060}
{"info/global_step": 1061, "train_info/time_within_train_step": 24.853325366973877, "step": 1061}
{"train_info/time_between_train_steps": 0.005666255950927734, "step": 1061}
{"info/global_step": 1062, "train_info/time_within_train_step": 24.88454294204712, "step": 1062}
{"train_info/time_between_train_steps": 0.0071794986724853516, "step": 1062}
{"info/global_step": 1063, "train_info/time_within_train_step": 24.74895405769348, "step": 1063}
{"train_info/time_between_train_steps": 0.0052835941314697266, "step": 1063}
{"info/global_step": 1064, "train_info/time_within_train_step": 24.931083917617798, "step": 1064}
{"train_info/time_between_train_steps": 0.00516057014465332, "step": 1064}
{"info/global_step": 1065, "train_info/time_within_train_step": 24.797163248062134, "step": 1065}
{"train_info/time_between_train_steps": 0.0053937435150146484, "step": 1065}
{"info/global_step": 1066, "train_info/time_within_train_step": 24.929473400115967, "step": 1066}
{"train_info/time_between_train_steps": 0.005265474319458008, "step": 1066}
{"info/global_step": 1067, "train_info/time_within_train_step": 24.85111665725708, "step": 1067}
{"train_info/time_between_train_steps": 0.00572967529296875, "step": 1067}
{"info/global_step": 1068, "train_info/time_within_train_step": 24.832199811935425, "step": 1068}
{"train_info/time_between_train_steps": 0.005118608474731445, "step": 1068}
{"info/global_step": 1069, "train_info/time_within_train_step": 24.85094404220581, "step": 1069}
{"train_info/time_between_train_steps": 0.004887104034423828, "step": 1069}
{"info/global_step": 1070, "train_info/time_within_train_step": 24.806568145751953, "step": 1070}
{"train_info/time_between_train_steps": 0.005131959915161133, "step": 1070}
{"info/global_step": 1071, "train_info/time_within_train_step": 24.815837860107422, "step": 1071}
{"train_info/time_between_train_steps": 0.0049016475677490234, "step": 1071}
{"info/global_step": 1072, "train_info/time_within_train_step": 24.864219903945923, "step": 1072}
{"train_info/time_between_train_steps": 0.0050165653228759766, "step": 1072}
{"info/global_step": 1073, "train_info/time_within_train_step": 24.7812020778656, "step": 1073}
{"train_info/time_between_train_steps": 0.0051610469818115234, "step": 1073}
{"info/global_step": 1074, "train_info/time_within_train_step": 24.862202644348145, "step": 1074}
{"train_info/time_between_train_steps": 0.00502467155456543, "step": 1074}
{"info/global_step": 1075, "train_info/time_within_train_step": 24.864962100982666, "step": 1075}
{"train_info/time_between_train_steps": 0.0050792694091796875, "step": 1075}
{"info/global_step": 1076, "train_info/time_within_train_step": 24.838151216506958, "step": 1076}
{"train_info/time_between_train_steps": 0.0051877498626708984, "step": 1076}
{"info/global_step": 1077, "train_info/time_within_train_step": 24.920220613479614, "step": 1077}
{"train_info/time_between_train_steps": 0.005040884017944336, "step": 1077}
{"info/global_step": 1078, "train_info/time_within_train_step": 24.805391550064087, "step": 1078}
{"train_info/time_between_train_steps": 0.005095243453979492, "step": 1078}
{"info/global_step": 1079, "train_info/time_within_train_step": 24.82115650177002, "step": 1079}
{"train_info/time_between_train_steps": 0.0050601959228515625, "step": 1079}
{"info/global_step": 1080, "train_info/time_within_train_step": 24.86413073539734, "step": 1080}
{"train_info/time_between_train_steps": 0.00512242317199707, "step": 1080}
{"info/global_step": 1081, "train_info/time_within_train_step": 24.751189947128296, "step": 1081}
{"train_info/time_between_train_steps": 0.004979610443115234, "step": 1081}
{"info/global_step": 1082, "train_info/time_within_train_step": 24.744818687438965, "step": 1082}
{"train_info/time_between_train_steps": 0.005291461944580078, "step": 1082}
{"info/global_step": 1083, "train_info/time_within_train_step": 24.840547800064087, "step": 1083}
{"train_info/time_between_train_steps": 0.0050847530364990234, "step": 1083}
{"info/global_step": 1084, "train_info/time_within_train_step": 24.75126576423645, "step": 1084}
{"train_info/time_between_train_steps": 0.0050656795501708984, "step": 1084}
{"info/global_step": 1085, "train_info/time_within_train_step": 24.747551679611206, "step": 1085}
{"train_info/time_between_train_steps": 0.005185604095458984, "step": 1085}
{"info/global_step": 1086, "train_info/time_within_train_step": 24.761295080184937, "step": 1086}
{"train_info/time_between_train_steps": 0.005340576171875, "step": 1086}
{"info/global_step": 1087, "train_info/time_within_train_step": 24.763726949691772, "step": 1087}
{"train_info/time_between_train_steps": 0.005346536636352539, "step": 1087}
{"info/global_step": 1088, "train_info/time_within_train_step": 24.782508850097656, "step": 1088}
{"train_info/time_between_train_steps": 0.0058710575103759766, "step": 1088}
{"train_info/time_between_train_steps": 5.215270519256592, "step": 1088}
{"info/global_step": 1089, "train_info/time_within_train_step": 24.73370361328125, "step": 1089}
{"train_info/time_between_train_steps": 0.004937410354614258, "step": 1089}
{"info/global_step": 1090, "train_info/time_within_train_step": 24.840214729309082, "step": 1090}
{"train_info/time_between_train_steps": 0.009830713272094727, "step": 1090}
{"info/global_step": 1091, "train_info/time_within_train_step": 24.745601654052734, "step": 1091}
{"train_info/time_between_train_steps": 0.009590625762939453, "step": 1091}
{"info/global_step": 1092, "train_info/time_within_train_step": 24.991545915603638, "step": 1092}
{"train_info/time_between_train_steps": 0.005522489547729492, "step": 1092}
{"info/global_step": 1093, "train_info/time_within_train_step": 24.740122318267822, "step": 1093}
{"train_info/time_between_train_steps": 0.0051250457763671875, "step": 1093}
{"info/global_step": 1094, "train_info/time_within_train_step": 24.861422538757324, "step": 1094}
{"train_info/time_between_train_steps": 0.005192756652832031, "step": 1094}
{"info/global_step": 1095, "train_info/time_within_train_step": 24.75605607032776, "step": 1095}
{"train_info/time_between_train_steps": 0.00531458854675293, "step": 1095}
{"info/global_step": 1096, "train_info/time_within_train_step": 24.876007318496704, "step": 1096}
{"train_info/time_between_train_steps": 0.0050470829010009766, "step": 1096}
{"info/global_step": 1097, "train_info/time_within_train_step": 24.75364875793457, "step": 1097}
{"train_info/time_between_train_steps": 0.006029605865478516, "step": 1097}
{"info/global_step": 1098, "train_info/time_within_train_step": 24.906179428100586, "step": 1098}
{"train_info/time_between_train_steps": 0.005123138427734375, "step": 1098}
{"info/global_step": 1099, "train_info/time_within_train_step": 24.75841212272644, "step": 1099}
{"train_info/time_between_train_steps": 0.005289793014526367, "step": 1099}
{"info/global_step": 1100, "train_info/time_within_train_step": 24.871258974075317, "step": 1100}
{"train_info": {"train_info/memory_allocated": 1581.5546875, "train_info/memory_max_allocated": 18057.0224609375, "train_info/memory_reserved": 21960.0, "train_info/memory_max_reserved": 21960.0, "_timestamp": 1740947708, "_runtime": 27619}, "step": 1100}
{"logs": {"train/loss": 2.7906, "train/learning_rate": 5.5555555555555545e-05, "train/epoch": 32.01, "_timestamp": 1740947708, "_runtime": 27619}, "step": 1100}
{"train_info/time_between_train_steps": 11.981548309326172, "step": 1100}
{"info/global_step": 1101, "train_info/time_within_train_step": 24.78836989402771, "step": 1101}
{"train_info/time_between_train_steps": 0.005401611328125, "step": 1101}
{"info/global_step": 1102, "train_info/time_within_train_step": 25.01677107810974, "step": 1102}
{"train_info/time_between_train_steps": 0.005091190338134766, "step": 1102}
{"info/global_step": 1103, "train_info/time_within_train_step": 24.735819101333618, "step": 1103}
{"train_info/time_between_train_steps": 0.004750967025756836, "step": 1103}
{"info/global_step": 1104, "train_info/time_within_train_step": 24.72482204437256, "step": 1104}
{"train_info/time_between_train_steps": 0.004947662353515625, "step": 1104}
{"info/global_step": 1105, "train_info/time_within_train_step": 24.745993852615356, "step": 1105}
{"train_info/time_between_train_steps": 0.00513768196105957, "step": 1105}
{"info/global_step": 1106, "train_info/time_within_train_step": 24.736786365509033, "step": 1106}
{"train_info/time_between_train_steps": 0.0050771236419677734, "step": 1106}
{"info/global_step": 1107, "train_info/time_within_train_step": 24.827090978622437, "step": 1107}
{"train_info/time_between_train_steps": 0.004949092864990234, "step": 1107}
{"info/global_step": 1108, "train_info/time_within_train_step": 24.73524045944214, "step": 1108}
{"train_info/time_between_train_steps": 0.0051364898681640625, "step": 1108}
{"info/global_step": 1109, "train_info/time_within_train_step": 24.753793716430664, "step": 1109}
{"train_info/time_between_train_steps": 0.005380153656005859, "step": 1109}
{"info/global_step": 1110, "train_info/time_within_train_step": 24.74251389503479, "step": 1110}
{"train_info/time_between_train_steps": 0.005457878112792969, "step": 1110}
{"info/global_step": 1111, "train_info/time_within_train_step": 24.73648738861084, "step": 1111}
{"train_info/time_between_train_steps": 0.005077838897705078, "step": 1111}
{"info/global_step": 1112, "train_info/time_within_train_step": 24.733436107635498, "step": 1112}
{"train_info/time_between_train_steps": 0.005029201507568359, "step": 1112}
{"info/global_step": 1113, "train_info/time_within_train_step": 24.736164331436157, "step": 1113}
{"train_info/time_between_train_steps": 0.005967140197753906, "step": 1113}
{"info/global_step": 1114, "train_info/time_within_train_step": 24.758759260177612, "step": 1114}
{"train_info/time_between_train_steps": 0.005072355270385742, "step": 1114}
{"info/global_step": 1115, "train_info/time_within_train_step": 24.741222620010376, "step": 1115}
{"train_info/time_between_train_steps": 0.005088329315185547, "step": 1115}
{"info/global_step": 1116, "train_info/time_within_train_step": 24.73537254333496, "step": 1116}
{"train_info/time_between_train_steps": 0.0050847530364990234, "step": 1116}
{"info/global_step": 1117, "train_info/time_within_train_step": 24.745615005493164, "step": 1117}
{"train_info/time_between_train_steps": 0.005236148834228516, "step": 1117}
{"info/global_step": 1118, "train_info/time_within_train_step": 24.738025188446045, "step": 1118}
{"train_info/time_between_train_steps": 0.0050427913665771484, "step": 1118}
{"info/global_step": 1119, "train_info/time_within_train_step": 24.74389624595642, "step": 1119}
{"train_info/time_between_train_steps": 0.0051953792572021484, "step": 1119}
{"info/global_step": 1120, "train_info/time_within_train_step": 24.75368309020996, "step": 1120}
{"train_info/time_between_train_steps": 0.005446672439575195, "step": 1120}
{"info/global_step": 1121, "train_info/time_within_train_step": 24.835537910461426, "step": 1121}
{"train_info/time_between_train_steps": 0.005556344985961914, "step": 1121}
{"info/global_step": 1122, "train_info/time_within_train_step": 24.784913539886475, "step": 1122}
{"train_info/time_between_train_steps": 0.0057773590087890625, "step": 1122}
{"train_info/time_between_train_steps": 5.431433200836182, "step": 1122}
{"info/global_step": 1123, "train_info/time_within_train_step": 24.874668836593628, "step": 1123}
{"train_info/time_between_train_steps": 0.0051038265228271484, "step": 1123}
{"info/global_step": 1124, "train_info/time_within_train_step": 24.836130619049072, "step": 1124}
{"train_info/time_between_train_steps": 0.00494694709777832, "step": 1124}
{"info/global_step": 1125, "train_info/time_within_train_step": 24.735222101211548, "step": 1125}
{"train_info/time_between_train_steps": 0.005021572113037109, "step": 1125}
{"info/global_step": 1126, "train_info/time_within_train_step": 24.89668035507202, "step": 1126}
{"train_info/time_between_train_steps": 0.005368471145629883, "step": 1126}
{"info/global_step": 1127, "train_info/time_within_train_step": 24.814770936965942, "step": 1127}
{"train_info/time_between_train_steps": 0.0050885677337646484, "step": 1127}
{"info/global_step": 1128, "train_info/time_within_train_step": 24.867023468017578, "step": 1128}
{"train_info/time_between_train_steps": 0.00520634651184082, "step": 1128}
{"info/global_step": 1129, "train_info/time_within_train_step": 24.88012385368347, "step": 1129}
{"train_info/time_between_train_steps": 0.00526118278503418, "step": 1129}
{"info/global_step": 1130, "train_info/time_within_train_step": 24.88142967224121, "step": 1130}
{"train_info/time_between_train_steps": 0.005278348922729492, "step": 1130}
{"info/global_step": 1131, "train_info/time_within_train_step": 24.749903440475464, "step": 1131}
{"train_info/time_between_train_steps": 0.005167961120605469, "step": 1131}
{"info/global_step": 1132, "train_info/time_within_train_step": 24.887627840042114, "step": 1132}
{"train_info/time_between_train_steps": 0.0071299076080322266, "step": 1132}
{"info/global_step": 1133, "train_info/time_within_train_step": 24.749542474746704, "step": 1133}
{"train_info/time_between_train_steps": 0.0073163509368896484, "step": 1133}
{"info/global_step": 1134, "train_info/time_within_train_step": 24.855805158615112, "step": 1134}
{"train_info/time_between_train_steps": 0.005257368087768555, "step": 1134}
{"info/global_step": 1135, "train_info/time_within_train_step": 24.75735592842102, "step": 1135}
{"train_info/time_between_train_steps": 0.006976604461669922, "step": 1135}
{"info/global_step": 1136, "train_info/time_within_train_step": 24.81652045249939, "step": 1136}
{"train_info/time_between_train_steps": 0.005200624465942383, "step": 1136}
{"info/global_step": 1137, "train_info/time_within_train_step": 24.747105360031128, "step": 1137}
{"train_info/time_between_train_steps": 0.0048868656158447266, "step": 1137}
{"info/global_step": 1138, "train_info/time_within_train_step": 24.733964681625366, "step": 1138}
{"train_info/time_between_train_steps": 0.005022525787353516, "step": 1138}
{"info/global_step": 1139, "train_info/time_within_train_step": 24.822150945663452, "step": 1139}
{"train_info/time_between_train_steps": 0.005093812942504883, "step": 1139}
{"info/global_step": 1140, "train_info/time_within_train_step": 24.73378038406372, "step": 1140}
{"train_info/time_between_train_steps": 0.004979133605957031, "step": 1140}
{"info/global_step": 1141, "train_info/time_within_train_step": 24.731776475906372, "step": 1141}
{"train_info/time_between_train_steps": 0.004934072494506836, "step": 1141}
{"info/global_step": 1142, "train_info/time_within_train_step": 24.75628137588501, "step": 1142}
{"train_info/time_between_train_steps": 0.010684490203857422, "step": 1142}
{"info/global_step": 1143, "train_info/time_within_train_step": 24.758147716522217, "step": 1143}
{"train_info/time_between_train_steps": 0.005063056945800781, "step": 1143}
{"info/global_step": 1144, "train_info/time_within_train_step": 24.73966073989868, "step": 1144}
{"train_info/time_between_train_steps": 0.009240150451660156, "step": 1144}
{"info/global_step": 1145, "train_info/time_within_train_step": 24.928630113601685, "step": 1145}
{"train_info/time_between_train_steps": 0.009459495544433594, "step": 1145}
{"info/global_step": 1146, "train_info/time_within_train_step": 24.739048957824707, "step": 1146}
{"train_info/time_between_train_steps": 0.005106210708618164, "step": 1146}
{"info/global_step": 1147, "train_info/time_within_train_step": 24.73452663421631, "step": 1147}
{"train_info/time_between_train_steps": 0.005216360092163086, "step": 1147}
{"info/global_step": 1148, "train_info/time_within_train_step": 24.735958337783813, "step": 1148}
{"train_info/time_between_train_steps": 0.009501934051513672, "step": 1148}
{"info/global_step": 1149, "train_info/time_within_train_step": 24.94100069999695, "step": 1149}
{"train_info/time_between_train_steps": 0.005103588104248047, "step": 1149}
{"info/global_step": 1150, "train_info/time_within_train_step": 24.735499143600464, "step": 1150}
{"train_info": {"train_info/memory_allocated": 1581.5546875, "train_info/memory_max_allocated": 18057.0224609375, "train_info/memory_reserved": 21960.0, "train_info/memory_max_reserved": 21960.0, "_timestamp": 1740948965, "_runtime": 28876}, "step": 1150}
{"logs": {"train/loss": 2.7617, "train/learning_rate": 2.7777777777777772e-05, "train/epoch": 33.02, "_timestamp": 1740948965, "_runtime": 28876}, "step": 1150}
{"train_info/time_between_train_steps": 0.008869171142578125, "step": 1150}
{"info/global_step": 1151, "train_info/time_within_train_step": 24.748843908309937, "step": 1151}
{"train_info/time_between_train_steps": 0.00526118278503418, "step": 1151}
{"info/global_step": 1152, "train_info/time_within_train_step": 24.74847149848938, "step": 1152}
{"train_info/time_between_train_steps": 0.0049932003021240234, "step": 1152}
{"info/global_step": 1153, "train_info/time_within_train_step": 24.741109132766724, "step": 1153}
{"train_info/time_between_train_steps": 0.005384922027587891, "step": 1153}
{"info/global_step": 1154, "train_info/time_within_train_step": 24.82947540283203, "step": 1154}
{"train_info/time_between_train_steps": 0.005237579345703125, "step": 1154}
{"info/global_step": 1155, "train_info/time_within_train_step": 24.763916492462158, "step": 1155}
{"train_info/time_between_train_steps": 0.009108543395996094, "step": 1155}
{"info/global_step": 1156, "train_info/time_within_train_step": 24.76762104034424, "step": 1156}
{"train_info/time_between_train_steps": 0.010960102081298828, "step": 1156}
{"train_info/time_between_train_steps": 4.955047369003296, "step": 1156}
{"info/global_step": 1157, "train_info/time_within_train_step": 24.749000787734985, "step": 1157}
{"train_info/time_between_train_steps": 0.005326032638549805, "step": 1157}
{"info/global_step": 1158, "train_info/time_within_train_step": 24.86748743057251, "step": 1158}
{"train_info/time_between_train_steps": 0.0052661895751953125, "step": 1158}
{"info/global_step": 1159, "train_info/time_within_train_step": 24.731801748275757, "step": 1159}
{"train_info/time_between_train_steps": 0.0050084590911865234, "step": 1159}
{"info/global_step": 1160, "train_info/time_within_train_step": 24.84636640548706, "step": 1160}
{"train_info/time_between_train_steps": 0.005124092102050781, "step": 1160}
{"info/global_step": 1161, "train_info/time_within_train_step": 24.73783779144287, "step": 1161}
{"train_info/time_between_train_steps": 0.0054128170013427734, "step": 1161}
{"info/global_step": 1162, "train_info/time_within_train_step": 24.89162850379944, "step": 1162}
{"train_info/time_between_train_steps": 0.0053081512451171875, "step": 1162}
{"info/global_step": 1163, "train_info/time_within_train_step": 24.744975805282593, "step": 1163}
{"train_info/time_between_train_steps": 0.005193948745727539, "step": 1163}
{"info/global_step": 1164, "train_info/time_within_train_step": 24.86790108680725, "step": 1164}
{"train_info/time_between_train_steps": 0.005100727081298828, "step": 1164}
{"info/global_step": 1165, "train_info/time_within_train_step": 24.756397008895874, "step": 1165}
{"train_info/time_between_train_steps": 0.005393266677856445, "step": 1165}
{"info/global_step": 1166, "train_info/time_within_train_step": 24.86513042449951, "step": 1166}
{"train_info/time_between_train_steps": 0.005101203918457031, "step": 1166}
{"info/global_step": 1167, "train_info/time_within_train_step": 24.748547077178955, "step": 1167}
{"train_info/time_between_train_steps": 0.010386943817138672, "step": 1167}
{"info/global_step": 1168, "train_info/time_within_train_step": 24.910316467285156, "step": 1168}
{"train_info/time_between_train_steps": 0.010100364685058594, "step": 1168}
{"info/global_step": 1169, "train_info/time_within_train_step": 24.73851776123047, "step": 1169}
{"train_info/time_between_train_steps": 0.010208606719970703, "step": 1169}
{"info/global_step": 1170, "train_info/time_within_train_step": 24.89320707321167, "step": 1170}
{"train_info/time_between_train_steps": 0.010451793670654297, "step": 1170}
{"info/global_step": 1171, "train_info/time_within_train_step": 24.76414132118225, "step": 1171}
{"train_info/time_between_train_steps": 0.009840965270996094, "step": 1171}
{"info/global_step": 1172, "train_info/time_within_train_step": 24.730381727218628, "step": 1172}
{"train_info/time_between_train_steps": 0.004906892776489258, "step": 1172}
{"info/global_step": 1173, "train_info/time_within_train_step": 24.731504678726196, "step": 1173}
{"train_info/time_between_train_steps": 0.0050601959228515625, "step": 1173}
{"info/global_step": 1174, "train_info/time_within_train_step": 24.73419690132141, "step": 1174}
{"train_info/time_between_train_steps": 0.005194902420043945, "step": 1174}
{"info/global_step": 1175, "train_info/time_within_train_step": 24.730759382247925, "step": 1175}
{"train_info/time_between_train_steps": 0.004965305328369141, "step": 1175}
{"info/global_step": 1176, "train_info/time_within_train_step": 24.732258319854736, "step": 1176}
{"train_info/time_between_train_steps": 0.0050640106201171875, "step": 1176}
{"info/global_step": 1177, "train_info/time_within_train_step": 24.752427339553833, "step": 1177}
{"train_info/time_between_train_steps": 0.005180835723876953, "step": 1177}
{"info/global_step": 1178, "train_info/time_within_train_step": 24.79007124900818, "step": 1178}
{"train_info/time_between_train_steps": 0.009814023971557617, "step": 1178}
{"info/global_step": 1179, "train_info/time_within_train_step": 24.830644845962524, "step": 1179}
{"train_info/time_between_train_steps": 0.00539398193359375, "step": 1179}
{"info/global_step": 1180, "train_info/time_within_train_step": 24.755497932434082, "step": 1180}
{"train_info/time_between_train_steps": 0.005280733108520508, "step": 1180}
{"info/global_step": 1181, "train_info/time_within_train_step": 24.865291357040405, "step": 1181}
{"train_info/time_between_train_steps": 0.005064249038696289, "step": 1181}
{"info/global_step": 1182, "train_info/time_within_train_step": 24.862280130386353, "step": 1182}
{"train_info/time_between_train_steps": 0.005002260208129883, "step": 1182}
{"info/global_step": 1183, "train_info/time_within_train_step": 24.877304553985596, "step": 1183}
{"train_info/time_between_train_steps": 0.005173444747924805, "step": 1183}
{"info/global_step": 1184, "train_info/time_within_train_step": 24.74685287475586, "step": 1184}
{"train_info/time_between_train_steps": 0.00991058349609375, "step": 1184}
{"info/global_step": 1185, "train_info/time_within_train_step": 24.992945194244385, "step": 1185}
{"train_info/time_between_train_steps": 0.0050656795501708984, "step": 1185}
{"info/global_step": 1186, "train_info/time_within_train_step": 24.830803632736206, "step": 1186}
{"train_info/time_between_train_steps": 0.005246639251708984, "step": 1186}
{"info/global_step": 1187, "train_info/time_within_train_step": 24.74946928024292, "step": 1187}
{"train_info/time_between_train_steps": 0.005278110504150391, "step": 1187}
{"info/global_step": 1188, "train_info/time_within_train_step": 24.74472141265869, "step": 1188}
{"train_info/time_between_train_steps": 0.005303859710693359, "step": 1188}
{"info/global_step": 1189, "train_info/time_within_train_step": 24.75689196586609, "step": 1189}
{"train_info/time_between_train_steps": 0.005463838577270508, "step": 1189}
{"info/global_step": 1190, "train_info/time_within_train_step": 24.772303819656372, "step": 1190}
{"train_info/time_between_train_steps": 0.005722761154174805, "step": 1190}
{"train_info/time_between_train_steps": 5.162113189697266, "step": 1190}
{"info/global_step": 1191, "train_info/time_within_train_step": 24.740589380264282, "step": 1191}
{"train_info/time_between_train_steps": 0.004927396774291992, "step": 1191}
{"info/global_step": 1192, "train_info/time_within_train_step": 24.896800756454468, "step": 1192}
{"train_info/time_between_train_steps": 0.00523686408996582, "step": 1192}
{"info/global_step": 1193, "train_info/time_within_train_step": 24.806026935577393, "step": 1193}
{"train_info/time_between_train_steps": 0.005263328552246094, "step": 1193}
{"info/global_step": 1194, "train_info/time_within_train_step": 24.852476358413696, "step": 1194}
{"train_info/time_between_train_steps": 0.005318641662597656, "step": 1194}
{"info/global_step": 1195, "train_info/time_within_train_step": 24.747018814086914, "step": 1195}
{"train_info/time_between_train_steps": 0.0054225921630859375, "step": 1195}
{"info/global_step": 1196, "train_info/time_within_train_step": 24.90599298477173, "step": 1196}
{"train_info/time_between_train_steps": 0.005473613739013672, "step": 1196}
{"info/global_step": 1197, "train_info/time_within_train_step": 24.74543261528015, "step": 1197}
{"train_info/time_between_train_steps": 0.005196571350097656, "step": 1197}
{"info/global_step": 1198, "train_info/time_within_train_step": 24.87511658668518, "step": 1198}
{"train_info/time_between_train_steps": 0.0053174495697021484, "step": 1198}
{"info/global_step": 1199, "train_info/time_within_train_step": 24.753899335861206, "step": 1199}
{"train_info/time_between_train_steps": 0.005558967590332031, "step": 1199}
{"info/global_step": 1200, "train_info/time_within_train_step": 24.86520743370056, "step": 1200}
{"train_info": {"train_info/memory_allocated": 1581.5546875, "train_info/memory_max_allocated": 18057.0224609375, "train_info/memory_reserved": 21960.0, "train_info/memory_max_reserved": 21960.0, "_timestamp": 1740950216, "_runtime": 30127}, "step": 1200}
{"logs": {"train/loss": 2.7459, "train/learning_rate": 0.0, "train/epoch": 35.01, "_timestamp": 1740950216, "_runtime": 30127}, "step": 1200}
{"train_info": {"train_info/memory_allocated": 1581.5546875, "train_info/memory_max_allocated": 18057.0224609375, "train_info/memory_reserved": 21960.0, "train_info/memory_max_reserved": 21960.0, "_timestamp": 1740950243, "_runtime": 30154}, "step": 1200}
{"logs": {"train/train_runtime": 30155.4308, "train/train_samples_per_second": 20.374, "train/train_steps_per_second": 0.04, "train/total_flos": 3.2177068572672e+17, "train/train_loss": 3.564861613114675, "train/epoch": 35.01, "_timestamp": 1740950243, "_runtime": 30154}, "step": 1200}
{"train_info": {"train_info/memory_allocated": 1581.5537109375, "train_info/memory_max_allocated": 18057.0224609375, "train_info/memory_reserved": 21960.0, "train_info/memory_max_reserved": 21960.0, "_timestamp": 1740950267, "_runtime": 30178}, "step": 1200}
{"logs": {"eval/loss": 3.62945556640625, "eval/runtime": 3.6726, "eval/samples_per_second": 34.036, "eval/steps_per_second": 2.178, "train/epoch": 35.01, "_timestamp": 1740950267, "_runtime": 30178}, "step": 1200}
{"train_info": {"train_info/memory_allocated": 1581.5537109375, "train_info/memory_max_allocated": 18057.0224609375, "train_info/memory_reserved": 21960.0, "train_info/memory_max_reserved": 21960.0, "_timestamp": 1740950268, "_runtime": 30179}, "step": 1200}
{"logs": {"eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_loss": 3.62945556640625, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_ppl": 37.69229008107535, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_runtime": 3.6726, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_samples_per_second": 34.036, "train/epoch": 35.01, "_timestamp": 1740950268, "_runtime": 30179}, "step": 1200}