GPT2_small_TR53 / metrics.json
xiulinyang's picture
Adding model checkpoints and config files
2eae8f4
{"num_parameters": 124439808, "trainable_parameters": 124439808, "step": 0}
{"train_info/time_between_train_steps": 3.821139097213745, "step": 0}
{"info/global_step": 1, "train_info/time_within_train_step": 28.533889055252075, "step": 1}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 19761.71484375, "train_info/memory_reserved": 22624.0, "train_info/memory_max_reserved": 22624.0, "_timestamp": 1733861725, "_runtime": 37}, "step": 1}
{"logs": {"train/loss": 10.8568, "train/learning_rate": 4.9999999999999996e-06, "train/epoch": 0.0, "_timestamp": 1733861725, "_runtime": 37}, "step": 1}
{"train_info/time_between_train_steps": 0.008469104766845703, "step": 1}
{"info/global_step": 2, "train_info/time_within_train_step": 28.037352323532104, "step": 2}
{"train_info/time_between_train_steps": 0.005648136138916016, "step": 2}
{"info/global_step": 3, "train_info/time_within_train_step": 27.87070369720459, "step": 3}
{"train_info/time_between_train_steps": 0.005811452865600586, "step": 3}
{"info/global_step": 4, "train_info/time_within_train_step": 28.119908809661865, "step": 4}
{"train_info/time_between_train_steps": 0.010096311569213867, "step": 4}
{"info/global_step": 5, "train_info/time_within_train_step": 28.18924331665039, "step": 5}
{"train_info/time_between_train_steps": 0.005335807800292969, "step": 5}
{"info/global_step": 6, "train_info/time_within_train_step": 27.95185136795044, "step": 6}
{"train_info/time_between_train_steps": 0.0058629512786865234, "step": 6}
{"info/global_step": 7, "train_info/time_within_train_step": 28.15664267539978, "step": 7}
{"train_info/time_between_train_steps": 0.013402462005615234, "step": 7}
{"info/global_step": 8, "train_info/time_within_train_step": 27.89963722229004, "step": 8}
{"train_info/time_between_train_steps": 0.014599084854125977, "step": 8}
{"info/global_step": 9, "train_info/time_within_train_step": 28.237628936767578, "step": 9}
{"train_info/time_between_train_steps": 0.00685882568359375, "step": 9}
{"info/global_step": 10, "train_info/time_within_train_step": 27.834078788757324, "step": 10}
{"train_info/time_between_train_steps": 0.013814210891723633, "step": 10}
{"info/global_step": 11, "train_info/time_within_train_step": 28.312318325042725, "step": 11}
{"train_info/time_between_train_steps": 0.006107330322265625, "step": 11}
{"info/global_step": 12, "train_info/time_within_train_step": 28.011987924575806, "step": 12}
{"train_info/time_between_train_steps": 0.005248308181762695, "step": 12}
{"info/global_step": 13, "train_info/time_within_train_step": 27.861613273620605, "step": 13}
{"train_info/time_between_train_steps": 0.005290985107421875, "step": 13}
{"info/global_step": 14, "train_info/time_within_train_step": 27.869736194610596, "step": 14}
{"train_info/time_between_train_steps": 0.0052640438079833984, "step": 14}
{"info/global_step": 15, "train_info/time_within_train_step": 27.908385515213013, "step": 15}
{"train_info/time_between_train_steps": 0.005279541015625, "step": 15}
{"info/global_step": 16, "train_info/time_within_train_step": 27.986371994018555, "step": 16}
{"train_info/time_between_train_steps": 0.0054624080657958984, "step": 16}
{"info/global_step": 17, "train_info/time_within_train_step": 27.933210849761963, "step": 17}
{"train_info/time_between_train_steps": 0.005207538604736328, "step": 17}
{"info/global_step": 18, "train_info/time_within_train_step": 27.833080053329468, "step": 18}
{"train_info/time_between_train_steps": 0.005620718002319336, "step": 18}
{"info/global_step": 19, "train_info/time_within_train_step": 27.832363605499268, "step": 19}
{"train_info/time_between_train_steps": 0.010288476943969727, "step": 19}
{"info/global_step": 20, "train_info/time_within_train_step": 27.97080087661743, "step": 20}
{"train_info/time_between_train_steps": 0.007299661636352539, "step": 20}
{"info/global_step": 21, "train_info/time_within_train_step": 27.89056944847107, "step": 21}
{"train_info/time_between_train_steps": 0.005644321441650391, "step": 21}
{"info/global_step": 22, "train_info/time_within_train_step": 27.957114696502686, "step": 22}
{"train_info/time_between_train_steps": 0.006374359130859375, "step": 22}
{"info/global_step": 23, "train_info/time_within_train_step": 27.912258625030518, "step": 23}
{"train_info/time_between_train_steps": 0.005713939666748047, "step": 23}
{"info/global_step": 24, "train_info/time_within_train_step": 27.911243200302124, "step": 24}
{"train_info/time_between_train_steps": 0.00562286376953125, "step": 24}
{"train_info/time_between_train_steps": 5.126796722412109, "step": 24}
{"info/global_step": 25, "train_info/time_within_train_step": 27.819792985916138, "step": 25}
{"train_info/time_between_train_steps": 0.005560874938964844, "step": 25}
{"info/global_step": 26, "train_info/time_within_train_step": 28.104661464691162, "step": 26}
{"train_info/time_between_train_steps": 0.0054476261138916016, "step": 26}
{"info/global_step": 27, "train_info/time_within_train_step": 27.90863800048828, "step": 27}
{"train_info/time_between_train_steps": 0.0054759979248046875, "step": 27}
{"info/global_step": 28, "train_info/time_within_train_step": 28.002175331115723, "step": 28}
{"train_info/time_between_train_steps": 0.005541801452636719, "step": 28}
{"info/global_step": 29, "train_info/time_within_train_step": 27.869744777679443, "step": 29}
{"train_info/time_between_train_steps": 0.005255460739135742, "step": 29}
{"info/global_step": 30, "train_info/time_within_train_step": 27.88740587234497, "step": 30}
{"train_info/time_between_train_steps": 0.005084037780761719, "step": 30}
{"info/global_step": 31, "train_info/time_within_train_step": 27.947638750076294, "step": 31}
{"train_info/time_between_train_steps": 0.005289793014526367, "step": 31}
{"info/global_step": 32, "train_info/time_within_train_step": 28.10380220413208, "step": 32}
{"train_info/time_between_train_steps": 0.009924650192260742, "step": 32}
{"info/global_step": 33, "train_info/time_within_train_step": 27.89262628555298, "step": 33}
{"train_info/time_between_train_steps": 0.0055010318756103516, "step": 33}
{"info/global_step": 34, "train_info/time_within_train_step": 27.8582661151886, "step": 34}
{"train_info/time_between_train_steps": 0.0054607391357421875, "step": 34}
{"info/global_step": 35, "train_info/time_within_train_step": 27.92349410057068, "step": 35}
{"train_info/time_between_train_steps": 0.009967803955078125, "step": 35}
{"info/global_step": 36, "train_info/time_within_train_step": 27.88943123817444, "step": 36}
{"train_info/time_between_train_steps": 0.005645275115966797, "step": 36}
{"info/global_step": 37, "train_info/time_within_train_step": 27.88342046737671, "step": 37}
{"train_info/time_between_train_steps": 0.010091781616210938, "step": 37}
{"info/global_step": 38, "train_info/time_within_train_step": 27.82862401008606, "step": 38}
{"train_info/time_between_train_steps": 0.005346059799194336, "step": 38}
{"info/global_step": 39, "train_info/time_within_train_step": 27.98231291770935, "step": 39}
{"train_info/time_between_train_steps": 0.009741067886352539, "step": 39}
{"info/global_step": 40, "train_info/time_within_train_step": 27.859386205673218, "step": 40}
{"train_info/time_between_train_steps": 0.0057337284088134766, "step": 40}
{"info/global_step": 41, "train_info/time_within_train_step": 27.910923957824707, "step": 41}
{"train_info/time_between_train_steps": 0.005632877349853516, "step": 41}
{"info/global_step": 42, "train_info/time_within_train_step": 27.88668203353882, "step": 42}
{"train_info/time_between_train_steps": 0.014742851257324219, "step": 42}
{"info/global_step": 43, "train_info/time_within_train_step": 27.924360990524292, "step": 43}
{"train_info/time_between_train_steps": 0.005479097366333008, "step": 43}
{"info/global_step": 44, "train_info/time_within_train_step": 27.88132882118225, "step": 44}
{"train_info/time_between_train_steps": 0.014685869216918945, "step": 44}
{"info/global_step": 45, "train_info/time_within_train_step": 27.976166009902954, "step": 45}
{"train_info/time_between_train_steps": 0.01074528694152832, "step": 45}
{"info/global_step": 46, "train_info/time_within_train_step": 27.91370916366577, "step": 46}
{"train_info/time_between_train_steps": 0.0055637359619140625, "step": 46}
{"info/global_step": 47, "train_info/time_within_train_step": 28.028409957885742, "step": 47}
{"train_info/time_between_train_steps": 0.005727529525756836, "step": 47}
{"info/global_step": 48, "train_info/time_within_train_step": 27.91259527206421, "step": 48}
{"train_info/time_between_train_steps": 0.005834102630615234, "step": 48}
{"train_info/time_between_train_steps": 5.275522232055664, "step": 48}
{"info/global_step": 49, "train_info/time_within_train_step": 27.926105737686157, "step": 49}
{"train_info/time_between_train_steps": 0.005899667739868164, "step": 49}
{"info/global_step": 50, "train_info/time_within_train_step": 28.046265602111816, "step": 50}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22648.0, "train_info/memory_max_reserved": 22648.0, "_timestamp": 1733863106, "_runtime": 1418}, "step": 50}
{"logs": {"train/loss": 8.4903, "train/learning_rate": 0.00025, "train/epoch": 2.0, "_timestamp": 1733863106, "_runtime": 1418}, "step": 50}
{"train_info/time_between_train_steps": 0.018194198608398438, "step": 50}
{"info/global_step": 51, "train_info/time_within_train_step": 27.860803365707397, "step": 51}
{"train_info/time_between_train_steps": 0.005678415298461914, "step": 51}
{"info/global_step": 52, "train_info/time_within_train_step": 27.95051383972168, "step": 52}
{"train_info/time_between_train_steps": 0.005599498748779297, "step": 52}
{"info/global_step": 53, "train_info/time_within_train_step": 27.84534239768982, "step": 53}
{"train_info/time_between_train_steps": 0.005167722702026367, "step": 53}
{"info/global_step": 54, "train_info/time_within_train_step": 27.898667812347412, "step": 54}
{"train_info/time_between_train_steps": 0.005662202835083008, "step": 54}
{"info/global_step": 55, "train_info/time_within_train_step": 27.82908058166504, "step": 55}
{"train_info/time_between_train_steps": 0.005223751068115234, "step": 55}
{"info/global_step": 56, "train_info/time_within_train_step": 27.924776315689087, "step": 56}
{"train_info/time_between_train_steps": 0.005299091339111328, "step": 56}
{"info/global_step": 57, "train_info/time_within_train_step": 27.85494303703308, "step": 57}
{"train_info/time_between_train_steps": 0.012265205383300781, "step": 57}
{"info/global_step": 58, "train_info/time_within_train_step": 27.89437484741211, "step": 58}
{"train_info/time_between_train_steps": 0.01020669937133789, "step": 58}
{"info/global_step": 59, "train_info/time_within_train_step": 27.883049726486206, "step": 59}
{"train_info/time_between_train_steps": 0.005450010299682617, "step": 59}
{"info/global_step": 60, "train_info/time_within_train_step": 27.914623975753784, "step": 60}
{"train_info/time_between_train_steps": 0.005243062973022461, "step": 60}
{"info/global_step": 61, "train_info/time_within_train_step": 27.864964485168457, "step": 61}
{"train_info/time_between_train_steps": 0.005204677581787109, "step": 61}
{"info/global_step": 62, "train_info/time_within_train_step": 27.89541006088257, "step": 62}
{"train_info/time_between_train_steps": 0.005498170852661133, "step": 62}
{"info/global_step": 63, "train_info/time_within_train_step": 28.01825761795044, "step": 63}
{"train_info/time_between_train_steps": 0.005452394485473633, "step": 63}
{"info/global_step": 64, "train_info/time_within_train_step": 27.840373992919922, "step": 64}
{"train_info/time_between_train_steps": 0.0054509639739990234, "step": 64}
{"info/global_step": 65, "train_info/time_within_train_step": 27.91447901725769, "step": 65}
{"train_info/time_between_train_steps": 0.005467653274536133, "step": 65}
{"info/global_step": 66, "train_info/time_within_train_step": 27.868010759353638, "step": 66}
{"train_info/time_between_train_steps": 0.009564638137817383, "step": 66}
{"info/global_step": 67, "train_info/time_within_train_step": 27.89435911178589, "step": 67}
{"train_info/time_between_train_steps": 0.006176471710205078, "step": 67}
{"info/global_step": 68, "train_info/time_within_train_step": 27.859719276428223, "step": 68}
{"train_info/time_between_train_steps": 0.005562782287597656, "step": 68}
{"info/global_step": 69, "train_info/time_within_train_step": 27.964381456375122, "step": 69}
{"train_info/time_between_train_steps": 0.005448818206787109, "step": 69}
{"info/global_step": 70, "train_info/time_within_train_step": 27.82854700088501, "step": 70}
{"train_info/time_between_train_steps": 0.011949777603149414, "step": 70}
{"info/global_step": 71, "train_info/time_within_train_step": 27.937572717666626, "step": 71}
{"train_info/time_between_train_steps": 0.005756378173828125, "step": 71}
{"info/global_step": 72, "train_info/time_within_train_step": 27.877082109451294, "step": 72}
{"train_info/time_between_train_steps": 0.005797386169433594, "step": 72}
{"train_info/time_between_train_steps": 5.539104461669922, "step": 72}
{"info/global_step": 73, "train_info/time_within_train_step": 27.92402696609497, "step": 73}
{"train_info/time_between_train_steps": 0.011109352111816406, "step": 73}
{"info/global_step": 74, "train_info/time_within_train_step": 28.00415802001953, "step": 74}
{"train_info/time_between_train_steps": 0.006369590759277344, "step": 74}
{"info/global_step": 75, "train_info/time_within_train_step": 27.94434690475464, "step": 75}
{"train_info/time_between_train_steps": 0.0053560733795166016, "step": 75}
{"info/global_step": 76, "train_info/time_within_train_step": 27.982746124267578, "step": 76}
{"train_info/time_between_train_steps": 0.005368471145629883, "step": 76}
{"info/global_step": 77, "train_info/time_within_train_step": 27.895103693008423, "step": 77}
{"train_info/time_between_train_steps": 0.006207466125488281, "step": 77}
{"info/global_step": 78, "train_info/time_within_train_step": 27.97312641143799, "step": 78}
{"train_info/time_between_train_steps": 0.005048990249633789, "step": 78}
{"info/global_step": 79, "train_info/time_within_train_step": 27.880038022994995, "step": 79}
{"train_info/time_between_train_steps": 0.005433797836303711, "step": 79}
{"info/global_step": 80, "train_info/time_within_train_step": 27.864113569259644, "step": 80}
{"train_info/time_between_train_steps": 0.005471229553222656, "step": 80}
{"info/global_step": 81, "train_info/time_within_train_step": 27.88240623474121, "step": 81}
{"train_info/time_between_train_steps": 0.005268573760986328, "step": 81}
{"info/global_step": 82, "train_info/time_within_train_step": 27.937636137008667, "step": 82}
{"train_info/time_between_train_steps": 0.0065059661865234375, "step": 82}
{"info/global_step": 83, "train_info/time_within_train_step": 27.875128030776978, "step": 83}
{"train_info/time_between_train_steps": 0.005377531051635742, "step": 83}
{"info/global_step": 84, "train_info/time_within_train_step": 27.833176612854004, "step": 84}
{"train_info/time_between_train_steps": 0.013754844665527344, "step": 84}
{"info/global_step": 85, "train_info/time_within_train_step": 27.91662859916687, "step": 85}
{"train_info/time_between_train_steps": 0.005378007888793945, "step": 85}
{"info/global_step": 86, "train_info/time_within_train_step": 27.929656982421875, "step": 86}
{"train_info/time_between_train_steps": 0.010367870330810547, "step": 86}
{"info/global_step": 87, "train_info/time_within_train_step": 27.86956238746643, "step": 87}
{"train_info/time_between_train_steps": 0.0109100341796875, "step": 87}
{"info/global_step": 88, "train_info/time_within_train_step": 27.96914505958557, "step": 88}
{"train_info/time_between_train_steps": 0.005514860153198242, "step": 88}
{"info/global_step": 89, "train_info/time_within_train_step": 27.8777859210968, "step": 89}
{"train_info/time_between_train_steps": 0.005585432052612305, "step": 89}
{"info/global_step": 90, "train_info/time_within_train_step": 27.92362093925476, "step": 90}
{"train_info/time_between_train_steps": 0.005262613296508789, "step": 90}
{"info/global_step": 91, "train_info/time_within_train_step": 27.891221046447754, "step": 91}
{"train_info/time_between_train_steps": 0.009668827056884766, "step": 91}
{"info/global_step": 92, "train_info/time_within_train_step": 27.906431436538696, "step": 92}
{"train_info/time_between_train_steps": 0.005475759506225586, "step": 92}
{"info/global_step": 93, "train_info/time_within_train_step": 27.924067735671997, "step": 93}
{"train_info/time_between_train_steps": 0.010826349258422852, "step": 93}
{"info/global_step": 94, "train_info/time_within_train_step": 27.95855140686035, "step": 94}
{"train_info/time_between_train_steps": 0.0054624080657958984, "step": 94}
{"info/global_step": 95, "train_info/time_within_train_step": 27.871114015579224, "step": 95}
{"train_info/time_between_train_steps": 0.005692958831787109, "step": 95}
{"info/global_step": 96, "train_info/time_within_train_step": 27.877554178237915, "step": 96}
{"train_info/time_between_train_steps": 0.0058100223541259766, "step": 96}
{"train_info/time_between_train_steps": 5.1437668800354, "step": 96}
{"info/global_step": 97, "train_info/time_within_train_step": 27.86967706680298, "step": 97}
{"train_info/time_between_train_steps": 0.005918979644775391, "step": 97}
{"info/global_step": 98, "train_info/time_within_train_step": 28.016448974609375, "step": 98}
{"train_info/time_between_train_steps": 0.011922121047973633, "step": 98}
{"info/global_step": 99, "train_info/time_within_train_step": 27.938883781433105, "step": 99}
{"train_info/time_between_train_steps": 0.005344867706298828, "step": 99}
{"info/global_step": 100, "train_info/time_within_train_step": 27.948858499526978, "step": 100}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22648.0, "train_info/memory_max_reserved": 22648.0, "_timestamp": 1733864512, "_runtime": 2824}, "step": 100}
{"logs": {"train/loss": 7.2157, "train/learning_rate": 0.0005, "train/epoch": 4.0, "_timestamp": 1733864512, "_runtime": 2824}, "step": 100}
{"train_info/time_between_train_steps": 2.5753893852233887, "step": 100}
{"info/global_step": 101, "train_info/time_within_train_step": 28.01094675064087, "step": 101}
{"train_info/time_between_train_steps": 0.0052280426025390625, "step": 101}
{"info/global_step": 102, "train_info/time_within_train_step": 27.856173753738403, "step": 102}
{"train_info/time_between_train_steps": 0.005151033401489258, "step": 102}
{"info/global_step": 103, "train_info/time_within_train_step": 27.863196849822998, "step": 103}
{"train_info/time_between_train_steps": 0.005470752716064453, "step": 103}
{"info/global_step": 104, "train_info/time_within_train_step": 27.845460653305054, "step": 104}
{"train_info/time_between_train_steps": 0.00522303581237793, "step": 104}
{"info/global_step": 105, "train_info/time_within_train_step": 27.890036582946777, "step": 105}
{"train_info/time_between_train_steps": 0.0053937435150146484, "step": 105}
{"info/global_step": 106, "train_info/time_within_train_step": 27.85034418106079, "step": 106}
{"train_info/time_between_train_steps": 0.00945901870727539, "step": 106}
{"info/global_step": 107, "train_info/time_within_train_step": 27.940770864486694, "step": 107}
{"train_info/time_between_train_steps": 0.0052950382232666016, "step": 107}
{"info/global_step": 108, "train_info/time_within_train_step": 27.857229948043823, "step": 108}
{"train_info/time_between_train_steps": 0.005430936813354492, "step": 108}
{"info/global_step": 109, "train_info/time_within_train_step": 27.867021083831787, "step": 109}
{"train_info/time_between_train_steps": 0.010390043258666992, "step": 109}
{"info/global_step": 110, "train_info/time_within_train_step": 27.927757501602173, "step": 110}
{"train_info/time_between_train_steps": 0.005270719528198242, "step": 110}
{"info/global_step": 111, "train_info/time_within_train_step": 27.872534036636353, "step": 111}
{"train_info/time_between_train_steps": 0.011554956436157227, "step": 111}
{"info/global_step": 112, "train_info/time_within_train_step": 27.89185643196106, "step": 112}
{"train_info/time_between_train_steps": 0.005768299102783203, "step": 112}
{"info/global_step": 113, "train_info/time_within_train_step": 27.87519097328186, "step": 113}
{"train_info/time_between_train_steps": 0.005689859390258789, "step": 113}
{"info/global_step": 114, "train_info/time_within_train_step": 27.877984046936035, "step": 114}
{"train_info/time_between_train_steps": 0.005509376525878906, "step": 114}
{"info/global_step": 115, "train_info/time_within_train_step": 27.90910792350769, "step": 115}
{"train_info/time_between_train_steps": 0.005732297897338867, "step": 115}
{"info/global_step": 116, "train_info/time_within_train_step": 27.897411346435547, "step": 116}
{"train_info/time_between_train_steps": 0.0055124759674072266, "step": 116}
{"info/global_step": 117, "train_info/time_within_train_step": 27.810490608215332, "step": 117}
{"train_info/time_between_train_steps": 0.005469083786010742, "step": 117}
{"info/global_step": 118, "train_info/time_within_train_step": 27.966025590896606, "step": 118}
{"train_info/time_between_train_steps": 0.005712032318115234, "step": 118}
{"info/global_step": 119, "train_info/time_within_train_step": 27.87128472328186, "step": 119}
{"train_info/time_between_train_steps": 0.006020545959472656, "step": 119}
{"info/global_step": 120, "train_info/time_within_train_step": 27.965394735336304, "step": 120}
{"train_info/time_between_train_steps": 0.015111923217773438, "step": 120}
{"train_info/time_between_train_steps": 5.249781131744385, "step": 120}
{"info/global_step": 121, "train_info/time_within_train_step": 27.81099033355713, "step": 121}
{"train_info/time_between_train_steps": 0.005724668502807617, "step": 121}
{"info/global_step": 122, "train_info/time_within_train_step": 28.07422637939453, "step": 122}
{"train_info/time_between_train_steps": 0.005447864532470703, "step": 122}
{"info/global_step": 123, "train_info/time_within_train_step": 27.86060333251953, "step": 123}
{"train_info/time_between_train_steps": 0.009648561477661133, "step": 123}
{"info/global_step": 124, "train_info/time_within_train_step": 27.96206283569336, "step": 124}
{"train_info/time_between_train_steps": 0.005552053451538086, "step": 124}
{"info/global_step": 125, "train_info/time_within_train_step": 28.005625009536743, "step": 125}
{"train_info/time_between_train_steps": 0.005424976348876953, "step": 125}
{"info/global_step": 126, "train_info/time_within_train_step": 27.919677257537842, "step": 126}
{"train_info/time_between_train_steps": 0.005380153656005859, "step": 126}
{"info/global_step": 127, "train_info/time_within_train_step": 27.847646951675415, "step": 127}
{"train_info/time_between_train_steps": 0.009386539459228516, "step": 127}
{"info/global_step": 128, "train_info/time_within_train_step": 27.91883373260498, "step": 128}
{"train_info/time_between_train_steps": 0.005613803863525391, "step": 128}
{"info/global_step": 129, "train_info/time_within_train_step": 27.84879422187805, "step": 129}
{"train_info/time_between_train_steps": 0.005271196365356445, "step": 129}
{"info/global_step": 130, "train_info/time_within_train_step": 27.823144674301147, "step": 130}
{"train_info/time_between_train_steps": 0.013925552368164062, "step": 130}
{"info/global_step": 131, "train_info/time_within_train_step": 27.924867391586304, "step": 131}
{"train_info/time_between_train_steps": 0.005182027816772461, "step": 131}
{"info/global_step": 132, "train_info/time_within_train_step": 27.839778184890747, "step": 132}
{"train_info/time_between_train_steps": 0.005640983581542969, "step": 132}
{"info/global_step": 133, "train_info/time_within_train_step": 27.886006832122803, "step": 133}
{"train_info/time_between_train_steps": 0.0054013729095458984, "step": 133}
{"info/global_step": 134, "train_info/time_within_train_step": 27.874873638153076, "step": 134}
{"train_info/time_between_train_steps": 0.009658098220825195, "step": 134}
{"info/global_step": 135, "train_info/time_within_train_step": 27.84233021736145, "step": 135}
{"train_info/time_between_train_steps": 0.005398988723754883, "step": 135}
{"info/global_step": 136, "train_info/time_within_train_step": 27.884586811065674, "step": 136}
{"train_info/time_between_train_steps": 0.009964466094970703, "step": 136}
{"info/global_step": 137, "train_info/time_within_train_step": 27.895139694213867, "step": 137}
{"train_info/time_between_train_steps": 0.005768537521362305, "step": 137}
{"info/global_step": 138, "train_info/time_within_train_step": 27.9070463180542, "step": 138}
{"train_info/time_between_train_steps": 0.010411977767944336, "step": 138}
{"info/global_step": 139, "train_info/time_within_train_step": 27.9529767036438, "step": 139}
{"train_info/time_between_train_steps": 0.005345344543457031, "step": 139}
{"info/global_step": 140, "train_info/time_within_train_step": 27.88967490196228, "step": 140}
{"train_info/time_between_train_steps": 0.008183002471923828, "step": 140}
{"info/global_step": 141, "train_info/time_within_train_step": 27.960476398468018, "step": 141}
{"train_info/time_between_train_steps": 0.00974893569946289, "step": 141}
{"info/global_step": 142, "train_info/time_within_train_step": 27.884103059768677, "step": 142}
{"train_info/time_between_train_steps": 0.005866527557373047, "step": 142}
{"info/global_step": 143, "train_info/time_within_train_step": 27.896954774856567, "step": 143}
{"train_info/time_between_train_steps": 0.00549769401550293, "step": 143}
{"info/global_step": 144, "train_info/time_within_train_step": 27.89739680290222, "step": 144}
{"train_info/time_between_train_steps": 0.006129264831542969, "step": 144}
{"train_info/time_between_train_steps": 5.425424098968506, "step": 144}
{"info/global_step": 145, "train_info/time_within_train_step": 27.834883213043213, "step": 145}
{"train_info/time_between_train_steps": 0.0051310062408447266, "step": 145}
{"info/global_step": 146, "train_info/time_within_train_step": 28.02673649787903, "step": 146}
{"train_info/time_between_train_steps": 0.005354881286621094, "step": 146}
{"info/global_step": 147, "train_info/time_within_train_step": 27.918845176696777, "step": 147}
{"train_info/time_between_train_steps": 0.00532984733581543, "step": 147}
{"info/global_step": 148, "train_info/time_within_train_step": 27.948442459106445, "step": 148}
{"train_info/time_between_train_steps": 0.005659580230712891, "step": 148}
{"info/global_step": 149, "train_info/time_within_train_step": 27.846700191497803, "step": 149}
{"train_info/time_between_train_steps": 0.006077289581298828, "step": 149}
{"info/global_step": 150, "train_info/time_within_train_step": 27.854774236679077, "step": 150}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22648.0, "train_info/memory_max_reserved": 22648.0, "_timestamp": 1733865921, "_runtime": 4233}, "step": 150}
{"logs": {"train/loss": 6.6121, "train/learning_rate": 0.0005833333333333333, "train/epoch": 6.0, "_timestamp": 1733865921, "_runtime": 4233}, "step": 150}
{"train_info/time_between_train_steps": 0.00804591178894043, "step": 150}
{"info/global_step": 151, "train_info/time_within_train_step": 27.857871532440186, "step": 151}
{"train_info/time_between_train_steps": 0.008490324020385742, "step": 151}
{"info/global_step": 152, "train_info/time_within_train_step": 27.974483489990234, "step": 152}
{"train_info/time_between_train_steps": 0.005115509033203125, "step": 152}
{"info/global_step": 153, "train_info/time_within_train_step": 27.92187786102295, "step": 153}
{"train_info/time_between_train_steps": 0.009986162185668945, "step": 153}
{"info/global_step": 154, "train_info/time_within_train_step": 27.911165714263916, "step": 154}
{"train_info/time_between_train_steps": 0.005217075347900391, "step": 154}
{"info/global_step": 155, "train_info/time_within_train_step": 27.820499658584595, "step": 155}
{"train_info/time_between_train_steps": 0.005408048629760742, "step": 155}
{"info/global_step": 156, "train_info/time_within_train_step": 27.980628490447998, "step": 156}
{"train_info/time_between_train_steps": 0.006457090377807617, "step": 156}
{"info/global_step": 157, "train_info/time_within_train_step": 27.837635278701782, "step": 157}
{"train_info/time_between_train_steps": 0.005362749099731445, "step": 157}
{"info/global_step": 158, "train_info/time_within_train_step": 27.898962259292603, "step": 158}
{"train_info/time_between_train_steps": 0.005330801010131836, "step": 158}
{"info/global_step": 159, "train_info/time_within_train_step": 27.890092372894287, "step": 159}
{"train_info/time_between_train_steps": 0.005282163619995117, "step": 159}
{"info/global_step": 160, "train_info/time_within_train_step": 27.824662685394287, "step": 160}
{"train_info/time_between_train_steps": 0.005444049835205078, "step": 160}
{"info/global_step": 161, "train_info/time_within_train_step": 27.962764263153076, "step": 161}
{"train_info/time_between_train_steps": 0.005165576934814453, "step": 161}
{"info/global_step": 162, "train_info/time_within_train_step": 27.83262276649475, "step": 162}
{"train_info/time_between_train_steps": 0.0052471160888671875, "step": 162}
{"info/global_step": 163, "train_info/time_within_train_step": 27.883310079574585, "step": 163}
{"train_info/time_between_train_steps": 0.005480527877807617, "step": 163}
{"info/global_step": 164, "train_info/time_within_train_step": 27.879080057144165, "step": 164}
{"train_info/time_between_train_steps": 0.0071392059326171875, "step": 164}
{"info/global_step": 165, "train_info/time_within_train_step": 27.953266143798828, "step": 165}
{"train_info/time_between_train_steps": 0.005618095397949219, "step": 165}
{"info/global_step": 166, "train_info/time_within_train_step": 27.933587312698364, "step": 166}
{"train_info/time_between_train_steps": 0.0060193538665771484, "step": 166}
{"info/global_step": 167, "train_info/time_within_train_step": 27.992498874664307, "step": 167}
{"train_info/time_between_train_steps": 0.005940914154052734, "step": 167}
{"info/global_step": 168, "train_info/time_within_train_step": 27.864049434661865, "step": 168}
{"train_info/time_between_train_steps": 0.011033773422241211, "step": 168}
{"train_info/time_between_train_steps": 5.190542936325073, "step": 168}
{"info/global_step": 169, "train_info/time_within_train_step": 27.862074613571167, "step": 169}
{"train_info/time_between_train_steps": 0.00539398193359375, "step": 169}
{"info/global_step": 170, "train_info/time_within_train_step": 27.974599361419678, "step": 170}
{"train_info/time_between_train_steps": 0.005474567413330078, "step": 170}
{"info/global_step": 171, "train_info/time_within_train_step": 27.99712634086609, "step": 171}
{"train_info/time_between_train_steps": 0.005408525466918945, "step": 171}
{"info/global_step": 172, "train_info/time_within_train_step": 28.066603183746338, "step": 172}
{"train_info/time_between_train_steps": 0.0054361820220947266, "step": 172}
{"info/global_step": 173, "train_info/time_within_train_step": 27.93461775779724, "step": 173}
{"train_info/time_between_train_steps": 0.0051136016845703125, "step": 173}
{"info/global_step": 174, "train_info/time_within_train_step": 27.89629817008972, "step": 174}
{"train_info/time_between_train_steps": 0.005347490310668945, "step": 174}
{"info/global_step": 175, "train_info/time_within_train_step": 27.856720447540283, "step": 175}
{"train_info/time_between_train_steps": 0.010079145431518555, "step": 175}
{"info/global_step": 176, "train_info/time_within_train_step": 27.869271516799927, "step": 176}
{"train_info/time_between_train_steps": 0.00527501106262207, "step": 176}
{"info/global_step": 177, "train_info/time_within_train_step": 27.85781955718994, "step": 177}
{"train_info/time_between_train_steps": 0.010607481002807617, "step": 177}
{"info/global_step": 178, "train_info/time_within_train_step": 27.906853675842285, "step": 178}
{"train_info/time_between_train_steps": 0.00543975830078125, "step": 178}
{"info/global_step": 179, "train_info/time_within_train_step": 27.887194395065308, "step": 179}
{"train_info/time_between_train_steps": 0.005355119705200195, "step": 179}
{"info/global_step": 180, "train_info/time_within_train_step": 27.888171195983887, "step": 180}
{"train_info/time_between_train_steps": 0.0054438114166259766, "step": 180}
{"info/global_step": 181, "train_info/time_within_train_step": 27.87649631500244, "step": 181}
{"train_info/time_between_train_steps": 0.005704641342163086, "step": 181}
{"info/global_step": 182, "train_info/time_within_train_step": 27.92414164543152, "step": 182}
{"train_info/time_between_train_steps": 0.006415843963623047, "step": 182}
{"info/global_step": 183, "train_info/time_within_train_step": 27.848407983779907, "step": 183}
{"train_info/time_between_train_steps": 0.005649566650390625, "step": 183}
{"info/global_step": 184, "train_info/time_within_train_step": 27.884580373764038, "step": 184}
{"train_info/time_between_train_steps": 0.01051950454711914, "step": 184}
{"info/global_step": 185, "train_info/time_within_train_step": 27.90295720100403, "step": 185}
{"train_info/time_between_train_steps": 0.005264759063720703, "step": 185}
{"info/global_step": 186, "train_info/time_within_train_step": 27.85777759552002, "step": 186}
{"train_info/time_between_train_steps": 0.005407094955444336, "step": 186}
{"info/global_step": 187, "train_info/time_within_train_step": 27.923032522201538, "step": 187}
{"train_info/time_between_train_steps": 0.006235599517822266, "step": 187}
{"info/global_step": 188, "train_info/time_within_train_step": 27.938955068588257, "step": 188}
{"train_info/time_between_train_steps": 0.01044011116027832, "step": 188}
{"info/global_step": 189, "train_info/time_within_train_step": 27.91809344291687, "step": 189}
{"train_info/time_between_train_steps": 0.011632204055786133, "step": 189}
{"info/global_step": 190, "train_info/time_within_train_step": 27.87188482284546, "step": 190}
{"train_info/time_between_train_steps": 0.006090402603149414, "step": 190}
{"info/global_step": 191, "train_info/time_within_train_step": 28.00863265991211, "step": 191}
{"train_info/time_between_train_steps": 0.005842447280883789, "step": 191}
{"info/global_step": 192, "train_info/time_within_train_step": 27.863271713256836, "step": 192}
{"train_info/time_between_train_steps": 0.0059506893157958984, "step": 192}
{"train_info/time_between_train_steps": 5.24846625328064, "step": 192}
{"info/global_step": 193, "train_info/time_within_train_step": 27.896165370941162, "step": 193}
{"train_info/time_between_train_steps": 0.005080223083496094, "step": 193}
{"info/global_step": 194, "train_info/time_within_train_step": 27.951216459274292, "step": 194}
{"train_info/time_between_train_steps": 0.009551525115966797, "step": 194}
{"info/global_step": 195, "train_info/time_within_train_step": 27.889395236968994, "step": 195}
{"train_info/time_between_train_steps": 0.009166479110717773, "step": 195}
{"info/global_step": 196, "train_info/time_within_train_step": 27.9456467628479, "step": 196}
{"train_info/time_between_train_steps": 0.005602598190307617, "step": 196}
{"info/global_step": 197, "train_info/time_within_train_step": 27.889535427093506, "step": 197}
{"train_info/time_between_train_steps": 0.005179882049560547, "step": 197}
{"info/global_step": 198, "train_info/time_within_train_step": 27.810219764709473, "step": 198}
{"train_info/time_between_train_steps": 0.0057489871978759766, "step": 198}
{"info/global_step": 199, "train_info/time_within_train_step": 27.873029947280884, "step": 199}
{"train_info/time_between_train_steps": 0.006817817687988281, "step": 199}
{"info/global_step": 200, "train_info/time_within_train_step": 27.90688467025757, "step": 200}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22648.0, "train_info/memory_max_reserved": 22648.0, "_timestamp": 1733867327, "_runtime": 5639}, "step": 200}
{"logs": {"train/loss": 6.0811, "train/learning_rate": 0.0005555555555555556, "train/epoch": 8.01, "_timestamp": 1733867327, "_runtime": 5639}, "step": 200}
{"train_info/time_between_train_steps": 2.4157602787017822, "step": 200}
{"info/global_step": 201, "train_info/time_within_train_step": 27.913870573043823, "step": 201}
{"train_info/time_between_train_steps": 0.008521795272827148, "step": 201}
{"info/global_step": 202, "train_info/time_within_train_step": 27.8715603351593, "step": 202}
{"train_info/time_between_train_steps": 0.005393028259277344, "step": 202}
{"info/global_step": 203, "train_info/time_within_train_step": 28.006418228149414, "step": 203}
{"train_info/time_between_train_steps": 0.006293535232543945, "step": 203}
{"info/global_step": 204, "train_info/time_within_train_step": 27.85329794883728, "step": 204}
{"train_info/time_between_train_steps": 0.005535125732421875, "step": 204}
{"info/global_step": 205, "train_info/time_within_train_step": 27.944677352905273, "step": 205}
{"train_info/time_between_train_steps": 0.005331754684448242, "step": 205}
{"info/global_step": 206, "train_info/time_within_train_step": 27.834398984909058, "step": 206}
{"train_info/time_between_train_steps": 0.005268096923828125, "step": 206}
{"info/global_step": 207, "train_info/time_within_train_step": 27.901167154312134, "step": 207}
{"train_info/time_between_train_steps": 0.0054318904876708984, "step": 207}
{"info/global_step": 208, "train_info/time_within_train_step": 27.914040088653564, "step": 208}
{"train_info/time_between_train_steps": 0.005574941635131836, "step": 208}
{"info/global_step": 209, "train_info/time_within_train_step": 27.889857292175293, "step": 209}
{"train_info/time_between_train_steps": 0.005930423736572266, "step": 209}
{"info/global_step": 210, "train_info/time_within_train_step": 27.902791023254395, "step": 210}
{"train_info/time_between_train_steps": 0.005293369293212891, "step": 210}
{"info/global_step": 211, "train_info/time_within_train_step": 27.893150568008423, "step": 211}
{"train_info/time_between_train_steps": 0.00590062141418457, "step": 211}
{"info/global_step": 212, "train_info/time_within_train_step": 27.991011142730713, "step": 212}
{"train_info/time_between_train_steps": 0.005436420440673828, "step": 212}
{"info/global_step": 213, "train_info/time_within_train_step": 27.91648769378662, "step": 213}
{"train_info/time_between_train_steps": 0.0063343048095703125, "step": 213}
{"info/global_step": 214, "train_info/time_within_train_step": 27.953208208084106, "step": 214}
{"train_info/time_between_train_steps": 0.005563259124755859, "step": 214}
{"info/global_step": 215, "train_info/time_within_train_step": 27.94828987121582, "step": 215}
{"train_info/time_between_train_steps": 0.005845069885253906, "step": 215}
{"info/global_step": 216, "train_info/time_within_train_step": 27.971690893173218, "step": 216}
{"train_info/time_between_train_steps": 0.011038780212402344, "step": 216}
{"train_info/time_between_train_steps": 5.599370718002319, "step": 216}
{"info/global_step": 217, "train_info/time_within_train_step": 27.882237911224365, "step": 217}
{"train_info/time_between_train_steps": 0.0056307315826416016, "step": 217}
{"info/global_step": 218, "train_info/time_within_train_step": 28.080852031707764, "step": 218}
{"train_info/time_between_train_steps": 0.005543231964111328, "step": 218}
{"info/global_step": 219, "train_info/time_within_train_step": 28.04484510421753, "step": 219}
{"train_info/time_between_train_steps": 0.0054781436920166016, "step": 219}
{"info/global_step": 220, "train_info/time_within_train_step": 27.982690811157227, "step": 220}
{"train_info/time_between_train_steps": 0.0056610107421875, "step": 220}
{"info/global_step": 221, "train_info/time_within_train_step": 28.064523458480835, "step": 221}
{"train_info/time_between_train_steps": 0.010109663009643555, "step": 221}
{"info/global_step": 222, "train_info/time_within_train_step": 27.929218769073486, "step": 222}
{"train_info/time_between_train_steps": 0.005980253219604492, "step": 222}
{"info/global_step": 223, "train_info/time_within_train_step": 27.86570954322815, "step": 223}
{"train_info/time_between_train_steps": 0.0056438446044921875, "step": 223}
{"info/global_step": 224, "train_info/time_within_train_step": 27.89176082611084, "step": 224}
{"train_info/time_between_train_steps": 0.005543708801269531, "step": 224}
{"info/global_step": 225, "train_info/time_within_train_step": 27.87575364112854, "step": 225}
{"train_info/time_between_train_steps": 0.006125926971435547, "step": 225}
{"info/global_step": 226, "train_info/time_within_train_step": 27.8488667011261, "step": 226}
{"train_info/time_between_train_steps": 0.010565042495727539, "step": 226}
{"info/global_step": 227, "train_info/time_within_train_step": 27.90395975112915, "step": 227}
{"train_info/time_between_train_steps": 0.0054781436920166016, "step": 227}
{"info/global_step": 228, "train_info/time_within_train_step": 27.926060676574707, "step": 228}
{"train_info/time_between_train_steps": 0.010333061218261719, "step": 228}
{"info/global_step": 229, "train_info/time_within_train_step": 27.90238070487976, "step": 229}
{"train_info/time_between_train_steps": 0.00576019287109375, "step": 229}
{"info/global_step": 230, "train_info/time_within_train_step": 27.89388680458069, "step": 230}
{"train_info/time_between_train_steps": 0.010326862335205078, "step": 230}
{"info/global_step": 231, "train_info/time_within_train_step": 27.941290855407715, "step": 231}
{"train_info/time_between_train_steps": 0.00861978530883789, "step": 231}
{"info/global_step": 232, "train_info/time_within_train_step": 27.88461947441101, "step": 232}
{"train_info/time_between_train_steps": 0.005505561828613281, "step": 232}
{"info/global_step": 233, "train_info/time_within_train_step": 27.934995651245117, "step": 233}
{"train_info/time_between_train_steps": 0.005434751510620117, "step": 233}
{"info/global_step": 234, "train_info/time_within_train_step": 27.97720956802368, "step": 234}
{"train_info/time_between_train_steps": 0.010189294815063477, "step": 234}
{"info/global_step": 235, "train_info/time_within_train_step": 27.927281141281128, "step": 235}
{"train_info/time_between_train_steps": 0.005486249923706055, "step": 235}
{"info/global_step": 236, "train_info/time_within_train_step": 27.921709537506104, "step": 236}
{"train_info/time_between_train_steps": 0.010803699493408203, "step": 236}
{"info/global_step": 237, "train_info/time_within_train_step": 27.98872399330139, "step": 237}
{"train_info/time_between_train_steps": 0.00561976432800293, "step": 237}
{"info/global_step": 238, "train_info/time_within_train_step": 27.91378140449524, "step": 238}
{"train_info/time_between_train_steps": 0.005858182907104492, "step": 238}
{"info/global_step": 239, "train_info/time_within_train_step": 27.92412781715393, "step": 239}
{"train_info/time_between_train_steps": 0.0060274600982666016, "step": 239}
{"info/global_step": 240, "train_info/time_within_train_step": 27.998769283294678, "step": 240}
{"train_info/time_between_train_steps": 0.0061016082763671875, "step": 240}
{"train_info/time_between_train_steps": 5.345746040344238, "step": 240}
{"info/global_step": 241, "train_info/time_within_train_step": 27.91753911972046, "step": 241}
{"train_info/time_between_train_steps": 0.010732173919677734, "step": 241}
{"info/global_step": 242, "train_info/time_within_train_step": 28.116531372070312, "step": 242}
{"train_info/time_between_train_steps": 0.00556635856628418, "step": 242}
{"info/global_step": 243, "train_info/time_within_train_step": 27.874912977218628, "step": 243}
{"train_info/time_between_train_steps": 0.005785226821899414, "step": 243}
{"info/global_step": 244, "train_info/time_within_train_step": 28.001402139663696, "step": 244}
{"train_info/time_between_train_steps": 0.005778074264526367, "step": 244}
{"info/global_step": 245, "train_info/time_within_train_step": 27.85223364830017, "step": 245}
{"train_info/time_between_train_steps": 0.0052225589752197266, "step": 245}
{"info/global_step": 246, "train_info/time_within_train_step": 27.893455028533936, "step": 246}
{"train_info/time_between_train_steps": 0.005319356918334961, "step": 246}
{"info/global_step": 247, "train_info/time_within_train_step": 27.843024015426636, "step": 247}
{"train_info/time_between_train_steps": 0.010188102722167969, "step": 247}
{"info/global_step": 248, "train_info/time_within_train_step": 27.96091866493225, "step": 248}
{"train_info/time_between_train_steps": 0.005468606948852539, "step": 248}
{"info/global_step": 249, "train_info/time_within_train_step": 27.842076539993286, "step": 249}
{"train_info/time_between_train_steps": 0.005692481994628906, "step": 249}
{"info/global_step": 250, "train_info/time_within_train_step": 28.08454203605652, "step": 250}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22648.0, "train_info/memory_max_reserved": 22648.0, "_timestamp": 1733868737, "_runtime": 7049}, "step": 250}
{"logs": {"train/loss": 5.6744, "train/learning_rate": 0.0005277777777777777, "train/epoch": 10.01, "_timestamp": 1733868737, "_runtime": 7049}, "step": 250}
{"train_info/time_between_train_steps": 0.01365041732788086, "step": 250}
{"info/global_step": 251, "train_info/time_within_train_step": 27.859680891036987, "step": 251}
{"train_info/time_between_train_steps": 0.010239839553833008, "step": 251}
{"info/global_step": 252, "train_info/time_within_train_step": 27.83976650238037, "step": 252}
{"train_info/time_between_train_steps": 0.009843587875366211, "step": 252}
{"info/global_step": 253, "train_info/time_within_train_step": 27.933988332748413, "step": 253}
{"train_info/time_between_train_steps": 0.005249977111816406, "step": 253}
{"info/global_step": 254, "train_info/time_within_train_step": 27.869959592819214, "step": 254}
{"train_info/time_between_train_steps": 0.005375385284423828, "step": 254}
{"info/global_step": 255, "train_info/time_within_train_step": 27.89018225669861, "step": 255}
{"train_info/time_between_train_steps": 0.005431413650512695, "step": 255}
{"info/global_step": 256, "train_info/time_within_train_step": 27.85981273651123, "step": 256}
{"train_info/time_between_train_steps": 0.005416393280029297, "step": 256}
{"info/global_step": 257, "train_info/time_within_train_step": 27.983348846435547, "step": 257}
{"train_info/time_between_train_steps": 0.005534172058105469, "step": 257}
{"info/global_step": 258, "train_info/time_within_train_step": 27.955776691436768, "step": 258}
{"train_info/time_between_train_steps": 0.009979248046875, "step": 258}
{"info/global_step": 259, "train_info/time_within_train_step": 27.934094190597534, "step": 259}
{"train_info/time_between_train_steps": 0.005521535873413086, "step": 259}
{"info/global_step": 260, "train_info/time_within_train_step": 27.861037731170654, "step": 260}
{"train_info/time_between_train_steps": 0.005658864974975586, "step": 260}
{"info/global_step": 261, "train_info/time_within_train_step": 27.95903754234314, "step": 261}
{"train_info/time_between_train_steps": 0.00575709342956543, "step": 261}
{"info/global_step": 262, "train_info/time_within_train_step": 27.888697147369385, "step": 262}
{"train_info/time_between_train_steps": 0.010955572128295898, "step": 262}
{"info/global_step": 263, "train_info/time_within_train_step": 27.937700033187866, "step": 263}
{"train_info/time_between_train_steps": 0.00578761100769043, "step": 263}
{"info/global_step": 264, "train_info/time_within_train_step": 27.888998985290527, "step": 264}
{"train_info/time_between_train_steps": 0.006703853607177734, "step": 264}
{"train_info/time_between_train_steps": 5.412487506866455, "step": 264}
{"info/global_step": 265, "train_info/time_within_train_step": 33.5150728225708, "step": 265}
{"train_info/time_between_train_steps": 0.005140781402587891, "step": 265}
{"info/global_step": 266, "train_info/time_within_train_step": 54.9160692691803, "step": 266}
{"train_info/time_between_train_steps": 0.005522012710571289, "step": 266}
{"info/global_step": 267, "train_info/time_within_train_step": 54.870261669158936, "step": 267}
{"train_info/time_between_train_steps": 0.00984954833984375, "step": 267}
{"info/global_step": 268, "train_info/time_within_train_step": 54.62228012084961, "step": 268}
{"train_info/time_between_train_steps": 0.005709648132324219, "step": 268}
{"info/global_step": 269, "train_info/time_within_train_step": 54.72721862792969, "step": 269}
{"train_info/time_between_train_steps": 0.012401103973388672, "step": 269}
{"info/global_step": 270, "train_info/time_within_train_step": 54.54993009567261, "step": 270}
{"train_info/time_between_train_steps": 0.0053937435150146484, "step": 270}
{"info/global_step": 271, "train_info/time_within_train_step": 54.4993531703949, "step": 271}
{"train_info/time_between_train_steps": 0.010281085968017578, "step": 271}
{"info/global_step": 272, "train_info/time_within_train_step": 54.74463629722595, "step": 272}
{"train_info/time_between_train_steps": 0.00545048713684082, "step": 272}
{"info/global_step": 273, "train_info/time_within_train_step": 54.677117109298706, "step": 273}
{"train_info/time_between_train_steps": 0.007695198059082031, "step": 273}
{"info/global_step": 274, "train_info/time_within_train_step": 54.71284222602844, "step": 274}
{"train_info/time_between_train_steps": 0.015003204345703125, "step": 274}
{"info/global_step": 275, "train_info/time_within_train_step": 54.5838348865509, "step": 275}
{"train_info/time_between_train_steps": 0.006484031677246094, "step": 275}
{"info/global_step": 276, "train_info/time_within_train_step": 54.64979910850525, "step": 276}
{"train_info/time_between_train_steps": 0.006408214569091797, "step": 276}
{"info/global_step": 277, "train_info/time_within_train_step": 47.28894925117493, "step": 277}
{"train_info/time_between_train_steps": 0.005303621292114258, "step": 277}
{"info/global_step": 278, "train_info/time_within_train_step": 27.888726472854614, "step": 278}
{"train_info/time_between_train_steps": 0.005271196365356445, "step": 278}
{"info/global_step": 279, "train_info/time_within_train_step": 27.842493772506714, "step": 279}
{"train_info/time_between_train_steps": 0.007112026214599609, "step": 279}
{"info/global_step": 280, "train_info/time_within_train_step": 27.91629123687744, "step": 280}
{"train_info/time_between_train_steps": 0.005514621734619141, "step": 280}
{"info/global_step": 281, "train_info/time_within_train_step": 27.94734501838684, "step": 281}
{"train_info/time_between_train_steps": 0.005294322967529297, "step": 281}
{"info/global_step": 282, "train_info/time_within_train_step": 27.8762469291687, "step": 282}
{"train_info/time_between_train_steps": 0.0058727264404296875, "step": 282}
{"info/global_step": 283, "train_info/time_within_train_step": 27.92640209197998, "step": 283}
{"train_info/time_between_train_steps": 0.005160808563232422, "step": 283}
{"info/global_step": 284, "train_info/time_within_train_step": 27.910324096679688, "step": 284}
{"train_info/time_between_train_steps": 0.006075859069824219, "step": 284}
{"info/global_step": 285, "train_info/time_within_train_step": 27.867588996887207, "step": 285}
{"train_info/time_between_train_steps": 0.01023721694946289, "step": 285}
{"info/global_step": 286, "train_info/time_within_train_step": 27.858565092086792, "step": 286}
{"train_info/time_between_train_steps": 0.010214090347290039, "step": 286}
{"info/global_step": 287, "train_info/time_within_train_step": 32.92755913734436, "step": 287}
{"train_info/time_between_train_steps": 0.005651950836181641, "step": 287}
{"info/global_step": 288, "train_info/time_within_train_step": 54.19832730293274, "step": 288}
{"train_info/time_between_train_steps": 0.010259389877319336, "step": 288}
{"train_info/time_between_train_steps": 7.2443788051605225, "step": 288}
{"info/global_step": 289, "train_info/time_within_train_step": 54.14817786216736, "step": 289}
{"train_info/time_between_train_steps": 0.005767107009887695, "step": 289}
{"info/global_step": 290, "train_info/time_within_train_step": 54.397077560424805, "step": 290}
{"train_info/time_between_train_steps": 0.0055849552154541016, "step": 290}
{"info/global_step": 291, "train_info/time_within_train_step": 54.23816776275635, "step": 291}
{"train_info/time_between_train_steps": 0.005911350250244141, "step": 291}
{"info/global_step": 292, "train_info/time_within_train_step": 54.19840908050537, "step": 292}
{"train_info/time_between_train_steps": 0.010102272033691406, "step": 292}
{"info/global_step": 293, "train_info/time_within_train_step": 54.2811074256897, "step": 293}
{"train_info/time_between_train_steps": 0.005193233489990234, "step": 293}
{"info/global_step": 294, "train_info/time_within_train_step": 54.43468976020813, "step": 294}
{"train_info/time_between_train_steps": 0.010524272918701172, "step": 294}
{"info/global_step": 295, "train_info/time_within_train_step": 54.253355503082275, "step": 295}
{"train_info/time_between_train_steps": 0.01051020622253418, "step": 295}
{"info/global_step": 296, "train_info/time_within_train_step": 55.04879403114319, "step": 296}
{"train_info/time_between_train_steps": 0.00558018684387207, "step": 296}
{"info/global_step": 297, "train_info/time_within_train_step": 54.34609532356262, "step": 297}
{"train_info/time_between_train_steps": 0.005360603332519531, "step": 297}
{"info/global_step": 298, "train_info/time_within_train_step": 54.577178716659546, "step": 298}
{"train_info/time_between_train_steps": 0.010412216186523438, "step": 298}
{"info/global_step": 299, "train_info/time_within_train_step": 45.98192262649536, "step": 299}
{"train_info/time_between_train_steps": 0.005329608917236328, "step": 299}
{"info/global_step": 300, "train_info/time_within_train_step": 27.815983295440674, "step": 300}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22648.0, "train_info/memory_max_reserved": 22648.0, "_timestamp": 1733870779, "_runtime": 9091}, "step": 300}
{"logs": {"train/loss": 5.4147, "train/learning_rate": 0.0005, "train/epoch": 12.01, "_timestamp": 1733870779, "_runtime": 9091}, "step": 300}
{"train_info/time_between_train_steps": 2.4862406253814697, "step": 300}
{"info/global_step": 301, "train_info/time_within_train_step": 27.95231795310974, "step": 301}
{"train_info/time_between_train_steps": 0.010192155838012695, "step": 301}
{"info/global_step": 302, "train_info/time_within_train_step": 27.912920236587524, "step": 302}
{"train_info/time_between_train_steps": 0.009202241897583008, "step": 302}
{"info/global_step": 303, "train_info/time_within_train_step": 27.942954063415527, "step": 303}
{"train_info/time_between_train_steps": 0.00543522834777832, "step": 303}
{"info/global_step": 304, "train_info/time_within_train_step": 27.916218042373657, "step": 304}
{"train_info/time_between_train_steps": 0.0053865909576416016, "step": 304}
{"info/global_step": 305, "train_info/time_within_train_step": 27.97864031791687, "step": 305}
{"train_info/time_between_train_steps": 0.005716085433959961, "step": 305}
{"info/global_step": 306, "train_info/time_within_train_step": 27.850365161895752, "step": 306}
{"train_info/time_between_train_steps": 0.0052754878997802734, "step": 306}
{"info/global_step": 307, "train_info/time_within_train_step": 27.87501049041748, "step": 307}
{"train_info/time_between_train_steps": 0.005446195602416992, "step": 307}
{"info/global_step": 308, "train_info/time_within_train_step": 27.890231132507324, "step": 308}
{"train_info/time_between_train_steps": 0.009997129440307617, "step": 308}
{"info/global_step": 309, "train_info/time_within_train_step": 27.950765371322632, "step": 309}
{"train_info/time_between_train_steps": 0.0058116912841796875, "step": 309}
{"info/global_step": 310, "train_info/time_within_train_step": 27.922719478607178, "step": 310}
{"train_info/time_between_train_steps": 0.011106729507446289, "step": 310}
{"info/global_step": 311, "train_info/time_within_train_step": 27.96547031402588, "step": 311}
{"train_info/time_between_train_steps": 0.0059015750885009766, "step": 311}
{"info/global_step": 312, "train_info/time_within_train_step": 28.105748414993286, "step": 312}
{"train_info/time_between_train_steps": 0.006141185760498047, "step": 312}
{"train_info/time_between_train_steps": 5.200135707855225, "step": 312}
{"info/global_step": 313, "train_info/time_within_train_step": 27.94357967376709, "step": 313}
{"train_info/time_between_train_steps": 0.006500959396362305, "step": 313}
{"info/global_step": 314, "train_info/time_within_train_step": 28.057218074798584, "step": 314}
{"train_info/time_between_train_steps": 0.010511398315429688, "step": 314}
{"info/global_step": 315, "train_info/time_within_train_step": 27.940613746643066, "step": 315}
{"train_info/time_between_train_steps": 0.005811929702758789, "step": 315}
{"info/global_step": 316, "train_info/time_within_train_step": 28.0390043258667, "step": 316}
{"train_info/time_between_train_steps": 0.009774208068847656, "step": 316}
{"info/global_step": 317, "train_info/time_within_train_step": 27.88076138496399, "step": 317}
{"train_info/time_between_train_steps": 0.0052258968353271484, "step": 317}
{"info/global_step": 318, "train_info/time_within_train_step": 28.030539751052856, "step": 318}
{"train_info/time_between_train_steps": 0.014481306076049805, "step": 318}
{"info/global_step": 319, "train_info/time_within_train_step": 27.872583627700806, "step": 319}
{"train_info/time_between_train_steps": 0.005280971527099609, "step": 319}
{"info/global_step": 320, "train_info/time_within_train_step": 27.928632259368896, "step": 320}
{"train_info/time_between_train_steps": 0.007923364639282227, "step": 320}
{"info/global_step": 321, "train_info/time_within_train_step": 27.86077070236206, "step": 321}
{"train_info/time_between_train_steps": 0.005402565002441406, "step": 321}
{"info/global_step": 322, "train_info/time_within_train_step": 27.893105030059814, "step": 322}
{"train_info/time_between_train_steps": 0.00884556770324707, "step": 322}
{"info/global_step": 323, "train_info/time_within_train_step": 27.911871194839478, "step": 323}
{"train_info/time_between_train_steps": 0.013902902603149414, "step": 323}
{"info/global_step": 324, "train_info/time_within_train_step": 28.014004230499268, "step": 324}
{"train_info/time_between_train_steps": 0.014440536499023438, "step": 324}
{"info/global_step": 325, "train_info/time_within_train_step": 27.917236328125, "step": 325}
{"train_info/time_between_train_steps": 0.013857603073120117, "step": 325}
{"info/global_step": 326, "train_info/time_within_train_step": 27.988632917404175, "step": 326}
{"train_info/time_between_train_steps": 0.005274772644042969, "step": 326}
{"info/global_step": 327, "train_info/time_within_train_step": 27.926281213760376, "step": 327}
{"train_info/time_between_train_steps": 0.0054438114166259766, "step": 327}
{"info/global_step": 328, "train_info/time_within_train_step": 28.04514455795288, "step": 328}
{"train_info/time_between_train_steps": 0.009557247161865234, "step": 328}
{"info/global_step": 329, "train_info/time_within_train_step": 27.916889190673828, "step": 329}
{"train_info/time_between_train_steps": 0.005468606948852539, "step": 329}
{"info/global_step": 330, "train_info/time_within_train_step": 27.922077894210815, "step": 330}
{"train_info/time_between_train_steps": 0.005370616912841797, "step": 330}
{"info/global_step": 331, "train_info/time_within_train_step": 27.923028230667114, "step": 331}
{"train_info/time_between_train_steps": 0.010865926742553711, "step": 331}
{"info/global_step": 332, "train_info/time_within_train_step": 27.8688805103302, "step": 332}
{"train_info/time_between_train_steps": 0.0054285526275634766, "step": 332}
{"info/global_step": 333, "train_info/time_within_train_step": 27.93871521949768, "step": 333}
{"train_info/time_between_train_steps": 0.005581378936767578, "step": 333}
{"info/global_step": 334, "train_info/time_within_train_step": 27.96034002304077, "step": 334}
{"train_info/time_between_train_steps": 0.005595684051513672, "step": 334}
{"info/global_step": 335, "train_info/time_within_train_step": 27.929439783096313, "step": 335}
{"train_info/time_between_train_steps": 0.010567903518676758, "step": 335}
{"info/global_step": 336, "train_info/time_within_train_step": 27.92082953453064, "step": 336}
{"train_info/time_between_train_steps": 0.005933046340942383, "step": 336}
{"train_info/time_between_train_steps": 5.33640193939209, "step": 336}
{"info/global_step": 337, "train_info/time_within_train_step": 27.91355299949646, "step": 337}
{"train_info/time_between_train_steps": 0.0051305294036865234, "step": 337}
{"info/global_step": 338, "train_info/time_within_train_step": 28.06067657470703, "step": 338}
{"train_info/time_between_train_steps": 0.005434274673461914, "step": 338}
{"info/global_step": 339, "train_info/time_within_train_step": 27.965662717819214, "step": 339}
{"train_info/time_between_train_steps": 0.010189056396484375, "step": 339}
{"info/global_step": 340, "train_info/time_within_train_step": 27.946305751800537, "step": 340}
{"train_info/time_between_train_steps": 0.0054225921630859375, "step": 340}
{"info/global_step": 341, "train_info/time_within_train_step": 27.912734270095825, "step": 341}
{"train_info/time_between_train_steps": 0.005174875259399414, "step": 341}
{"info/global_step": 342, "train_info/time_within_train_step": 27.81847834587097, "step": 342}
{"train_info/time_between_train_steps": 0.010183334350585938, "step": 342}
{"info/global_step": 343, "train_info/time_within_train_step": 27.983673810958862, "step": 343}
{"train_info/time_between_train_steps": 0.0051190853118896484, "step": 343}
{"info/global_step": 344, "train_info/time_within_train_step": 27.842815160751343, "step": 344}
{"train_info/time_between_train_steps": 0.005388736724853516, "step": 344}
{"info/global_step": 345, "train_info/time_within_train_step": 27.87504506111145, "step": 345}
{"train_info/time_between_train_steps": 0.00942540168762207, "step": 345}
{"info/global_step": 346, "train_info/time_within_train_step": 27.853031396865845, "step": 346}
{"train_info/time_between_train_steps": 0.00800943374633789, "step": 346}
{"info/global_step": 347, "train_info/time_within_train_step": 27.878655910491943, "step": 347}
{"train_info/time_between_train_steps": 0.005389213562011719, "step": 347}
{"info/global_step": 348, "train_info/time_within_train_step": 27.876102685928345, "step": 348}
{"train_info/time_between_train_steps": 0.010813713073730469, "step": 348}
{"info/global_step": 349, "train_info/time_within_train_step": 27.9240505695343, "step": 349}
{"train_info/time_between_train_steps": 0.005380392074584961, "step": 349}
{"info/global_step": 350, "train_info/time_within_train_step": 27.859062433242798, "step": 350}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22648.0, "train_info/memory_max_reserved": 22648.0, "_timestamp": 1733872189, "_runtime": 10501}, "step": 350}
{"logs": {"train/loss": 5.246, "train/learning_rate": 0.00047222222222222224, "train/epoch": 14.01, "_timestamp": 1733872189, "_runtime": 10501}, "step": 350}
{"train_info/time_between_train_steps": 0.0072078704833984375, "step": 350}
{"info/global_step": 351, "train_info/time_within_train_step": 27.838289260864258, "step": 351}
{"train_info/time_between_train_steps": 0.006203889846801758, "step": 351}
{"info/global_step": 352, "train_info/time_within_train_step": 27.94213056564331, "step": 352}
{"train_info/time_between_train_steps": 0.00999140739440918, "step": 352}
{"info/global_step": 353, "train_info/time_within_train_step": 27.85683512687683, "step": 353}
{"train_info/time_between_train_steps": 0.005193948745727539, "step": 353}
{"info/global_step": 354, "train_info/time_within_train_step": 27.94767117500305, "step": 354}
{"train_info/time_between_train_steps": 0.00541377067565918, "step": 354}
{"info/global_step": 355, "train_info/time_within_train_step": 27.84339213371277, "step": 355}
{"train_info/time_between_train_steps": 0.005814790725708008, "step": 355}
{"info/global_step": 356, "train_info/time_within_train_step": 27.874053716659546, "step": 356}
{"train_info/time_between_train_steps": 0.0056629180908203125, "step": 356}
{"info/global_step": 357, "train_info/time_within_train_step": 27.891692399978638, "step": 357}
{"train_info/time_between_train_steps": 0.005610942840576172, "step": 357}
{"info/global_step": 358, "train_info/time_within_train_step": 27.927151679992676, "step": 358}
{"train_info/time_between_train_steps": 0.006050586700439453, "step": 358}
{"info/global_step": 359, "train_info/time_within_train_step": 28.016385078430176, "step": 359}
{"train_info/time_between_train_steps": 0.005617856979370117, "step": 359}
{"info/global_step": 360, "train_info/time_within_train_step": 27.848596572875977, "step": 360}
{"train_info/time_between_train_steps": 0.0060024261474609375, "step": 360}
{"train_info/time_between_train_steps": 5.487926959991455, "step": 360}
{"info/global_step": 361, "train_info/time_within_train_step": 27.910669088363647, "step": 361}
{"train_info/time_between_train_steps": 0.010767936706542969, "step": 361}
{"info/global_step": 362, "train_info/time_within_train_step": 28.05900502204895, "step": 362}
{"train_info/time_between_train_steps": 0.005725383758544922, "step": 362}
{"info/global_step": 363, "train_info/time_within_train_step": 27.927067756652832, "step": 363}
{"train_info/time_between_train_steps": 0.0055768489837646484, "step": 363}
{"info/global_step": 364, "train_info/time_within_train_step": 27.906662464141846, "step": 364}
{"train_info/time_between_train_steps": 0.005615234375, "step": 364}
{"info/global_step": 365, "train_info/time_within_train_step": 28.010314226150513, "step": 365}
{"train_info/time_between_train_steps": 0.014490604400634766, "step": 365}
{"info/global_step": 366, "train_info/time_within_train_step": 27.816113233566284, "step": 366}
{"train_info/time_between_train_steps": 0.005274772644042969, "step": 366}
{"info/global_step": 367, "train_info/time_within_train_step": 27.923080921173096, "step": 367}
{"train_info/time_between_train_steps": 0.009685516357421875, "step": 367}
{"info/global_step": 368, "train_info/time_within_train_step": 27.908674001693726, "step": 368}
{"train_info/time_between_train_steps": 0.010564327239990234, "step": 368}
{"info/global_step": 369, "train_info/time_within_train_step": 27.894200086593628, "step": 369}
{"train_info/time_between_train_steps": 0.005381107330322266, "step": 369}
{"info/global_step": 370, "train_info/time_within_train_step": 27.835965156555176, "step": 370}
{"train_info/time_between_train_steps": 0.005221366882324219, "step": 370}
{"info/global_step": 371, "train_info/time_within_train_step": 27.866164684295654, "step": 371}
{"train_info/time_between_train_steps": 0.005327701568603516, "step": 371}
{"info/global_step": 372, "train_info/time_within_train_step": 27.922224044799805, "step": 372}
{"train_info/time_between_train_steps": 0.005484104156494141, "step": 372}
{"info/global_step": 373, "train_info/time_within_train_step": 27.93669080734253, "step": 373}
{"train_info/time_between_train_steps": 0.005464792251586914, "step": 373}
{"info/global_step": 374, "train_info/time_within_train_step": 27.982857704162598, "step": 374}
{"train_info/time_between_train_steps": 0.010157108306884766, "step": 374}
{"info/global_step": 375, "train_info/time_within_train_step": 27.819478511810303, "step": 375}
{"train_info/time_between_train_steps": 0.008983850479125977, "step": 375}
{"info/global_step": 376, "train_info/time_within_train_step": 27.968738079071045, "step": 376}
{"train_info/time_between_train_steps": 0.005590677261352539, "step": 376}
{"info/global_step": 377, "train_info/time_within_train_step": 27.891096115112305, "step": 377}
{"train_info/time_between_train_steps": 0.005487203598022461, "step": 377}
{"info/global_step": 378, "train_info/time_within_train_step": 27.92504358291626, "step": 378}
{"train_info/time_between_train_steps": 0.0057337284088134766, "step": 378}
{"info/global_step": 379, "train_info/time_within_train_step": 27.873619079589844, "step": 379}
{"train_info/time_between_train_steps": 0.005158662796020508, "step": 379}
{"info/global_step": 380, "train_info/time_within_train_step": 27.91353416442871, "step": 380}
{"train_info/time_between_train_steps": 0.00658416748046875, "step": 380}
{"info/global_step": 381, "train_info/time_within_train_step": 27.88924789428711, "step": 381}
{"train_info/time_between_train_steps": 0.005296468734741211, "step": 381}
{"info/global_step": 382, "train_info/time_within_train_step": 27.89810347557068, "step": 382}
{"train_info/time_between_train_steps": 0.005716085433959961, "step": 382}
{"info/global_step": 383, "train_info/time_within_train_step": 27.965447425842285, "step": 383}
{"train_info/time_between_train_steps": 0.015073299407958984, "step": 383}
{"info/global_step": 384, "train_info/time_within_train_step": 27.93622589111328, "step": 384}
{"train_info/time_between_train_steps": 0.010890483856201172, "step": 384}
{"train_info/time_between_train_steps": 5.232351064682007, "step": 384}
{"info/global_step": 385, "train_info/time_within_train_step": 27.88042116165161, "step": 385}
{"train_info/time_between_train_steps": 0.005445241928100586, "step": 385}
{"info/global_step": 386, "train_info/time_within_train_step": 28.035608053207397, "step": 386}
{"train_info/time_between_train_steps": 0.010398387908935547, "step": 386}
{"info/global_step": 387, "train_info/time_within_train_step": 27.923914670944214, "step": 387}
{"train_info/time_between_train_steps": 0.00563359260559082, "step": 387}
{"info/global_step": 388, "train_info/time_within_train_step": 27.99910283088684, "step": 388}
{"train_info/time_between_train_steps": 0.005629777908325195, "step": 388}
{"info/global_step": 389, "train_info/time_within_train_step": 27.885318994522095, "step": 389}
{"train_info/time_between_train_steps": 0.005276679992675781, "step": 389}
{"info/global_step": 390, "train_info/time_within_train_step": 27.94597625732422, "step": 390}
{"train_info/time_between_train_steps": 0.005300760269165039, "step": 390}
{"info/global_step": 391, "train_info/time_within_train_step": 27.91901183128357, "step": 391}
{"train_info/time_between_train_steps": 0.0051059722900390625, "step": 391}
{"info/global_step": 392, "train_info/time_within_train_step": 27.922277688980103, "step": 392}
{"train_info/time_between_train_steps": 0.010256052017211914, "step": 392}
{"info/global_step": 393, "train_info/time_within_train_step": 27.946816444396973, "step": 393}
{"train_info/time_between_train_steps": 0.005426645278930664, "step": 393}
{"info/global_step": 394, "train_info/time_within_train_step": 27.813148260116577, "step": 394}
{"train_info/time_between_train_steps": 0.005214691162109375, "step": 394}
{"info/global_step": 395, "train_info/time_within_train_step": 28.031450510025024, "step": 395}
{"train_info/time_between_train_steps": 0.010218620300292969, "step": 395}
{"info/global_step": 396, "train_info/time_within_train_step": 27.832324743270874, "step": 396}
{"train_info/time_between_train_steps": 0.005281686782836914, "step": 396}
{"info/global_step": 397, "train_info/time_within_train_step": 27.890445232391357, "step": 397}
{"train_info/time_between_train_steps": 0.005423545837402344, "step": 397}
{"info/global_step": 398, "train_info/time_within_train_step": 27.870547771453857, "step": 398}
{"train_info/time_between_train_steps": 0.00529170036315918, "step": 398}
{"info/global_step": 399, "train_info/time_within_train_step": 27.923609733581543, "step": 399}
{"train_info/time_between_train_steps": 0.006553173065185547, "step": 399}
{"info/global_step": 400, "train_info/time_within_train_step": 27.91495633125305, "step": 400}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22648.0, "train_info/memory_max_reserved": 22648.0, "_timestamp": 1733873596, "_runtime": 11908}, "step": 400}
{"logs": {"train/loss": 5.1141, "train/learning_rate": 0.00044444444444444436, "train/epoch": 16.01, "_timestamp": 1733873596, "_runtime": 11908}, "step": 400}
{"train_info/time_between_train_steps": 2.3100426197052, "step": 400}
{"info/global_step": 401, "train_info/time_within_train_step": 27.960118770599365, "step": 401}
{"train_info/time_between_train_steps": 0.010901212692260742, "step": 401}
{"info/global_step": 402, "train_info/time_within_train_step": 27.82571816444397, "step": 402}
{"train_info/time_between_train_steps": 0.005398988723754883, "step": 402}
{"info/global_step": 403, "train_info/time_within_train_step": 27.9453444480896, "step": 403}
{"train_info/time_between_train_steps": 0.01426243782043457, "step": 403}
{"info/global_step": 404, "train_info/time_within_train_step": 27.875283002853394, "step": 404}
{"train_info/time_between_train_steps": 0.005678892135620117, "step": 404}
{"info/global_step": 405, "train_info/time_within_train_step": 27.934632062911987, "step": 405}
{"train_info/time_between_train_steps": 0.005330562591552734, "step": 405}
{"info/global_step": 406, "train_info/time_within_train_step": 27.880878925323486, "step": 406}
{"train_info/time_between_train_steps": 0.005694866180419922, "step": 406}
{"info/global_step": 407, "train_info/time_within_train_step": 27.85265612602234, "step": 407}
{"train_info/time_between_train_steps": 0.005730152130126953, "step": 407}
{"info/global_step": 408, "train_info/time_within_train_step": 27.920149087905884, "step": 408}
{"train_info/time_between_train_steps": 0.006062984466552734, "step": 408}
{"train_info/time_between_train_steps": 5.215541124343872, "step": 408}
{"info/global_step": 409, "train_info/time_within_train_step": 27.87403392791748, "step": 409}
{"train_info/time_between_train_steps": 0.010165929794311523, "step": 409}
{"info/global_step": 410, "train_info/time_within_train_step": 28.105641841888428, "step": 410}
{"train_info/time_between_train_steps": 0.005406618118286133, "step": 410}
{"info/global_step": 411, "train_info/time_within_train_step": 27.8521511554718, "step": 411}
{"train_info/time_between_train_steps": 0.00648951530456543, "step": 411}
{"info/global_step": 412, "train_info/time_within_train_step": 28.015289783477783, "step": 412}
{"train_info/time_between_train_steps": 0.005639076232910156, "step": 412}
{"info/global_step": 413, "train_info/time_within_train_step": 27.95787477493286, "step": 413}
{"train_info/time_between_train_steps": 0.014213323593139648, "step": 413}
{"info/global_step": 414, "train_info/time_within_train_step": 27.87571358680725, "step": 414}
{"train_info/time_between_train_steps": 0.005636930465698242, "step": 414}
{"info/global_step": 415, "train_info/time_within_train_step": 27.94058871269226, "step": 415}
{"train_info/time_between_train_steps": 0.005146503448486328, "step": 415}
{"info/global_step": 416, "train_info/time_within_train_step": 27.896914958953857, "step": 416}
{"train_info/time_between_train_steps": 0.00959634780883789, "step": 416}
{"info/global_step": 417, "train_info/time_within_train_step": 27.883610725402832, "step": 417}
{"train_info/time_between_train_steps": 0.005218029022216797, "step": 417}
{"info/global_step": 418, "train_info/time_within_train_step": 27.903810024261475, "step": 418}
{"train_info/time_between_train_steps": 0.005398750305175781, "step": 418}
{"info/global_step": 419, "train_info/time_within_train_step": 27.812946796417236, "step": 419}
{"train_info/time_between_train_steps": 0.01419520378112793, "step": 419}
{"info/global_step": 420, "train_info/time_within_train_step": 27.90622115135193, "step": 420}
{"train_info/time_between_train_steps": 0.0100860595703125, "step": 420}
{"info/global_step": 421, "train_info/time_within_train_step": 28.07691717147827, "step": 421}
{"train_info/time_between_train_steps": 0.013910293579101562, "step": 421}
{"info/global_step": 422, "train_info/time_within_train_step": 27.86402177810669, "step": 422}
{"train_info/time_between_train_steps": 0.010456085205078125, "step": 422}
{"info/global_step": 423, "train_info/time_within_train_step": 27.864712238311768, "step": 423}
{"train_info/time_between_train_steps": 0.005240917205810547, "step": 423}
{"info/global_step": 424, "train_info/time_within_train_step": 27.85373544692993, "step": 424}
{"train_info/time_between_train_steps": 0.00566411018371582, "step": 424}
{"info/global_step": 425, "train_info/time_within_train_step": 27.910603523254395, "step": 425}
{"train_info/time_between_train_steps": 0.010902881622314453, "step": 425}
{"info/global_step": 426, "train_info/time_within_train_step": 27.866512775421143, "step": 426}
{"train_info/time_between_train_steps": 0.005379438400268555, "step": 426}
{"info/global_step": 427, "train_info/time_within_train_step": 27.883288621902466, "step": 427}
{"train_info/time_between_train_steps": 0.005482196807861328, "step": 427}
{"info/global_step": 428, "train_info/time_within_train_step": 27.89821982383728, "step": 428}
{"train_info/time_between_train_steps": 0.006619930267333984, "step": 428}
{"info/global_step": 429, "train_info/time_within_train_step": 27.90566897392273, "step": 429}
{"train_info/time_between_train_steps": 0.009766340255737305, "step": 429}
{"info/global_step": 430, "train_info/time_within_train_step": 27.890706777572632, "step": 430}
{"train_info/time_between_train_steps": 0.005345821380615234, "step": 430}
{"info/global_step": 431, "train_info/time_within_train_step": 27.875792503356934, "step": 431}
{"train_info/time_between_train_steps": 0.016437530517578125, "step": 431}
{"info/global_step": 432, "train_info/time_within_train_step": 27.900954723358154, "step": 432}
{"train_info/time_between_train_steps": 0.005933523178100586, "step": 432}
{"train_info/time_between_train_steps": 5.349683523178101, "step": 432}
{"info/global_step": 433, "train_info/time_within_train_step": 27.885534286499023, "step": 433}
{"train_info/time_between_train_steps": 0.005750894546508789, "step": 433}
{"info/global_step": 434, "train_info/time_within_train_step": 27.9525887966156, "step": 434}
{"train_info/time_between_train_steps": 0.009895801544189453, "step": 434}
{"info/global_step": 435, "train_info/time_within_train_step": 27.83566117286682, "step": 435}
{"train_info/time_between_train_steps": 0.005357265472412109, "step": 435}
{"info/global_step": 436, "train_info/time_within_train_step": 27.940978288650513, "step": 436}
{"train_info/time_between_train_steps": 0.010418891906738281, "step": 436}
{"info/global_step": 437, "train_info/time_within_train_step": 27.980412483215332, "step": 437}
{"train_info/time_between_train_steps": 0.0063152313232421875, "step": 437}
{"info/global_step": 438, "train_info/time_within_train_step": 27.86991834640503, "step": 438}
{"train_info/time_between_train_steps": 0.005168437957763672, "step": 438}
{"info/global_step": 439, "train_info/time_within_train_step": 27.884427547454834, "step": 439}
{"train_info/time_between_train_steps": 0.008323907852172852, "step": 439}
{"info/global_step": 440, "train_info/time_within_train_step": 27.893783807754517, "step": 440}
{"train_info/time_between_train_steps": 0.005981922149658203, "step": 440}
{"info/global_step": 441, "train_info/time_within_train_step": 27.8704776763916, "step": 441}
{"train_info/time_between_train_steps": 0.009710073471069336, "step": 441}
{"info/global_step": 442, "train_info/time_within_train_step": 27.863332509994507, "step": 442}
{"train_info/time_between_train_steps": 0.0054018497467041016, "step": 442}
{"info/global_step": 443, "train_info/time_within_train_step": 27.86281991004944, "step": 443}
{"train_info/time_between_train_steps": 0.010308027267456055, "step": 443}
{"info/global_step": 444, "train_info/time_within_train_step": 27.92629861831665, "step": 444}
{"train_info/time_between_train_steps": 0.006601095199584961, "step": 444}
{"info/global_step": 445, "train_info/time_within_train_step": 27.84630036354065, "step": 445}
{"train_info/time_between_train_steps": 0.008348226547241211, "step": 445}
{"info/global_step": 446, "train_info/time_within_train_step": 27.856345176696777, "step": 446}
{"train_info/time_between_train_steps": 0.0060961246490478516, "step": 446}
{"info/global_step": 447, "train_info/time_within_train_step": 27.856279611587524, "step": 447}
{"train_info/time_between_train_steps": 0.010698556900024414, "step": 447}
{"info/global_step": 448, "train_info/time_within_train_step": 27.88671612739563, "step": 448}
{"train_info/time_between_train_steps": 0.0057773590087890625, "step": 448}
{"info/global_step": 449, "train_info/time_within_train_step": 27.800527334213257, "step": 449}
{"train_info/time_between_train_steps": 0.006496906280517578, "step": 449}
{"info/global_step": 450, "train_info/time_within_train_step": 27.81158995628357, "step": 450}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22648.0, "train_info/memory_max_reserved": 22648.0, "_timestamp": 1733875004, "_runtime": 13316}, "step": 450}
{"logs": {"train/loss": 4.9877, "train/learning_rate": 0.00041666666666666664, "train/epoch": 18.02, "_timestamp": 1733875004, "_runtime": 13316}, "step": 450}
{"train_info/time_between_train_steps": 0.0074841976165771484, "step": 450}
{"info/global_step": 451, "train_info/time_within_train_step": 27.803152561187744, "step": 451}
{"train_info/time_between_train_steps": 0.00532841682434082, "step": 451}
{"info/global_step": 452, "train_info/time_within_train_step": 27.996629238128662, "step": 452}
{"train_info/time_between_train_steps": 0.005557060241699219, "step": 452}
{"info/global_step": 453, "train_info/time_within_train_step": 27.90078353881836, "step": 453}
{"train_info/time_between_train_steps": 0.0054361820220947266, "step": 453}
{"info/global_step": 454, "train_info/time_within_train_step": 27.82730531692505, "step": 454}
{"train_info/time_between_train_steps": 0.005541324615478516, "step": 454}
{"info/global_step": 455, "train_info/time_within_train_step": 27.92565107345581, "step": 455}
{"train_info/time_between_train_steps": 0.015038013458251953, "step": 455}
{"info/global_step": 456, "train_info/time_within_train_step": 27.925771236419678, "step": 456}
{"train_info/time_between_train_steps": 0.0060122013092041016, "step": 456}
{"train_info/time_between_train_steps": 5.15233588218689, "step": 456}
{"info/global_step": 457, "train_info/time_within_train_step": 27.909586191177368, "step": 457}
{"train_info/time_between_train_steps": 0.006040334701538086, "step": 457}
{"info/global_step": 458, "train_info/time_within_train_step": 28.137542963027954, "step": 458}
{"train_info/time_between_train_steps": 0.011893987655639648, "step": 458}
{"info/global_step": 459, "train_info/time_within_train_step": 27.95271396636963, "step": 459}
{"train_info/time_between_train_steps": 0.006497621536254883, "step": 459}
{"info/global_step": 460, "train_info/time_within_train_step": 28.001882314682007, "step": 460}
{"train_info/time_between_train_steps": 0.005715847015380859, "step": 460}
{"info/global_step": 461, "train_info/time_within_train_step": 27.925892114639282, "step": 461}
{"train_info/time_between_train_steps": 0.005464792251586914, "step": 461}
{"info/global_step": 462, "train_info/time_within_train_step": 27.843188285827637, "step": 462}
{"train_info/time_between_train_steps": 0.01022195816040039, "step": 462}
{"info/global_step": 463, "train_info/time_within_train_step": 27.835870265960693, "step": 463}
{"train_info/time_between_train_steps": 0.00530552864074707, "step": 463}
{"info/global_step": 464, "train_info/time_within_train_step": 27.901309967041016, "step": 464}
{"train_info/time_between_train_steps": 0.01144099235534668, "step": 464}
{"info/global_step": 465, "train_info/time_within_train_step": 27.88672947883606, "step": 465}
{"train_info/time_between_train_steps": 0.009938240051269531, "step": 465}
{"info/global_step": 466, "train_info/time_within_train_step": 27.887600421905518, "step": 466}
{"train_info/time_between_train_steps": 0.00989675521850586, "step": 466}
{"info/global_step": 467, "train_info/time_within_train_step": 27.849918127059937, "step": 467}
{"train_info/time_between_train_steps": 0.005476474761962891, "step": 467}
{"info/global_step": 468, "train_info/time_within_train_step": 27.953349828720093, "step": 468}
{"train_info/time_between_train_steps": 0.011000633239746094, "step": 468}
{"info/global_step": 469, "train_info/time_within_train_step": 27.874753713607788, "step": 469}
{"train_info/time_between_train_steps": 0.0054209232330322266, "step": 469}
{"info/global_step": 470, "train_info/time_within_train_step": 27.884888172149658, "step": 470}
{"train_info/time_between_train_steps": 0.005951881408691406, "step": 470}
{"info/global_step": 471, "train_info/time_within_train_step": 27.82809352874756, "step": 471}
{"train_info/time_between_train_steps": 0.00557255744934082, "step": 471}
{"info/global_step": 472, "train_info/time_within_train_step": 27.86241579055786, "step": 472}
{"train_info/time_between_train_steps": 0.010120391845703125, "step": 472}
{"info/global_step": 473, "train_info/time_within_train_step": 27.844380378723145, "step": 473}
{"train_info/time_between_train_steps": 0.005620718002319336, "step": 473}
{"info/global_step": 474, "train_info/time_within_train_step": 27.89250683784485, "step": 474}
{"train_info/time_between_train_steps": 0.005524635314941406, "step": 474}
{"info/global_step": 475, "train_info/time_within_train_step": 27.882616758346558, "step": 475}
{"train_info/time_between_train_steps": 0.005684852600097656, "step": 475}
{"info/global_step": 476, "train_info/time_within_train_step": 27.834041118621826, "step": 476}
{"train_info/time_between_train_steps": 0.005663394927978516, "step": 476}
{"info/global_step": 477, "train_info/time_within_train_step": 27.90588068962097, "step": 477}
{"train_info/time_between_train_steps": 0.00581669807434082, "step": 477}
{"info/global_step": 478, "train_info/time_within_train_step": 27.864700078964233, "step": 478}
{"train_info/time_between_train_steps": 0.006318092346191406, "step": 478}
{"info/global_step": 479, "train_info/time_within_train_step": 27.850335597991943, "step": 479}
{"train_info/time_between_train_steps": 0.005738019943237305, "step": 479}
{"info/global_step": 480, "train_info/time_within_train_step": 27.91063904762268, "step": 480}
{"train_info/time_between_train_steps": 0.007357120513916016, "step": 480}
{"train_info/time_between_train_steps": 5.296358585357666, "step": 480}
{"info/global_step": 481, "train_info/time_within_train_step": 27.84310793876648, "step": 481}
{"train_info/time_between_train_steps": 0.005970478057861328, "step": 481}
{"info/global_step": 482, "train_info/time_within_train_step": 27.996733903884888, "step": 482}
{"train_info/time_between_train_steps": 0.005694389343261719, "step": 482}
{"info/global_step": 483, "train_info/time_within_train_step": 27.973267555236816, "step": 483}
{"train_info/time_between_train_steps": 0.01124882698059082, "step": 483}
{"info/global_step": 484, "train_info/time_within_train_step": 27.917524814605713, "step": 484}
{"train_info/time_between_train_steps": 0.00571441650390625, "step": 484}
{"info/global_step": 485, "train_info/time_within_train_step": 27.860389947891235, "step": 485}
{"train_info/time_between_train_steps": 0.00542759895324707, "step": 485}
{"info/global_step": 486, "train_info/time_within_train_step": 27.826270818710327, "step": 486}
{"train_info/time_between_train_steps": 0.0060253143310546875, "step": 486}
{"info/global_step": 487, "train_info/time_within_train_step": 27.85361337661743, "step": 487}
{"train_info/time_between_train_steps": 0.005337715148925781, "step": 487}
{"info/global_step": 488, "train_info/time_within_train_step": 27.836999893188477, "step": 488}
{"train_info/time_between_train_steps": 0.0056018829345703125, "step": 488}
{"info/global_step": 489, "train_info/time_within_train_step": 27.85642695426941, "step": 489}
{"train_info/time_between_train_steps": 0.005617856979370117, "step": 489}
{"info/global_step": 490, "train_info/time_within_train_step": 27.831857681274414, "step": 490}
{"train_info/time_between_train_steps": 0.011475324630737305, "step": 490}
{"info/global_step": 491, "train_info/time_within_train_step": 27.851728916168213, "step": 491}
{"train_info/time_between_train_steps": 0.00559544563293457, "step": 491}
{"info/global_step": 492, "train_info/time_within_train_step": 27.86044979095459, "step": 492}
{"train_info/time_between_train_steps": 0.014014959335327148, "step": 492}
{"info/global_step": 493, "train_info/time_within_train_step": 27.872878313064575, "step": 493}
{"train_info/time_between_train_steps": 0.005593299865722656, "step": 493}
{"info/global_step": 494, "train_info/time_within_train_step": 27.82900619506836, "step": 494}
{"train_info/time_between_train_steps": 0.010349273681640625, "step": 494}
{"info/global_step": 495, "train_info/time_within_train_step": 27.82022786140442, "step": 495}
{"train_info/time_between_train_steps": 0.011099100112915039, "step": 495}
{"info/global_step": 496, "train_info/time_within_train_step": 27.86856961250305, "step": 496}
{"train_info/time_between_train_steps": 0.0054931640625, "step": 496}
{"info/global_step": 497, "train_info/time_within_train_step": 27.846609354019165, "step": 497}
{"train_info/time_between_train_steps": 0.005639314651489258, "step": 497}
{"info/global_step": 498, "train_info/time_within_train_step": 27.828230619430542, "step": 498}
{"train_info/time_between_train_steps": 0.005542278289794922, "step": 498}
{"info/global_step": 499, "train_info/time_within_train_step": 27.958035707473755, "step": 499}
{"train_info/time_between_train_steps": 0.010689735412597656, "step": 499}
{"info/global_step": 500, "train_info/time_within_train_step": 27.839276552200317, "step": 500}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22648.0, "train_info/memory_max_reserved": 22648.0, "_timestamp": 1733876409, "_runtime": 14721}, "step": 500}
{"logs": {"train/loss": 4.8652, "train/learning_rate": 0.00038888888888888887, "train/epoch": 20.02, "_timestamp": 1733876409, "_runtime": 14721}, "step": 500}
{"train_info/time_between_train_steps": 2.394805908203125, "step": 500}
{"info/global_step": 501, "train_info/time_within_train_step": 27.87432885169983, "step": 501}
{"train_info/time_between_train_steps": 0.010862588882446289, "step": 501}
{"info/global_step": 502, "train_info/time_within_train_step": 27.8777072429657, "step": 502}
{"train_info/time_between_train_steps": 0.005761861801147461, "step": 502}
{"info/global_step": 503, "train_info/time_within_train_step": 27.890493631362915, "step": 503}
{"train_info/time_between_train_steps": 0.010388374328613281, "step": 503}
{"info/global_step": 504, "train_info/time_within_train_step": 27.889983892440796, "step": 504}
{"train_info/time_between_train_steps": 0.0061185359954833984, "step": 504}
{"train_info/time_between_train_steps": 5.4197797775268555, "step": 504}
{"info/global_step": 505, "train_info/time_within_train_step": 27.843919038772583, "step": 505}
{"train_info/time_between_train_steps": 0.0056915283203125, "step": 505}
{"info/global_step": 506, "train_info/time_within_train_step": 28.030489921569824, "step": 506}
{"train_info/time_between_train_steps": 0.005544185638427734, "step": 506}
{"info/global_step": 507, "train_info/time_within_train_step": 27.894803285598755, "step": 507}
{"train_info/time_between_train_steps": 0.005391597747802734, "step": 507}
{"info/global_step": 508, "train_info/time_within_train_step": 27.943537950515747, "step": 508}
{"train_info/time_between_train_steps": 0.005640745162963867, "step": 508}
{"info/global_step": 509, "train_info/time_within_train_step": 27.828128814697266, "step": 509}
{"train_info/time_between_train_steps": 0.005241870880126953, "step": 509}
{"info/global_step": 510, "train_info/time_within_train_step": 27.823890924453735, "step": 510}
{"train_info/time_between_train_steps": 0.005310535430908203, "step": 510}
{"info/global_step": 511, "train_info/time_within_train_step": 27.840429306030273, "step": 511}
{"train_info/time_between_train_steps": 0.005288362503051758, "step": 511}
{"info/global_step": 512, "train_info/time_within_train_step": 27.854710817337036, "step": 512}
{"train_info/time_between_train_steps": 0.005129814147949219, "step": 512}
{"info/global_step": 513, "train_info/time_within_train_step": 27.868507146835327, "step": 513}
{"train_info/time_between_train_steps": 0.006006002426147461, "step": 513}
{"info/global_step": 514, "train_info/time_within_train_step": 27.93352437019348, "step": 514}
{"train_info/time_between_train_steps": 0.005305767059326172, "step": 514}
{"info/global_step": 515, "train_info/time_within_train_step": 27.83526039123535, "step": 515}
{"train_info/time_between_train_steps": 0.010460376739501953, "step": 515}
{"info/global_step": 516, "train_info/time_within_train_step": 27.841933250427246, "step": 516}
{"train_info/time_between_train_steps": 0.005476713180541992, "step": 516}
{"info/global_step": 517, "train_info/time_within_train_step": 27.84576439857483, "step": 517}
{"train_info/time_between_train_steps": 0.0052182674407958984, "step": 517}
{"info/global_step": 518, "train_info/time_within_train_step": 27.84359884262085, "step": 518}
{"train_info/time_between_train_steps": 0.005664825439453125, "step": 518}
{"info/global_step": 519, "train_info/time_within_train_step": 27.852445125579834, "step": 519}
{"train_info/time_between_train_steps": 0.006258964538574219, "step": 519}
{"info/global_step": 520, "train_info/time_within_train_step": 27.842531204223633, "step": 520}
{"train_info/time_between_train_steps": 0.00561070442199707, "step": 520}
{"info/global_step": 521, "train_info/time_within_train_step": 27.889511108398438, "step": 521}
{"train_info/time_between_train_steps": 0.009637832641601562, "step": 521}
{"info/global_step": 522, "train_info/time_within_train_step": 27.802544832229614, "step": 522}
{"train_info/time_between_train_steps": 0.0051920413970947266, "step": 522}
{"info/global_step": 523, "train_info/time_within_train_step": 27.8525447845459, "step": 523}
{"train_info/time_between_train_steps": 0.0055637359619140625, "step": 523}
{"info/global_step": 524, "train_info/time_within_train_step": 27.80139923095703, "step": 524}
{"train_info/time_between_train_steps": 0.010105133056640625, "step": 524}
{"info/global_step": 525, "train_info/time_within_train_step": 27.865301370620728, "step": 525}
{"train_info/time_between_train_steps": 0.005692720413208008, "step": 525}
{"info/global_step": 526, "train_info/time_within_train_step": 27.88852858543396, "step": 526}
{"train_info/time_between_train_steps": 0.005749702453613281, "step": 526}
{"info/global_step": 527, "train_info/time_within_train_step": 27.896571159362793, "step": 527}
{"train_info/time_between_train_steps": 0.007287263870239258, "step": 527}
{"info/global_step": 528, "train_info/time_within_train_step": 27.88986873626709, "step": 528}
{"train_info/time_between_train_steps": 0.011726617813110352, "step": 528}
{"train_info/time_between_train_steps": 5.120944023132324, "step": 528}
{"info/global_step": 529, "train_info/time_within_train_step": 27.89640474319458, "step": 529}
{"train_info/time_between_train_steps": 0.005939006805419922, "step": 529}
{"info/global_step": 530, "train_info/time_within_train_step": 28.218708515167236, "step": 530}
{"train_info/time_between_train_steps": 0.005604267120361328, "step": 530}
{"info/global_step": 531, "train_info/time_within_train_step": 27.859265327453613, "step": 531}
{"train_info/time_between_train_steps": 0.0059545040130615234, "step": 531}
{"info/global_step": 532, "train_info/time_within_train_step": 27.967445850372314, "step": 532}
{"train_info/time_between_train_steps": 0.005720376968383789, "step": 532}
{"info/global_step": 533, "train_info/time_within_train_step": 27.89865231513977, "step": 533}
{"train_info/time_between_train_steps": 0.0056056976318359375, "step": 533}
{"info/global_step": 534, "train_info/time_within_train_step": 27.8799991607666, "step": 534}
{"train_info/time_between_train_steps": 0.005559206008911133, "step": 534}
{"info/global_step": 535, "train_info/time_within_train_step": 27.83234429359436, "step": 535}
{"train_info/time_between_train_steps": 0.005421161651611328, "step": 535}
{"info/global_step": 536, "train_info/time_within_train_step": 27.84687352180481, "step": 536}
{"train_info/time_between_train_steps": 0.005324840545654297, "step": 536}
{"info/global_step": 537, "train_info/time_within_train_step": 27.812856674194336, "step": 537}
{"train_info/time_between_train_steps": 0.005374908447265625, "step": 537}
{"info/global_step": 538, "train_info/time_within_train_step": 27.82063102722168, "step": 538}
{"train_info/time_between_train_steps": 0.005239248275756836, "step": 538}
{"info/global_step": 539, "train_info/time_within_train_step": 27.82723379135132, "step": 539}
{"train_info/time_between_train_steps": 0.005295991897583008, "step": 539}
{"info/global_step": 540, "train_info/time_within_train_step": 27.811086177825928, "step": 540}
{"train_info/time_between_train_steps": 0.005580425262451172, "step": 540}
{"info/global_step": 541, "train_info/time_within_train_step": 27.837977409362793, "step": 541}
{"train_info/time_between_train_steps": 0.005512237548828125, "step": 541}
{"info/global_step": 542, "train_info/time_within_train_step": 27.830695629119873, "step": 542}
{"train_info/time_between_train_steps": 0.005494594573974609, "step": 542}
{"info/global_step": 543, "train_info/time_within_train_step": 27.867006301879883, "step": 543}
{"train_info/time_between_train_steps": 0.005351066589355469, "step": 543}
{"info/global_step": 544, "train_info/time_within_train_step": 27.807859659194946, "step": 544}
{"train_info/time_between_train_steps": 0.005249977111816406, "step": 544}
{"info/global_step": 545, "train_info/time_within_train_step": 27.82230019569397, "step": 545}
{"train_info/time_between_train_steps": 0.010681867599487305, "step": 545}
{"info/global_step": 546, "train_info/time_within_train_step": 27.970029592514038, "step": 546}
{"train_info/time_between_train_steps": 0.006182193756103516, "step": 546}
{"info/global_step": 547, "train_info/time_within_train_step": 27.87220859527588, "step": 547}
{"train_info/time_between_train_steps": 0.005524396896362305, "step": 547}
{"info/global_step": 548, "train_info/time_within_train_step": 27.823115825653076, "step": 548}
{"train_info/time_between_train_steps": 0.005835056304931641, "step": 548}
{"info/global_step": 549, "train_info/time_within_train_step": 27.857767820358276, "step": 549}
{"train_info/time_between_train_steps": 0.005532026290893555, "step": 549}
{"info/global_step": 550, "train_info/time_within_train_step": 27.86286187171936, "step": 550}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22648.0, "train_info/memory_max_reserved": 22648.0, "_timestamp": 1733877816, "_runtime": 16128}, "step": 550}
{"logs": {"train/loss": 4.7263, "train/learning_rate": 0.0003611111111111111, "train/epoch": 22.02, "_timestamp": 1733877816, "_runtime": 16128}, "step": 550}
{"train_info/time_between_train_steps": 0.007869482040405273, "step": 550}
{"info/global_step": 551, "train_info/time_within_train_step": 27.906161546707153, "step": 551}
{"train_info/time_between_train_steps": 0.005956411361694336, "step": 551}
{"info/global_step": 552, "train_info/time_within_train_step": 27.835118293762207, "step": 552}
{"train_info/time_between_train_steps": 0.006093740463256836, "step": 552}
{"train_info/time_between_train_steps": 5.284787654876709, "step": 552}
{"info/global_step": 553, "train_info/time_within_train_step": 27.828003883361816, "step": 553}
{"train_info/time_between_train_steps": 0.005063533782958984, "step": 553}
{"info/global_step": 554, "train_info/time_within_train_step": 27.94733953475952, "step": 554}
{"train_info/time_between_train_steps": 0.005703926086425781, "step": 554}
{"info/global_step": 555, "train_info/time_within_train_step": 27.92203974723816, "step": 555}
{"train_info/time_between_train_steps": 0.005499839782714844, "step": 555}
{"info/global_step": 556, "train_info/time_within_train_step": 27.90157985687256, "step": 556}
{"train_info/time_between_train_steps": 0.00991058349609375, "step": 556}
{"info/global_step": 557, "train_info/time_within_train_step": 27.941086053848267, "step": 557}
{"train_info/time_between_train_steps": 0.00571751594543457, "step": 557}
{"info/global_step": 558, "train_info/time_within_train_step": 27.858603954315186, "step": 558}
{"train_info/time_between_train_steps": 0.005327701568603516, "step": 558}
{"info/global_step": 559, "train_info/time_within_train_step": 27.915207147598267, "step": 559}
{"train_info/time_between_train_steps": 0.005393505096435547, "step": 559}
{"info/global_step": 560, "train_info/time_within_train_step": 27.894651412963867, "step": 560}
{"train_info/time_between_train_steps": 0.005367279052734375, "step": 560}
{"info/global_step": 561, "train_info/time_within_train_step": 27.99834942817688, "step": 561}
{"train_info/time_between_train_steps": 0.007378816604614258, "step": 561}
{"info/global_step": 562, "train_info/time_within_train_step": 27.92231774330139, "step": 562}
{"train_info/time_between_train_steps": 0.005354404449462891, "step": 562}
{"info/global_step": 563, "train_info/time_within_train_step": 27.89910888671875, "step": 563}
{"train_info/time_between_train_steps": 0.009620428085327148, "step": 563}
{"info/global_step": 564, "train_info/time_within_train_step": 27.822662115097046, "step": 564}
{"train_info/time_between_train_steps": 0.005409717559814453, "step": 564}
{"info/global_step": 565, "train_info/time_within_train_step": 27.88777995109558, "step": 565}
{"train_info/time_between_train_steps": 0.00524139404296875, "step": 565}
{"info/global_step": 566, "train_info/time_within_train_step": 27.86192226409912, "step": 566}
{"train_info/time_between_train_steps": 0.005444765090942383, "step": 566}
{"info/global_step": 567, "train_info/time_within_train_step": 27.852421045303345, "step": 567}
{"train_info/time_between_train_steps": 0.009893178939819336, "step": 567}
{"info/global_step": 568, "train_info/time_within_train_step": 27.89379858970642, "step": 568}
{"train_info/time_between_train_steps": 0.005529165267944336, "step": 568}
{"info/global_step": 569, "train_info/time_within_train_step": 27.851369619369507, "step": 569}
{"train_info/time_between_train_steps": 0.005176544189453125, "step": 569}
{"info/global_step": 570, "train_info/time_within_train_step": 27.86748242378235, "step": 570}
{"train_info/time_between_train_steps": 0.006411552429199219, "step": 570}
{"info/global_step": 571, "train_info/time_within_train_step": 27.906250715255737, "step": 571}
{"train_info/time_between_train_steps": 0.005312204360961914, "step": 571}
{"info/global_step": 572, "train_info/time_within_train_step": 27.893706560134888, "step": 572}
{"train_info/time_between_train_steps": 0.010753870010375977, "step": 572}
{"info/global_step": 573, "train_info/time_within_train_step": 27.914600133895874, "step": 573}
{"train_info/time_between_train_steps": 0.01149606704711914, "step": 573}
{"info/global_step": 574, "train_info/time_within_train_step": 27.947702646255493, "step": 574}
{"train_info/time_between_train_steps": 0.005384922027587891, "step": 574}
{"info/global_step": 575, "train_info/time_within_train_step": 27.92045021057129, "step": 575}
{"train_info/time_between_train_steps": 0.0062482357025146484, "step": 575}
{"info/global_step": 576, "train_info/time_within_train_step": 27.906256437301636, "step": 576}
{"train_info/time_between_train_steps": 0.010857343673706055, "step": 576}
{"train_info/time_between_train_steps": 5.474336862564087, "step": 576}
{"info/global_step": 577, "train_info/time_within_train_step": 27.944814205169678, "step": 577}
{"train_info/time_between_train_steps": 0.0054705142974853516, "step": 577}
{"info/global_step": 578, "train_info/time_within_train_step": 28.054246187210083, "step": 578}
{"train_info/time_between_train_steps": 0.008492231369018555, "step": 578}
{"info/global_step": 579, "train_info/time_within_train_step": 27.874080419540405, "step": 579}
{"train_info/time_between_train_steps": 0.005407810211181641, "step": 579}
{"info/global_step": 580, "train_info/time_within_train_step": 27.935359001159668, "step": 580}
{"train_info/time_between_train_steps": 0.005383729934692383, "step": 580}
{"info/global_step": 581, "train_info/time_within_train_step": 27.85428524017334, "step": 581}
{"train_info/time_between_train_steps": 0.0074841976165771484, "step": 581}
{"info/global_step": 582, "train_info/time_within_train_step": 27.831166982650757, "step": 582}
{"train_info/time_between_train_steps": 0.009261131286621094, "step": 582}
{"info/global_step": 583, "train_info/time_within_train_step": 27.855700969696045, "step": 583}
{"train_info/time_between_train_steps": 0.0052700042724609375, "step": 583}
{"info/global_step": 584, "train_info/time_within_train_step": 27.880573272705078, "step": 584}
{"train_info/time_between_train_steps": 0.005286693572998047, "step": 584}
{"info/global_step": 585, "train_info/time_within_train_step": 27.888071537017822, "step": 585}
{"train_info/time_between_train_steps": 0.013593196868896484, "step": 585}
{"info/global_step": 586, "train_info/time_within_train_step": 27.849879026412964, "step": 586}
{"train_info/time_between_train_steps": 0.010090351104736328, "step": 586}
{"info/global_step": 587, "train_info/time_within_train_step": 27.924092054367065, "step": 587}
{"train_info/time_between_train_steps": 0.005278825759887695, "step": 587}
{"info/global_step": 588, "train_info/time_within_train_step": 27.82734966278076, "step": 588}
{"train_info/time_between_train_steps": 0.0053501129150390625, "step": 588}
{"info/global_step": 589, "train_info/time_within_train_step": 27.91457724571228, "step": 589}
{"train_info/time_between_train_steps": 0.0053327083587646484, "step": 589}
{"info/global_step": 590, "train_info/time_within_train_step": 27.881101846694946, "step": 590}
{"train_info/time_between_train_steps": 0.005130767822265625, "step": 590}
{"info/global_step": 591, "train_info/time_within_train_step": 27.862570762634277, "step": 591}
{"train_info/time_between_train_steps": 0.005700588226318359, "step": 591}
{"info/global_step": 592, "train_info/time_within_train_step": 27.955049514770508, "step": 592}
{"train_info/time_between_train_steps": 0.005343437194824219, "step": 592}
{"info/global_step": 593, "train_info/time_within_train_step": 27.93032479286194, "step": 593}
{"train_info/time_between_train_steps": 0.005692481994628906, "step": 593}
{"info/global_step": 594, "train_info/time_within_train_step": 27.88618516921997, "step": 594}
{"train_info/time_between_train_steps": 0.0054819583892822266, "step": 594}
{"info/global_step": 595, "train_info/time_within_train_step": 27.854907989501953, "step": 595}
{"train_info/time_between_train_steps": 0.005196809768676758, "step": 595}
{"info/global_step": 596, "train_info/time_within_train_step": 27.84715962409973, "step": 596}
{"train_info/time_between_train_steps": 0.0058362483978271484, "step": 596}
{"info/global_step": 597, "train_info/time_within_train_step": 27.838088750839233, "step": 597}
{"train_info/time_between_train_steps": 0.010184526443481445, "step": 597}
{"info/global_step": 598, "train_info/time_within_train_step": 27.921239614486694, "step": 598}
{"train_info/time_between_train_steps": 0.009755611419677734, "step": 598}
{"info/global_step": 599, "train_info/time_within_train_step": 27.896024227142334, "step": 599}
{"train_info/time_between_train_steps": 0.011821508407592773, "step": 599}
{"info/global_step": 600, "train_info/time_within_train_step": 27.94292402267456, "step": 600}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22648.0, "train_info/memory_max_reserved": 22648.0, "_timestamp": 1733879222, "_runtime": 17534}, "step": 600}
{"logs": {"train/loss": 4.5808, "train/learning_rate": 0.0003333333333333333, "train/epoch": 24.02, "_timestamp": 1733879222, "_runtime": 17534}, "step": 600}
{"train_info/time_between_train_steps": 2.839597225189209, "step": 600}
{"train_info/time_between_train_steps": 7.952690839767456, "step": 600}
{"info/global_step": 601, "train_info/time_within_train_step": 27.817885637283325, "step": 601}
{"train_info/time_between_train_steps": 0.009822845458984375, "step": 601}
{"info/global_step": 602, "train_info/time_within_train_step": 28.11079692840576, "step": 602}
{"train_info/time_between_train_steps": 0.005141258239746094, "step": 602}
{"info/global_step": 603, "train_info/time_within_train_step": 27.870774745941162, "step": 603}
{"train_info/time_between_train_steps": 0.010284900665283203, "step": 603}
{"info/global_step": 604, "train_info/time_within_train_step": 27.955245971679688, "step": 604}
{"train_info/time_between_train_steps": 0.005579233169555664, "step": 604}
{"info/global_step": 605, "train_info/time_within_train_step": 27.851816654205322, "step": 605}
{"train_info/time_between_train_steps": 0.005100727081298828, "step": 605}
{"info/global_step": 606, "train_info/time_within_train_step": 27.849857807159424, "step": 606}
{"train_info/time_between_train_steps": 0.005554676055908203, "step": 606}
{"info/global_step": 607, "train_info/time_within_train_step": 27.838050603866577, "step": 607}
{"train_info/time_between_train_steps": 0.009172201156616211, "step": 607}
{"info/global_step": 608, "train_info/time_within_train_step": 27.986337423324585, "step": 608}
{"train_info/time_between_train_steps": 0.009524345397949219, "step": 608}
{"info/global_step": 609, "train_info/time_within_train_step": 27.850003957748413, "step": 609}
{"train_info/time_between_train_steps": 0.005481719970703125, "step": 609}
{"info/global_step": 610, "train_info/time_within_train_step": 27.860655307769775, "step": 610}
{"train_info/time_between_train_steps": 0.005255699157714844, "step": 610}
{"info/global_step": 611, "train_info/time_within_train_step": 27.891159772872925, "step": 611}
{"train_info/time_between_train_steps": 0.005232095718383789, "step": 611}
{"info/global_step": 612, "train_info/time_within_train_step": 27.85856342315674, "step": 612}
{"train_info/time_between_train_steps": 0.0054302215576171875, "step": 612}
{"info/global_step": 613, "train_info/time_within_train_step": 27.862857818603516, "step": 613}
{"train_info/time_between_train_steps": 0.005461215972900391, "step": 613}
{"info/global_step": 614, "train_info/time_within_train_step": 27.912312984466553, "step": 614}
{"train_info/time_between_train_steps": 0.005301952362060547, "step": 614}
{"info/global_step": 615, "train_info/time_within_train_step": 27.930366277694702, "step": 615}
{"train_info/time_between_train_steps": 0.005224943161010742, "step": 615}
{"info/global_step": 616, "train_info/time_within_train_step": 27.820459842681885, "step": 616}
{"train_info/time_between_train_steps": 0.010549068450927734, "step": 616}
{"info/global_step": 617, "train_info/time_within_train_step": 27.95806336402893, "step": 617}
{"train_info/time_between_train_steps": 0.010022401809692383, "step": 617}
{"info/global_step": 618, "train_info/time_within_train_step": 27.853299140930176, "step": 618}
{"train_info/time_between_train_steps": 0.00542449951171875, "step": 618}
{"info/global_step": 619, "train_info/time_within_train_step": 27.879270315170288, "step": 619}
{"train_info/time_between_train_steps": 0.010322809219360352, "step": 619}
{"info/global_step": 620, "train_info/time_within_train_step": 27.898733615875244, "step": 620}
{"train_info/time_between_train_steps": 0.0053937435150146484, "step": 620}
{"info/global_step": 621, "train_info/time_within_train_step": 27.862004041671753, "step": 621}
{"train_info/time_between_train_steps": 0.005614519119262695, "step": 621}
{"info/global_step": 622, "train_info/time_within_train_step": 27.875123262405396, "step": 622}
{"train_info/time_between_train_steps": 0.005391120910644531, "step": 622}
{"info/global_step": 623, "train_info/time_within_train_step": 27.894152641296387, "step": 623}
{"train_info/time_between_train_steps": 0.009673118591308594, "step": 623}
{"info/global_step": 624, "train_info/time_within_train_step": 28.011129140853882, "step": 624}
{"train_info/time_between_train_steps": 0.006047964096069336, "step": 624}
{"train_info/time_between_train_steps": 5.369655609130859, "step": 624}
{"info/global_step": 625, "train_info/time_within_train_step": 27.895280122756958, "step": 625}
{"train_info/time_between_train_steps": 0.004972696304321289, "step": 625}
{"info/global_step": 626, "train_info/time_within_train_step": 28.024032592773438, "step": 626}
{"train_info/time_between_train_steps": 0.011165380477905273, "step": 626}
{"info/global_step": 627, "train_info/time_within_train_step": 27.93697762489319, "step": 627}
{"train_info/time_between_train_steps": 0.0054209232330322266, "step": 627}
{"info/global_step": 628, "train_info/time_within_train_step": 27.882732391357422, "step": 628}
{"train_info/time_between_train_steps": 0.005675792694091797, "step": 628}
{"info/global_step": 629, "train_info/time_within_train_step": 27.885122537612915, "step": 629}
{"train_info/time_between_train_steps": 0.005019664764404297, "step": 629}
{"info/global_step": 630, "train_info/time_within_train_step": 27.8977108001709, "step": 630}
{"train_info/time_between_train_steps": 0.005239725112915039, "step": 630}
{"info/global_step": 631, "train_info/time_within_train_step": 27.897190809249878, "step": 631}
{"train_info/time_between_train_steps": 0.005419015884399414, "step": 631}
{"info/global_step": 632, "train_info/time_within_train_step": 27.897838354110718, "step": 632}
{"train_info/time_between_train_steps": 0.005216121673583984, "step": 632}
{"info/global_step": 633, "train_info/time_within_train_step": 27.852357625961304, "step": 633}
{"train_info/time_between_train_steps": 0.005405902862548828, "step": 633}
{"info/global_step": 634, "train_info/time_within_train_step": 27.894083261489868, "step": 634}
{"train_info/time_between_train_steps": 0.005175352096557617, "step": 634}
{"info/global_step": 635, "train_info/time_within_train_step": 27.8632071018219, "step": 635}
{"train_info/time_between_train_steps": 0.00528407096862793, "step": 635}
{"info/global_step": 636, "train_info/time_within_train_step": 27.94785165786743, "step": 636}
{"train_info/time_between_train_steps": 0.005322694778442383, "step": 636}
{"info/global_step": 637, "train_info/time_within_train_step": 27.882810354232788, "step": 637}
{"train_info/time_between_train_steps": 0.0061762332916259766, "step": 637}
{"info/global_step": 638, "train_info/time_within_train_step": 27.906910181045532, "step": 638}
{"train_info/time_between_train_steps": 0.005358457565307617, "step": 638}
{"info/global_step": 639, "train_info/time_within_train_step": 27.94679284095764, "step": 639}
{"train_info/time_between_train_steps": 0.005338907241821289, "step": 639}
{"info/global_step": 640, "train_info/time_within_train_step": 27.862999200820923, "step": 640}
{"train_info/time_between_train_steps": 0.005895137786865234, "step": 640}
{"info/global_step": 641, "train_info/time_within_train_step": 27.89948844909668, "step": 641}
{"train_info/time_between_train_steps": 0.005259037017822266, "step": 641}
{"info/global_step": 642, "train_info/time_within_train_step": 27.919026613235474, "step": 642}
{"train_info/time_between_train_steps": 0.011430978775024414, "step": 642}
{"info/global_step": 643, "train_info/time_within_train_step": 27.872007369995117, "step": 643}
{"train_info/time_between_train_steps": 0.005465984344482422, "step": 643}
{"info/global_step": 644, "train_info/time_within_train_step": 27.87464165687561, "step": 644}
{"train_info/time_between_train_steps": 0.0067577362060546875, "step": 644}
{"info/global_step": 645, "train_info/time_within_train_step": 27.858885288238525, "step": 645}
{"train_info/time_between_train_steps": 0.005514383316040039, "step": 645}
{"info/global_step": 646, "train_info/time_within_train_step": 27.875934839248657, "step": 646}
{"train_info/time_between_train_steps": 0.0064830780029296875, "step": 646}
{"info/global_step": 647, "train_info/time_within_train_step": 27.907817363739014, "step": 647}
{"train_info/time_between_train_steps": 0.010320425033569336, "step": 647}
{"info/global_step": 648, "train_info/time_within_train_step": 27.879340410232544, "step": 648}
{"train_info/time_between_train_steps": 0.006078958511352539, "step": 648}
{"train_info/time_between_train_steps": 5.4237892627716064, "step": 648}
{"info/global_step": 649, "train_info/time_within_train_step": 27.847715854644775, "step": 649}
{"train_info/time_between_train_steps": 0.01444387435913086, "step": 649}
{"info/global_step": 650, "train_info/time_within_train_step": 28.1419575214386, "step": 650}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22648.0, "train_info/memory_max_reserved": 22648.0, "_timestamp": 1733880636, "_runtime": 18948}, "step": 650}
{"logs": {"train/loss": 4.4631, "train/learning_rate": 0.00030555555555555555, "train/epoch": 27.0, "_timestamp": 1733880636, "_runtime": 18948}, "step": 650}
{"train_info/time_between_train_steps": 0.0076024532318115234, "step": 650}
{"info/global_step": 651, "train_info/time_within_train_step": 27.962664365768433, "step": 651}
{"train_info/time_between_train_steps": 0.005708456039428711, "step": 651}
{"info/global_step": 652, "train_info/time_within_train_step": 27.97283625602722, "step": 652}
{"train_info/time_between_train_steps": 0.009986162185668945, "step": 652}
{"info/global_step": 653, "train_info/time_within_train_step": 27.915614128112793, "step": 653}
{"train_info/time_between_train_steps": 0.0052263736724853516, "step": 653}
{"info/global_step": 654, "train_info/time_within_train_step": 27.86668062210083, "step": 654}
{"train_info/time_between_train_steps": 0.0053522586822509766, "step": 654}
{"info/global_step": 655, "train_info/time_within_train_step": 28.000743865966797, "step": 655}
{"train_info/time_between_train_steps": 0.0051631927490234375, "step": 655}
{"info/global_step": 656, "train_info/time_within_train_step": 27.86671257019043, "step": 656}
{"train_info/time_between_train_steps": 0.005816221237182617, "step": 656}
{"info/global_step": 657, "train_info/time_within_train_step": 27.914462566375732, "step": 657}
{"train_info/time_between_train_steps": 0.0054242610931396484, "step": 657}
{"info/global_step": 658, "train_info/time_within_train_step": 27.83583378791809, "step": 658}
{"train_info/time_between_train_steps": 0.00928640365600586, "step": 658}
{"info/global_step": 659, "train_info/time_within_train_step": 27.83978533744812, "step": 659}
{"train_info/time_between_train_steps": 0.0054318904876708984, "step": 659}
{"info/global_step": 660, "train_info/time_within_train_step": 27.826948881149292, "step": 660}
{"train_info/time_between_train_steps": 0.005329608917236328, "step": 660}
{"info/global_step": 661, "train_info/time_within_train_step": 27.876357793807983, "step": 661}
{"train_info/time_between_train_steps": 0.010441780090332031, "step": 661}
{"info/global_step": 662, "train_info/time_within_train_step": 27.91276979446411, "step": 662}
{"train_info/time_between_train_steps": 0.005395650863647461, "step": 662}
{"info/global_step": 663, "train_info/time_within_train_step": 27.84207057952881, "step": 663}
{"train_info/time_between_train_steps": 0.005218505859375, "step": 663}
{"info/global_step": 664, "train_info/time_within_train_step": 27.85801887512207, "step": 664}
{"train_info/time_between_train_steps": 0.0065572261810302734, "step": 664}
{"info/global_step": 665, "train_info/time_within_train_step": 27.826082229614258, "step": 665}
{"train_info/time_between_train_steps": 0.005336284637451172, "step": 665}
{"info/global_step": 666, "train_info/time_within_train_step": 27.97257161140442, "step": 666}
{"train_info/time_between_train_steps": 0.0053369998931884766, "step": 666}
{"info/global_step": 667, "train_info/time_within_train_step": 27.884641885757446, "step": 667}
{"train_info/time_between_train_steps": 0.005444526672363281, "step": 667}
{"info/global_step": 668, "train_info/time_within_train_step": 27.861114740371704, "step": 668}
{"train_info/time_between_train_steps": 0.0056304931640625, "step": 668}
{"info/global_step": 669, "train_info/time_within_train_step": 27.85574221611023, "step": 669}
{"train_info/time_between_train_steps": 0.005450725555419922, "step": 669}
{"info/global_step": 670, "train_info/time_within_train_step": 28.04161500930786, "step": 670}
{"train_info/time_between_train_steps": 0.005568265914916992, "step": 670}
{"info/global_step": 671, "train_info/time_within_train_step": 27.907753944396973, "step": 671}
{"train_info/time_between_train_steps": 0.005795478820800781, "step": 671}
{"info/global_step": 672, "train_info/time_within_train_step": 27.87393593788147, "step": 672}
{"train_info/time_between_train_steps": 0.0058290958404541016, "step": 672}
{"train_info/time_between_train_steps": 5.279158115386963, "step": 672}
{"info/global_step": 673, "train_info/time_within_train_step": 27.869053840637207, "step": 673}
{"train_info/time_between_train_steps": 0.00553131103515625, "step": 673}
{"info/global_step": 674, "train_info/time_within_train_step": 28.01433825492859, "step": 674}
{"train_info/time_between_train_steps": 0.005415916442871094, "step": 674}
{"info/global_step": 675, "train_info/time_within_train_step": 27.84256911277771, "step": 675}
{"train_info/time_between_train_steps": 0.005495786666870117, "step": 675}
{"info/global_step": 676, "train_info/time_within_train_step": 28.041896104812622, "step": 676}
{"train_info/time_between_train_steps": 0.009836196899414062, "step": 676}
{"info/global_step": 677, "train_info/time_within_train_step": 27.912744283676147, "step": 677}
{"train_info/time_between_train_steps": 0.005164146423339844, "step": 677}
{"info/global_step": 678, "train_info/time_within_train_step": 27.817155361175537, "step": 678}
{"train_info/time_between_train_steps": 0.0056400299072265625, "step": 678}
{"info/global_step": 679, "train_info/time_within_train_step": 27.905116081237793, "step": 679}
{"train_info/time_between_train_steps": 0.008977174758911133, "step": 679}
{"info/global_step": 680, "train_info/time_within_train_step": 27.985504388809204, "step": 680}
{"train_info/time_between_train_steps": 0.005307435989379883, "step": 680}
{"info/global_step": 681, "train_info/time_within_train_step": 27.85242533683777, "step": 681}
{"train_info/time_between_train_steps": 0.005267143249511719, "step": 681}
{"info/global_step": 682, "train_info/time_within_train_step": 27.85489511489868, "step": 682}
{"train_info/time_between_train_steps": 0.005684375762939453, "step": 682}
{"info/global_step": 683, "train_info/time_within_train_step": 27.880486726760864, "step": 683}
{"train_info/time_between_train_steps": 0.005312681198120117, "step": 683}
{"info/global_step": 684, "train_info/time_within_train_step": 27.866594791412354, "step": 684}
{"train_info/time_between_train_steps": 0.009598493576049805, "step": 684}
{"info/global_step": 685, "train_info/time_within_train_step": 27.86707615852356, "step": 685}
{"train_info/time_between_train_steps": 0.005392789840698242, "step": 685}
{"info/global_step": 686, "train_info/time_within_train_step": 27.948904275894165, "step": 686}
{"train_info/time_between_train_steps": 0.010075807571411133, "step": 686}
{"info/global_step": 687, "train_info/time_within_train_step": 27.854478120803833, "step": 687}
{"train_info/time_between_train_steps": 0.005673408508300781, "step": 687}
{"info/global_step": 688, "train_info/time_within_train_step": 27.850605964660645, "step": 688}
{"train_info/time_between_train_steps": 0.009410381317138672, "step": 688}
{"info/global_step": 689, "train_info/time_within_train_step": 27.879457473754883, "step": 689}
{"train_info/time_between_train_steps": 0.005396366119384766, "step": 689}
{"info/global_step": 690, "train_info/time_within_train_step": 27.856611251831055, "step": 690}
{"train_info/time_between_train_steps": 0.010206937789916992, "step": 690}
{"info/global_step": 691, "train_info/time_within_train_step": 27.816641092300415, "step": 691}
{"train_info/time_between_train_steps": 0.0052869319915771484, "step": 691}
{"info/global_step": 692, "train_info/time_within_train_step": 27.89573836326599, "step": 692}
{"train_info/time_between_train_steps": 0.01099085807800293, "step": 692}
{"info/global_step": 693, "train_info/time_within_train_step": 27.881745100021362, "step": 693}
{"train_info/time_between_train_steps": 0.005259513854980469, "step": 693}
{"info/global_step": 694, "train_info/time_within_train_step": 27.905223846435547, "step": 694}
{"train_info/time_between_train_steps": 0.005930423736572266, "step": 694}
{"info/global_step": 695, "train_info/time_within_train_step": 27.936837434768677, "step": 695}
{"train_info/time_between_train_steps": 0.005639076232910156, "step": 695}
{"info/global_step": 696, "train_info/time_within_train_step": 27.969319343566895, "step": 696}
{"train_info/time_between_train_steps": 0.005949974060058594, "step": 696}
{"train_info/time_between_train_steps": 5.299138069152832, "step": 696}
{"info/global_step": 697, "train_info/time_within_train_step": 27.832470655441284, "step": 697}
{"train_info/time_between_train_steps": 0.005220651626586914, "step": 697}
{"info/global_step": 698, "train_info/time_within_train_step": 28.041288375854492, "step": 698}
{"train_info/time_between_train_steps": 0.0051691532135009766, "step": 698}
{"info/global_step": 699, "train_info/time_within_train_step": 27.842570304870605, "step": 699}
{"train_info/time_between_train_steps": 0.009353160858154297, "step": 699}
{"info/global_step": 700, "train_info/time_within_train_step": 27.95538091659546, "step": 700}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22648.0, "train_info/memory_max_reserved": 22648.0, "_timestamp": 1733882042, "_runtime": 20354}, "step": 700}
{"logs": {"train/loss": 4.3476, "train/learning_rate": 0.0002777777777777778, "train/epoch": 29.0, "_timestamp": 1733882042, "_runtime": 20354}, "step": 700}
{"train_info/time_between_train_steps": 2.894319772720337, "step": 700}
{"info/global_step": 701, "train_info/time_within_train_step": 27.97170376777649, "step": 701}
{"train_info/time_between_train_steps": 0.005122661590576172, "step": 701}
{"info/global_step": 702, "train_info/time_within_train_step": 27.963645458221436, "step": 702}
{"train_info/time_between_train_steps": 0.013430356979370117, "step": 702}
{"info/global_step": 703, "train_info/time_within_train_step": 27.84221625328064, "step": 703}
{"train_info/time_between_train_steps": 0.005458354949951172, "step": 703}
{"info/global_step": 704, "train_info/time_within_train_step": 27.867116928100586, "step": 704}
{"train_info/time_between_train_steps": 0.014849662780761719, "step": 704}
{"info/global_step": 705, "train_info/time_within_train_step": 27.890214681625366, "step": 705}
{"train_info/time_between_train_steps": 0.005322456359863281, "step": 705}
{"info/global_step": 706, "train_info/time_within_train_step": 27.86959671974182, "step": 706}
{"train_info/time_between_train_steps": 0.0053558349609375, "step": 706}
{"info/global_step": 707, "train_info/time_within_train_step": 27.83532190322876, "step": 707}
{"train_info/time_between_train_steps": 0.005261421203613281, "step": 707}
{"info/global_step": 708, "train_info/time_within_train_step": 27.85789155960083, "step": 708}
{"train_info/time_between_train_steps": 0.0054051876068115234, "step": 708}
{"info/global_step": 709, "train_info/time_within_train_step": 27.859711408615112, "step": 709}
{"train_info/time_between_train_steps": 0.005505084991455078, "step": 709}
{"info/global_step": 710, "train_info/time_within_train_step": 27.83241868019104, "step": 710}
{"train_info/time_between_train_steps": 0.0053615570068359375, "step": 710}
{"info/global_step": 711, "train_info/time_within_train_step": 27.8771390914917, "step": 711}
{"train_info/time_between_train_steps": 0.00545191764831543, "step": 711}
{"info/global_step": 712, "train_info/time_within_train_step": 27.899548292160034, "step": 712}
{"train_info/time_between_train_steps": 0.0054662227630615234, "step": 712}
{"info/global_step": 713, "train_info/time_within_train_step": 27.864492654800415, "step": 713}
{"train_info/time_between_train_steps": 0.005400896072387695, "step": 713}
{"info/global_step": 714, "train_info/time_within_train_step": 27.828548192977905, "step": 714}
{"train_info/time_between_train_steps": 0.005742549896240234, "step": 714}
{"info/global_step": 715, "train_info/time_within_train_step": 27.863619565963745, "step": 715}
{"train_info/time_between_train_steps": 0.009663581848144531, "step": 715}
{"info/global_step": 716, "train_info/time_within_train_step": 27.942336082458496, "step": 716}
{"train_info/time_between_train_steps": 0.005761384963989258, "step": 716}
{"info/global_step": 717, "train_info/time_within_train_step": 28.023338794708252, "step": 717}
{"train_info/time_between_train_steps": 0.005545377731323242, "step": 717}
{"info/global_step": 718, "train_info/time_within_train_step": 27.887366771697998, "step": 718}
{"train_info/time_between_train_steps": 0.005745410919189453, "step": 718}
{"info/global_step": 719, "train_info/time_within_train_step": 27.91116499900818, "step": 719}
{"train_info/time_between_train_steps": 0.005788326263427734, "step": 719}
{"info/global_step": 720, "train_info/time_within_train_step": 27.967403411865234, "step": 720}
{"train_info/time_between_train_steps": 0.005941629409790039, "step": 720}
{"train_info/time_between_train_steps": 5.477025270462036, "step": 720}
{"info/global_step": 721, "train_info/time_within_train_step": 27.928735971450806, "step": 721}
{"train_info/time_between_train_steps": 0.005128383636474609, "step": 721}
{"info/global_step": 722, "train_info/time_within_train_step": 28.049934148788452, "step": 722}
{"train_info/time_between_train_steps": 0.005548238754272461, "step": 722}
{"info/global_step": 723, "train_info/time_within_train_step": 27.867759943008423, "step": 723}
{"train_info/time_between_train_steps": 0.005232095718383789, "step": 723}
{"info/global_step": 724, "train_info/time_within_train_step": 27.958215713500977, "step": 724}
{"train_info/time_between_train_steps": 0.010283708572387695, "step": 724}
{"info/global_step": 725, "train_info/time_within_train_step": 27.838098526000977, "step": 725}
{"train_info/time_between_train_steps": 0.008843421936035156, "step": 725}
{"info/global_step": 726, "train_info/time_within_train_step": 28.03019952774048, "step": 726}
{"train_info/time_between_train_steps": 0.005263090133666992, "step": 726}
{"info/global_step": 727, "train_info/time_within_train_step": 27.922576904296875, "step": 727}
{"train_info/time_between_train_steps": 0.00530242919921875, "step": 727}
{"info/global_step": 728, "train_info/time_within_train_step": 27.81952452659607, "step": 728}
{"train_info/time_between_train_steps": 0.005249500274658203, "step": 728}
{"info/global_step": 729, "train_info/time_within_train_step": 27.86084794998169, "step": 729}
{"train_info/time_between_train_steps": 0.00553584098815918, "step": 729}
{"info/global_step": 730, "train_info/time_within_train_step": 27.873020887374878, "step": 730}
{"train_info/time_between_train_steps": 0.010323286056518555, "step": 730}
{"info/global_step": 731, "train_info/time_within_train_step": 27.86635661125183, "step": 731}
{"train_info/time_between_train_steps": 0.009994983673095703, "step": 731}
{"info/global_step": 732, "train_info/time_within_train_step": 27.869921445846558, "step": 732}
{"train_info/time_between_train_steps": 0.005424022674560547, "step": 732}
{"info/global_step": 733, "train_info/time_within_train_step": 27.96374249458313, "step": 733}
{"train_info/time_between_train_steps": 0.00825810432434082, "step": 733}
{"info/global_step": 734, "train_info/time_within_train_step": 27.971956729888916, "step": 734}
{"train_info/time_between_train_steps": 0.009534835815429688, "step": 734}
{"info/global_step": 735, "train_info/time_within_train_step": 27.848340272903442, "step": 735}
{"train_info/time_between_train_steps": 0.011820554733276367, "step": 735}
{"info/global_step": 736, "train_info/time_within_train_step": 27.863386631011963, "step": 736}
{"train_info/time_between_train_steps": 0.005312919616699219, "step": 736}
{"info/global_step": 737, "train_info/time_within_train_step": 27.89184880256653, "step": 737}
{"train_info/time_between_train_steps": 0.008439779281616211, "step": 737}
{"info/global_step": 738, "train_info/time_within_train_step": 27.89066457748413, "step": 738}
{"train_info/time_between_train_steps": 0.0051767826080322266, "step": 738}
{"info/global_step": 739, "train_info/time_within_train_step": 27.878474712371826, "step": 739}
{"train_info/time_between_train_steps": 0.00537419319152832, "step": 739}
{"info/global_step": 740, "train_info/time_within_train_step": 27.918630123138428, "step": 740}
{"train_info/time_between_train_steps": 0.014837503433227539, "step": 740}
{"info/global_step": 741, "train_info/time_within_train_step": 27.868849992752075, "step": 741}
{"train_info/time_between_train_steps": 0.0053942203521728516, "step": 741}
{"info/global_step": 742, "train_info/time_within_train_step": 27.92979669570923, "step": 742}
{"train_info/time_between_train_steps": 0.006720304489135742, "step": 742}
{"info/global_step": 743, "train_info/time_within_train_step": 27.953426361083984, "step": 743}
{"train_info/time_between_train_steps": 0.00989675521850586, "step": 743}
{"info/global_step": 744, "train_info/time_within_train_step": 27.905426502227783, "step": 744}
{"train_info/time_between_train_steps": 0.006106853485107422, "step": 744}
{"train_info/time_between_train_steps": 5.212895631790161, "step": 744}
{"info/global_step": 745, "train_info/time_within_train_step": 27.943410396575928, "step": 745}
{"train_info/time_between_train_steps": 0.005742073059082031, "step": 745}
{"info/global_step": 746, "train_info/time_within_train_step": 28.070550680160522, "step": 746}
{"train_info/time_between_train_steps": 0.0053234100341796875, "step": 746}
{"info/global_step": 747, "train_info/time_within_train_step": 27.933279752731323, "step": 747}
{"train_info/time_between_train_steps": 0.005614280700683594, "step": 747}
{"info/global_step": 748, "train_info/time_within_train_step": 28.059388399124146, "step": 748}
{"train_info/time_between_train_steps": 0.0075206756591796875, "step": 748}
{"info/global_step": 749, "train_info/time_within_train_step": 27.876919746398926, "step": 749}
{"train_info/time_between_train_steps": 0.01029348373413086, "step": 749}
{"info/global_step": 750, "train_info/time_within_train_step": 27.832568407058716, "step": 750}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22648.0, "train_info/memory_max_reserved": 22648.0, "_timestamp": 1733883451, "_runtime": 21763}, "step": 750}
{"logs": {"train/loss": 4.2499, "train/learning_rate": 0.00025, "train/epoch": 31.0, "_timestamp": 1733883451, "_runtime": 21763}, "step": 750}
{"train_info/time_between_train_steps": 0.0072934627532958984, "step": 750}
{"info/global_step": 751, "train_info/time_within_train_step": 27.857545137405396, "step": 751}
{"train_info/time_between_train_steps": 0.005162477493286133, "step": 751}
{"info/global_step": 752, "train_info/time_within_train_step": 27.834912538528442, "step": 752}
{"train_info/time_between_train_steps": 0.0052471160888671875, "step": 752}
{"info/global_step": 753, "train_info/time_within_train_step": 27.934590101242065, "step": 753}
{"train_info/time_between_train_steps": 0.006592273712158203, "step": 753}
{"info/global_step": 754, "train_info/time_within_train_step": 27.857612371444702, "step": 754}
{"train_info/time_between_train_steps": 0.005227565765380859, "step": 754}
{"info/global_step": 755, "train_info/time_within_train_step": 27.91248846054077, "step": 755}
{"train_info/time_between_train_steps": 0.005403041839599609, "step": 755}
{"info/global_step": 756, "train_info/time_within_train_step": 27.85490083694458, "step": 756}
{"train_info/time_between_train_steps": 0.010051250457763672, "step": 756}
{"info/global_step": 757, "train_info/time_within_train_step": 27.881808042526245, "step": 757}
{"train_info/time_between_train_steps": 0.010099172592163086, "step": 757}
{"info/global_step": 758, "train_info/time_within_train_step": 27.91795063018799, "step": 758}
{"train_info/time_between_train_steps": 0.005520820617675781, "step": 758}
{"info/global_step": 759, "train_info/time_within_train_step": 27.9602370262146, "step": 759}
{"train_info/time_between_train_steps": 0.009317636489868164, "step": 759}
{"info/global_step": 760, "train_info/time_within_train_step": 27.932271718978882, "step": 760}
{"train_info/time_between_train_steps": 0.010860443115234375, "step": 760}
{"info/global_step": 761, "train_info/time_within_train_step": 27.96569061279297, "step": 761}
{"train_info/time_between_train_steps": 0.01341104507446289, "step": 761}
{"info/global_step": 762, "train_info/time_within_train_step": 27.93411898612976, "step": 762}
{"train_info/time_between_train_steps": 0.010379552841186523, "step": 762}
{"info/global_step": 763, "train_info/time_within_train_step": 27.84468364715576, "step": 763}
{"train_info/time_between_train_steps": 0.010996103286743164, "step": 763}
{"info/global_step": 764, "train_info/time_within_train_step": 27.969399213790894, "step": 764}
{"train_info/time_between_train_steps": 0.0055010318756103516, "step": 764}
{"info/global_step": 765, "train_info/time_within_train_step": 27.884066581726074, "step": 765}
{"train_info/time_between_train_steps": 0.0054187774658203125, "step": 765}
{"info/global_step": 766, "train_info/time_within_train_step": 27.933112859725952, "step": 766}
{"train_info/time_between_train_steps": 0.010654449462890625, "step": 766}
{"info/global_step": 767, "train_info/time_within_train_step": 27.856878995895386, "step": 767}
{"train_info/time_between_train_steps": 0.006348371505737305, "step": 767}
{"info/global_step": 768, "train_info/time_within_train_step": 27.92731261253357, "step": 768}
{"train_info/time_between_train_steps": 0.006208896636962891, "step": 768}
{"train_info/time_between_train_steps": 5.409374713897705, "step": 768}
{"info/global_step": 769, "train_info/time_within_train_step": 27.88438105583191, "step": 769}
{"train_info/time_between_train_steps": 0.0056574344635009766, "step": 769}
{"info/global_step": 770, "train_info/time_within_train_step": 28.048359870910645, "step": 770}
{"train_info/time_between_train_steps": 0.008373022079467773, "step": 770}
{"info/global_step": 771, "train_info/time_within_train_step": 27.89099645614624, "step": 771}
{"train_info/time_between_train_steps": 0.005343437194824219, "step": 771}
{"info/global_step": 772, "train_info/time_within_train_step": 27.918737411499023, "step": 772}
{"train_info/time_between_train_steps": 0.005456447601318359, "step": 772}
{"info/global_step": 773, "train_info/time_within_train_step": 27.975944757461548, "step": 773}
{"train_info/time_between_train_steps": 0.0052411556243896484, "step": 773}
{"info/global_step": 774, "train_info/time_within_train_step": 27.828519582748413, "step": 774}
{"train_info/time_between_train_steps": 0.009424448013305664, "step": 774}
{"info/global_step": 775, "train_info/time_within_train_step": 27.888432264328003, "step": 775}
{"train_info/time_between_train_steps": 0.005304813385009766, "step": 775}
{"info/global_step": 776, "train_info/time_within_train_step": 27.863325357437134, "step": 776}
{"train_info/time_between_train_steps": 0.019701242446899414, "step": 776}
{"info/global_step": 777, "train_info/time_within_train_step": 27.86982536315918, "step": 777}
{"train_info/time_between_train_steps": 0.005448341369628906, "step": 777}
{"info/global_step": 778, "train_info/time_within_train_step": 27.82927107810974, "step": 778}
{"train_info/time_between_train_steps": 0.0052759647369384766, "step": 778}
{"info/global_step": 779, "train_info/time_within_train_step": 28.01047158241272, "step": 779}
{"train_info/time_between_train_steps": 0.006181240081787109, "step": 779}
{"info/global_step": 780, "train_info/time_within_train_step": 27.81373620033264, "step": 780}
{"train_info/time_between_train_steps": 0.010245084762573242, "step": 780}
{"info/global_step": 781, "train_info/time_within_train_step": 27.889512062072754, "step": 781}
{"train_info/time_between_train_steps": 0.005410671234130859, "step": 781}
{"info/global_step": 782, "train_info/time_within_train_step": 27.905481815338135, "step": 782}
{"train_info/time_between_train_steps": 0.009799003601074219, "step": 782}
{"info/global_step": 783, "train_info/time_within_train_step": 27.887949466705322, "step": 783}
{"train_info/time_between_train_steps": 0.010118246078491211, "step": 783}
{"info/global_step": 784, "train_info/time_within_train_step": 27.87034273147583, "step": 784}
{"train_info/time_between_train_steps": 0.005460500717163086, "step": 784}
{"info/global_step": 785, "train_info/time_within_train_step": 27.845494747161865, "step": 785}
{"train_info/time_between_train_steps": 0.005574941635131836, "step": 785}
{"info/global_step": 786, "train_info/time_within_train_step": 27.85550856590271, "step": 786}
{"train_info/time_between_train_steps": 0.005370616912841797, "step": 786}
{"info/global_step": 787, "train_info/time_within_train_step": 27.862098932266235, "step": 787}
{"train_info/time_between_train_steps": 0.00519871711730957, "step": 787}
{"info/global_step": 788, "train_info/time_within_train_step": 27.86797547340393, "step": 788}
{"train_info/time_between_train_steps": 0.005776643753051758, "step": 788}
{"info/global_step": 789, "train_info/time_within_train_step": 27.84992265701294, "step": 789}
{"train_info/time_between_train_steps": 0.005273103713989258, "step": 789}
{"info/global_step": 790, "train_info/time_within_train_step": 27.901424407958984, "step": 790}
{"train_info/time_between_train_steps": 0.005642414093017578, "step": 790}
{"info/global_step": 791, "train_info/time_within_train_step": 27.887646198272705, "step": 791}
{"train_info/time_between_train_steps": 0.005697488784790039, "step": 791}
{"info/global_step": 792, "train_info/time_within_train_step": 27.908438444137573, "step": 792}
{"train_info/time_between_train_steps": 0.006121158599853516, "step": 792}
{"train_info/time_between_train_steps": 5.583119630813599, "step": 792}
{"info/global_step": 793, "train_info/time_within_train_step": 27.9321129322052, "step": 793}
{"train_info/time_between_train_steps": 0.005574226379394531, "step": 793}
{"info/global_step": 794, "train_info/time_within_train_step": 28.02779269218445, "step": 794}
{"train_info/time_between_train_steps": 0.010422468185424805, "step": 794}
{"info/global_step": 795, "train_info/time_within_train_step": 28.07706332206726, "step": 795}
{"train_info/time_between_train_steps": 0.005431652069091797, "step": 795}
{"info/global_step": 796, "train_info/time_within_train_step": 27.99479055404663, "step": 796}
{"train_info/time_between_train_steps": 0.010009527206420898, "step": 796}
{"info/global_step": 797, "train_info/time_within_train_step": 27.875941514968872, "step": 797}
{"train_info/time_between_train_steps": 0.009826421737670898, "step": 797}
{"info/global_step": 798, "train_info/time_within_train_step": 27.81486940383911, "step": 798}
{"train_info/time_between_train_steps": 0.005196809768676758, "step": 798}
{"info/global_step": 799, "train_info/time_within_train_step": 27.92206048965454, "step": 799}
{"train_info/time_between_train_steps": 0.0056955814361572266, "step": 799}
{"info/global_step": 800, "train_info/time_within_train_step": 27.945321798324585, "step": 800}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22648.0, "train_info/memory_max_reserved": 22648.0, "_timestamp": 1733884858, "_runtime": 23170}, "step": 800}
{"logs": {"train/loss": 4.1602, "train/learning_rate": 0.00022222222222222218, "train/epoch": 33.01, "_timestamp": 1733884858, "_runtime": 23170}, "step": 800}
{"train_info/time_between_train_steps": 2.856712818145752, "step": 800}
{"info/global_step": 801, "train_info/time_within_train_step": 27.883622407913208, "step": 801}
{"train_info/time_between_train_steps": 0.010210514068603516, "step": 801}
{"info/global_step": 802, "train_info/time_within_train_step": 27.86180806159973, "step": 802}
{"train_info/time_between_train_steps": 0.005268096923828125, "step": 802}
{"info/global_step": 803, "train_info/time_within_train_step": 27.82466983795166, "step": 803}
{"train_info/time_between_train_steps": 0.005328655242919922, "step": 803}
{"info/global_step": 804, "train_info/time_within_train_step": 27.841315269470215, "step": 804}
{"train_info/time_between_train_steps": 0.0055658817291259766, "step": 804}
{"info/global_step": 805, "train_info/time_within_train_step": 27.815061330795288, "step": 805}
{"train_info/time_between_train_steps": 0.005221128463745117, "step": 805}
{"info/global_step": 806, "train_info/time_within_train_step": 27.87323260307312, "step": 806}
{"train_info/time_between_train_steps": 0.005598306655883789, "step": 806}
{"info/global_step": 807, "train_info/time_within_train_step": 27.858259201049805, "step": 807}
{"train_info/time_between_train_steps": 0.005509376525878906, "step": 807}
{"info/global_step": 808, "train_info/time_within_train_step": 27.866678714752197, "step": 808}
{"train_info/time_between_train_steps": 0.011636972427368164, "step": 808}
{"info/global_step": 809, "train_info/time_within_train_step": 27.925782918930054, "step": 809}
{"train_info/time_between_train_steps": 0.0053369998931884766, "step": 809}
{"info/global_step": 810, "train_info/time_within_train_step": 28.003788471221924, "step": 810}
{"train_info/time_between_train_steps": 0.005316734313964844, "step": 810}
{"info/global_step": 811, "train_info/time_within_train_step": 27.91982889175415, "step": 811}
{"train_info/time_between_train_steps": 0.009908676147460938, "step": 811}
{"info/global_step": 812, "train_info/time_within_train_step": 27.854879140853882, "step": 812}
{"train_info/time_between_train_steps": 0.009664535522460938, "step": 812}
{"info/global_step": 813, "train_info/time_within_train_step": 27.91584825515747, "step": 813}
{"train_info/time_between_train_steps": 0.006469249725341797, "step": 813}
{"info/global_step": 814, "train_info/time_within_train_step": 27.832855701446533, "step": 814}
{"train_info/time_between_train_steps": 0.0059909820556640625, "step": 814}
{"info/global_step": 815, "train_info/time_within_train_step": 27.992600202560425, "step": 815}
{"train_info/time_between_train_steps": 0.0058078765869140625, "step": 815}
{"info/global_step": 816, "train_info/time_within_train_step": 27.886504411697388, "step": 816}
{"train_info/time_between_train_steps": 0.006314992904663086, "step": 816}
{"train_info/time_between_train_steps": 5.055109739303589, "step": 816}
{"info/global_step": 817, "train_info/time_within_train_step": 27.866954565048218, "step": 817}
{"train_info/time_between_train_steps": 0.005156517028808594, "step": 817}
{"info/global_step": 818, "train_info/time_within_train_step": 28.01647639274597, "step": 818}
{"train_info/time_between_train_steps": 0.005446195602416992, "step": 818}
{"info/global_step": 819, "train_info/time_within_train_step": 27.96556568145752, "step": 819}
{"train_info/time_between_train_steps": 0.005622148513793945, "step": 819}
{"info/global_step": 820, "train_info/time_within_train_step": 27.945469617843628, "step": 820}
{"train_info/time_between_train_steps": 0.0056915283203125, "step": 820}
{"info/global_step": 821, "train_info/time_within_train_step": 27.88659358024597, "step": 821}
{"train_info/time_between_train_steps": 0.005565643310546875, "step": 821}
{"info/global_step": 822, "train_info/time_within_train_step": 27.867566108703613, "step": 822}
{"train_info/time_between_train_steps": 0.01445913314819336, "step": 822}
{"info/global_step": 823, "train_info/time_within_train_step": 27.87318253517151, "step": 823}
{"train_info/time_between_train_steps": 0.00535273551940918, "step": 823}
{"info/global_step": 824, "train_info/time_within_train_step": 27.916833639144897, "step": 824}
{"train_info/time_between_train_steps": 0.01334524154663086, "step": 824}
{"info/global_step": 825, "train_info/time_within_train_step": 27.860329627990723, "step": 825}
{"train_info/time_between_train_steps": 0.005523204803466797, "step": 825}
{"info/global_step": 826, "train_info/time_within_train_step": 27.956284046173096, "step": 826}
{"train_info/time_between_train_steps": 0.010099649429321289, "step": 826}
{"info/global_step": 827, "train_info/time_within_train_step": 27.849488735198975, "step": 827}
{"train_info/time_between_train_steps": 0.0053904056549072266, "step": 827}
{"info/global_step": 828, "train_info/time_within_train_step": 27.854365587234497, "step": 828}
{"train_info/time_between_train_steps": 0.011330604553222656, "step": 828}
{"info/global_step": 829, "train_info/time_within_train_step": 27.8541579246521, "step": 829}
{"train_info/time_between_train_steps": 0.0071141719818115234, "step": 829}
{"info/global_step": 830, "train_info/time_within_train_step": 27.892338037490845, "step": 830}
{"train_info/time_between_train_steps": 0.0055408477783203125, "step": 830}
{"info/global_step": 831, "train_info/time_within_train_step": 27.898076057434082, "step": 831}
{"train_info/time_between_train_steps": 0.005829811096191406, "step": 831}
{"info/global_step": 832, "train_info/time_within_train_step": 27.874744415283203, "step": 832}
{"train_info/time_between_train_steps": 0.005541801452636719, "step": 832}
{"info/global_step": 833, "train_info/time_within_train_step": 27.888389110565186, "step": 833}
{"train_info/time_between_train_steps": 0.01053619384765625, "step": 833}
{"info/global_step": 834, "train_info/time_within_train_step": 27.89982581138611, "step": 834}
{"train_info/time_between_train_steps": 0.010380983352661133, "step": 834}
{"info/global_step": 835, "train_info/time_within_train_step": 27.894134044647217, "step": 835}
{"train_info/time_between_train_steps": 0.005674839019775391, "step": 835}
{"info/global_step": 836, "train_info/time_within_train_step": 27.866823434829712, "step": 836}
{"train_info/time_between_train_steps": 0.0060307979583740234, "step": 836}
{"info/global_step": 837, "train_info/time_within_train_step": 27.890435695648193, "step": 837}
{"train_info/time_between_train_steps": 0.00531768798828125, "step": 837}
{"info/global_step": 838, "train_info/time_within_train_step": 27.914138317108154, "step": 838}
{"train_info/time_between_train_steps": 0.006368160247802734, "step": 838}
{"info/global_step": 839, "train_info/time_within_train_step": 27.904123544692993, "step": 839}
{"train_info/time_between_train_steps": 0.006043910980224609, "step": 839}
{"info/global_step": 840, "train_info/time_within_train_step": 27.89624571800232, "step": 840}
{"train_info/time_between_train_steps": 0.005858659744262695, "step": 840}
{"train_info/time_between_train_steps": 5.2123870849609375, "step": 840}
{"info/global_step": 841, "train_info/time_within_train_step": 27.913843393325806, "step": 841}
{"train_info/time_between_train_steps": 0.0059795379638671875, "step": 841}
{"info/global_step": 842, "train_info/time_within_train_step": 28.356560945510864, "step": 842}
{"train_info/time_between_train_steps": 0.011049747467041016, "step": 842}
{"info/global_step": 843, "train_info/time_within_train_step": 27.864521265029907, "step": 843}
{"train_info/time_between_train_steps": 0.00561833381652832, "step": 843}
{"info/global_step": 844, "train_info/time_within_train_step": 27.929980516433716, "step": 844}
{"train_info/time_between_train_steps": 0.0063550472259521484, "step": 844}
{"info/global_step": 845, "train_info/time_within_train_step": 27.919150590896606, "step": 845}
{"train_info/time_between_train_steps": 0.00543665885925293, "step": 845}
{"info/global_step": 846, "train_info/time_within_train_step": 27.896425247192383, "step": 846}
{"train_info/time_between_train_steps": 0.009620428085327148, "step": 846}
{"info/global_step": 847, "train_info/time_within_train_step": 27.87555956840515, "step": 847}
{"train_info/time_between_train_steps": 0.005321502685546875, "step": 847}
{"info/global_step": 848, "train_info/time_within_train_step": 27.80702829360962, "step": 848}
{"train_info/time_between_train_steps": 0.0053670406341552734, "step": 848}
{"info/global_step": 849, "train_info/time_within_train_step": 27.804544925689697, "step": 849}
{"train_info/time_between_train_steps": 0.005560874938964844, "step": 849}
{"info/global_step": 850, "train_info/time_within_train_step": 27.844847202301025, "step": 850}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22648.0, "train_info/memory_max_reserved": 22648.0, "_timestamp": 1733886266, "_runtime": 24578}, "step": 850}
{"logs": {"train/loss": 4.0822, "train/learning_rate": 0.00019444444444444443, "train/epoch": 35.01, "_timestamp": 1733886266, "_runtime": 24578}, "step": 850}
{"train_info/time_between_train_steps": 0.008715391159057617, "step": 850}
{"info/global_step": 851, "train_info/time_within_train_step": 27.872763872146606, "step": 851}
{"train_info/time_between_train_steps": 0.0057337284088134766, "step": 851}
{"info/global_step": 852, "train_info/time_within_train_step": 27.913955450057983, "step": 852}
{"train_info/time_between_train_steps": 0.005682468414306641, "step": 852}
{"info/global_step": 853, "train_info/time_within_train_step": 27.885173797607422, "step": 853}
{"train_info/time_between_train_steps": 0.005443096160888672, "step": 853}
{"info/global_step": 854, "train_info/time_within_train_step": 27.87550449371338, "step": 854}
{"train_info/time_between_train_steps": 0.005412578582763672, "step": 854}
{"info/global_step": 855, "train_info/time_within_train_step": 27.89293122291565, "step": 855}
{"train_info/time_between_train_steps": 0.0056154727935791016, "step": 855}
{"info/global_step": 856, "train_info/time_within_train_step": 28.025326251983643, "step": 856}
{"train_info/time_between_train_steps": 0.005723237991333008, "step": 856}
{"info/global_step": 857, "train_info/time_within_train_step": 27.968424797058105, "step": 857}
{"train_info/time_between_train_steps": 0.005353450775146484, "step": 857}
{"info/global_step": 858, "train_info/time_within_train_step": 27.907056093215942, "step": 858}
{"train_info/time_between_train_steps": 0.005520343780517578, "step": 858}
{"info/global_step": 859, "train_info/time_within_train_step": 27.83943009376526, "step": 859}
{"train_info/time_between_train_steps": 0.005416393280029297, "step": 859}
{"info/global_step": 860, "train_info/time_within_train_step": 27.956836700439453, "step": 860}
{"train_info/time_between_train_steps": 0.005898475646972656, "step": 860}
{"info/global_step": 861, "train_info/time_within_train_step": 27.90471315383911, "step": 861}
{"train_info/time_between_train_steps": 0.00586390495300293, "step": 861}
{"info/global_step": 862, "train_info/time_within_train_step": 27.879387855529785, "step": 862}
{"train_info/time_between_train_steps": 0.005524158477783203, "step": 862}
{"info/global_step": 863, "train_info/time_within_train_step": 27.867449522018433, "step": 863}
{"train_info/time_between_train_steps": 0.0068089962005615234, "step": 863}
{"info/global_step": 864, "train_info/time_within_train_step": 27.886305570602417, "step": 864}
{"train_info/time_between_train_steps": 0.01122283935546875, "step": 864}
{"train_info/time_between_train_steps": 5.387828826904297, "step": 864}
{"info/global_step": 865, "train_info/time_within_train_step": 27.889748096466064, "step": 865}
{"train_info/time_between_train_steps": 0.0058650970458984375, "step": 865}
{"info/global_step": 866, "train_info/time_within_train_step": 28.057335138320923, "step": 866}
{"train_info/time_between_train_steps": 0.005793333053588867, "step": 866}
{"info/global_step": 867, "train_info/time_within_train_step": 27.950927734375, "step": 867}
{"train_info/time_between_train_steps": 0.006034374237060547, "step": 867}
{"info/global_step": 868, "train_info/time_within_train_step": 27.952280282974243, "step": 868}
{"train_info/time_between_train_steps": 0.0062236785888671875, "step": 868}
{"info/global_step": 869, "train_info/time_within_train_step": 27.96891140937805, "step": 869}
{"train_info/time_between_train_steps": 0.005426645278930664, "step": 869}
{"info/global_step": 870, "train_info/time_within_train_step": 27.82170271873474, "step": 870}
{"train_info/time_between_train_steps": 0.005269765853881836, "step": 870}
{"info/global_step": 871, "train_info/time_within_train_step": 27.86750102043152, "step": 871}
{"train_info/time_between_train_steps": 0.0055255889892578125, "step": 871}
{"info/global_step": 872, "train_info/time_within_train_step": 27.925307512283325, "step": 872}
{"train_info/time_between_train_steps": 0.0057430267333984375, "step": 872}
{"info/global_step": 873, "train_info/time_within_train_step": 28.0738263130188, "step": 873}
{"train_info/time_between_train_steps": 0.005604982376098633, "step": 873}
{"info/global_step": 874, "train_info/time_within_train_step": 28.023247718811035, "step": 874}
{"train_info/time_between_train_steps": 0.011282205581665039, "step": 874}
{"info/global_step": 875, "train_info/time_within_train_step": 27.98322868347168, "step": 875}
{"train_info/time_between_train_steps": 0.005761384963989258, "step": 875}
{"info/global_step": 876, "train_info/time_within_train_step": 27.981420278549194, "step": 876}
{"train_info/time_between_train_steps": 0.006268024444580078, "step": 876}
{"info/global_step": 877, "train_info/time_within_train_step": 27.93537163734436, "step": 877}
{"train_info/time_between_train_steps": 0.00609588623046875, "step": 877}
{"info/global_step": 878, "train_info/time_within_train_step": 27.94768261909485, "step": 878}
{"train_info/time_between_train_steps": 0.005653858184814453, "step": 878}
{"info/global_step": 879, "train_info/time_within_train_step": 27.90947914123535, "step": 879}
{"train_info/time_between_train_steps": 0.00923013687133789, "step": 879}
{"info/global_step": 880, "train_info/time_within_train_step": 27.938187837600708, "step": 880}
{"train_info/time_between_train_steps": 0.010868310928344727, "step": 880}
{"info/global_step": 881, "train_info/time_within_train_step": 27.99759531021118, "step": 881}
{"train_info/time_between_train_steps": 0.0061130523681640625, "step": 881}
{"info/global_step": 882, "train_info/time_within_train_step": 28.007490634918213, "step": 882}
{"train_info/time_between_train_steps": 0.006865978240966797, "step": 882}
{"info/global_step": 883, "train_info/time_within_train_step": 28.12627387046814, "step": 883}
{"train_info/time_between_train_steps": 0.012643098831176758, "step": 883}
{"info/global_step": 884, "train_info/time_within_train_step": 27.981439352035522, "step": 884}
{"train_info/time_between_train_steps": 0.007307767868041992, "step": 884}
{"info/global_step": 885, "train_info/time_within_train_step": 27.90947699546814, "step": 885}
{"train_info/time_between_train_steps": 0.006138801574707031, "step": 885}
{"info/global_step": 886, "train_info/time_within_train_step": 27.922860622406006, "step": 886}
{"train_info/time_between_train_steps": 0.005804538726806641, "step": 886}
{"info/global_step": 887, "train_info/time_within_train_step": 27.87931752204895, "step": 887}
{"train_info/time_between_train_steps": 0.00600123405456543, "step": 887}
{"info/global_step": 888, "train_info/time_within_train_step": 28.044672966003418, "step": 888}
{"train_info/time_between_train_steps": 0.015778064727783203, "step": 888}
{"train_info/time_between_train_steps": 5.344126462936401, "step": 888}
{"info/global_step": 889, "train_info/time_within_train_step": 27.876063108444214, "step": 889}
{"train_info/time_between_train_steps": 0.005171298980712891, "step": 889}
{"info/global_step": 890, "train_info/time_within_train_step": 28.000138521194458, "step": 890}
{"train_info/time_between_train_steps": 0.005452394485473633, "step": 890}
{"info/global_step": 891, "train_info/time_within_train_step": 27.84483766555786, "step": 891}
{"train_info/time_between_train_steps": 0.005944728851318359, "step": 891}
{"info/global_step": 892, "train_info/time_within_train_step": 27.940255880355835, "step": 892}
{"train_info/time_between_train_steps": 0.005712270736694336, "step": 892}
{"info/global_step": 893, "train_info/time_within_train_step": 27.899933338165283, "step": 893}
{"train_info/time_between_train_steps": 0.005553007125854492, "step": 893}
{"info/global_step": 894, "train_info/time_within_train_step": 27.820339679718018, "step": 894}
{"train_info/time_between_train_steps": 0.005334138870239258, "step": 894}
{"info/global_step": 895, "train_info/time_within_train_step": 27.865430116653442, "step": 895}
{"train_info/time_between_train_steps": 0.005246400833129883, "step": 895}
{"info/global_step": 896, "train_info/time_within_train_step": 27.80813217163086, "step": 896}
{"train_info/time_between_train_steps": 0.005289554595947266, "step": 896}
{"info/global_step": 897, "train_info/time_within_train_step": 27.915367364883423, "step": 897}
{"train_info/time_between_train_steps": 0.005543947219848633, "step": 897}
{"info/global_step": 898, "train_info/time_within_train_step": 27.848084211349487, "step": 898}
{"train_info/time_between_train_steps": 0.00555872917175293, "step": 898}
{"info/global_step": 899, "train_info/time_within_train_step": 27.826393842697144, "step": 899}
{"train_info/time_between_train_steps": 0.005648374557495117, "step": 899}
{"info/global_step": 900, "train_info/time_within_train_step": 27.91648840904236, "step": 900}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22648.0, "train_info/memory_max_reserved": 22648.0, "_timestamp": 1733887674, "_runtime": 25986}, "step": 900}
{"logs": {"train/loss": 4.0101, "train/learning_rate": 0.00016666666666666666, "train/epoch": 37.01, "_timestamp": 1733887674, "_runtime": 25986}, "step": 900}
{"train_info/time_between_train_steps": 2.9591546058654785, "step": 900}
{"info/global_step": 901, "train_info/time_within_train_step": 27.884081840515137, "step": 901}
{"train_info/time_between_train_steps": 0.010945320129394531, "step": 901}
{"info/global_step": 902, "train_info/time_within_train_step": 27.86406373977661, "step": 902}
{"train_info/time_between_train_steps": 0.00526118278503418, "step": 902}
{"info/global_step": 903, "train_info/time_within_train_step": 27.87629222869873, "step": 903}
{"train_info/time_between_train_steps": 0.011861562728881836, "step": 903}
{"info/global_step": 904, "train_info/time_within_train_step": 27.986878633499146, "step": 904}
{"train_info/time_between_train_steps": 0.010555267333984375, "step": 904}
{"info/global_step": 905, "train_info/time_within_train_step": 27.838485717773438, "step": 905}
{"train_info/time_between_train_steps": 0.005414724349975586, "step": 905}
{"info/global_step": 906, "train_info/time_within_train_step": 27.875592708587646, "step": 906}
{"train_info/time_between_train_steps": 0.005292415618896484, "step": 906}
{"info/global_step": 907, "train_info/time_within_train_step": 27.804466724395752, "step": 907}
{"train_info/time_between_train_steps": 0.005299568176269531, "step": 907}
{"info/global_step": 908, "train_info/time_within_train_step": 27.801083087921143, "step": 908}
{"train_info/time_between_train_steps": 0.00581812858581543, "step": 908}
{"info/global_step": 909, "train_info/time_within_train_step": 27.924331188201904, "step": 909}
{"train_info/time_between_train_steps": 0.0052814483642578125, "step": 909}
{"info/global_step": 910, "train_info/time_within_train_step": 27.825196743011475, "step": 910}
{"train_info/time_between_train_steps": 0.006045341491699219, "step": 910}
{"info/global_step": 911, "train_info/time_within_train_step": 27.840593099594116, "step": 911}
{"train_info/time_between_train_steps": 0.006079435348510742, "step": 911}
{"info/global_step": 912, "train_info/time_within_train_step": 27.888762950897217, "step": 912}
{"train_info/time_between_train_steps": 0.006135702133178711, "step": 912}
{"train_info/time_between_train_steps": 5.085971117019653, "step": 912}
{"info/global_step": 913, "train_info/time_within_train_step": 27.817318201065063, "step": 913}
{"train_info/time_between_train_steps": 0.005024433135986328, "step": 913}
{"info/global_step": 914, "train_info/time_within_train_step": 27.97433114051819, "step": 914}
{"train_info/time_between_train_steps": 0.006505727767944336, "step": 914}
{"info/global_step": 915, "train_info/time_within_train_step": 27.94943904876709, "step": 915}
{"train_info/time_between_train_steps": 0.005566120147705078, "step": 915}
{"info/global_step": 916, "train_info/time_within_train_step": 28.04191303253174, "step": 916}
{"train_info/time_between_train_steps": 0.005540370941162109, "step": 916}
{"info/global_step": 917, "train_info/time_within_train_step": 27.926685333251953, "step": 917}
{"train_info/time_between_train_steps": 0.0052187442779541016, "step": 917}
{"info/global_step": 918, "train_info/time_within_train_step": 27.85184645652771, "step": 918}
{"train_info/time_between_train_steps": 0.00523686408996582, "step": 918}
{"info/global_step": 919, "train_info/time_within_train_step": 27.94430136680603, "step": 919}
{"train_info/time_between_train_steps": 0.005269765853881836, "step": 919}
{"info/global_step": 920, "train_info/time_within_train_step": 27.838752031326294, "step": 920}
{"train_info/time_between_train_steps": 0.005185365676879883, "step": 920}
{"info/global_step": 921, "train_info/time_within_train_step": 27.80368733406067, "step": 921}
{"train_info/time_between_train_steps": 0.0056989192962646484, "step": 921}
{"info/global_step": 922, "train_info/time_within_train_step": 27.8658230304718, "step": 922}
{"train_info/time_between_train_steps": 0.005913972854614258, "step": 922}
{"info/global_step": 923, "train_info/time_within_train_step": 27.876071453094482, "step": 923}
{"train_info/time_between_train_steps": 0.005391359329223633, "step": 923}
{"info/global_step": 924, "train_info/time_within_train_step": 27.842966318130493, "step": 924}
{"train_info/time_between_train_steps": 0.005644083023071289, "step": 924}
{"info/global_step": 925, "train_info/time_within_train_step": 27.826216220855713, "step": 925}
{"train_info/time_between_train_steps": 0.009181022644042969, "step": 925}
{"info/global_step": 926, "train_info/time_within_train_step": 27.84077477455139, "step": 926}
{"train_info/time_between_train_steps": 0.005381107330322266, "step": 926}
{"info/global_step": 927, "train_info/time_within_train_step": 27.917213916778564, "step": 927}
{"train_info/time_between_train_steps": 0.005394697189331055, "step": 927}
{"info/global_step": 928, "train_info/time_within_train_step": 27.82552146911621, "step": 928}
{"train_info/time_between_train_steps": 0.009613513946533203, "step": 928}
{"info/global_step": 929, "train_info/time_within_train_step": 27.828991889953613, "step": 929}
{"train_info/time_between_train_steps": 0.005264997482299805, "step": 929}
{"info/global_step": 930, "train_info/time_within_train_step": 27.84946894645691, "step": 930}
{"train_info/time_between_train_steps": 0.005398750305175781, "step": 930}
{"info/global_step": 931, "train_info/time_within_train_step": 27.903262615203857, "step": 931}
{"train_info/time_between_train_steps": 0.0055963993072509766, "step": 931}
{"info/global_step": 932, "train_info/time_within_train_step": 28.01182794570923, "step": 932}
{"train_info/time_between_train_steps": 0.005692481994628906, "step": 932}
{"info/global_step": 933, "train_info/time_within_train_step": 27.81058621406555, "step": 933}
{"train_info/time_between_train_steps": 0.005754232406616211, "step": 933}
{"info/global_step": 934, "train_info/time_within_train_step": 27.965450048446655, "step": 934}
{"train_info/time_between_train_steps": 0.0070648193359375, "step": 934}
{"info/global_step": 935, "train_info/time_within_train_step": 28.131367444992065, "step": 935}
{"train_info/time_between_train_steps": 0.005963563919067383, "step": 935}
{"info/global_step": 936, "train_info/time_within_train_step": 27.927685976028442, "step": 936}
{"train_info/time_between_train_steps": 0.006070375442504883, "step": 936}
{"train_info/time_between_train_steps": 5.437132835388184, "step": 936}
{"info/global_step": 937, "train_info/time_within_train_step": 27.84115982055664, "step": 937}
{"train_info/time_between_train_steps": 0.0055806636810302734, "step": 937}
{"info/global_step": 938, "train_info/time_within_train_step": 28.006691694259644, "step": 938}
{"train_info/time_between_train_steps": 0.0065898895263671875, "step": 938}
{"info/global_step": 939, "train_info/time_within_train_step": 27.80047607421875, "step": 939}
{"train_info/time_between_train_steps": 0.005469560623168945, "step": 939}
{"info/global_step": 940, "train_info/time_within_train_step": 27.92683696746826, "step": 940}
{"train_info/time_between_train_steps": 0.005613088607788086, "step": 940}
{"info/global_step": 941, "train_info/time_within_train_step": 27.842132806777954, "step": 941}
{"train_info/time_between_train_steps": 0.005785226821899414, "step": 941}
{"info/global_step": 942, "train_info/time_within_train_step": 27.827579021453857, "step": 942}
{"train_info/time_between_train_steps": 0.010230064392089844, "step": 942}
{"info/global_step": 943, "train_info/time_within_train_step": 27.84981632232666, "step": 943}
{"train_info/time_between_train_steps": 0.00640559196472168, "step": 943}
{"info/global_step": 944, "train_info/time_within_train_step": 27.93044900894165, "step": 944}
{"train_info/time_between_train_steps": 0.005368947982788086, "step": 944}
{"info/global_step": 945, "train_info/time_within_train_step": 27.81655263900757, "step": 945}
{"train_info/time_between_train_steps": 0.005617380142211914, "step": 945}
{"info/global_step": 946, "train_info/time_within_train_step": 27.825392484664917, "step": 946}
{"train_info/time_between_train_steps": 0.0053827762603759766, "step": 946}
{"info/global_step": 947, "train_info/time_within_train_step": 27.829052686691284, "step": 947}
{"train_info/time_between_train_steps": 0.0055119991302490234, "step": 947}
{"info/global_step": 948, "train_info/time_within_train_step": 27.929964065551758, "step": 948}
{"train_info/time_between_train_steps": 0.010542869567871094, "step": 948}
{"info/global_step": 949, "train_info/time_within_train_step": 27.88458013534546, "step": 949}
{"train_info/time_between_train_steps": 0.005186557769775391, "step": 949}
{"info/global_step": 950, "train_info/time_within_train_step": 27.85302209854126, "step": 950}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22648.0, "train_info/memory_max_reserved": 22648.0, "_timestamp": 1733889082, "_runtime": 27394}, "step": 950}
{"logs": {"train/loss": 3.9461, "train/learning_rate": 0.0001388888888888889, "train/epoch": 39.01, "_timestamp": 1733889082, "_runtime": 27394}, "step": 950}
{"train_info/time_between_train_steps": 0.007400035858154297, "step": 950}
{"info/global_step": 951, "train_info/time_within_train_step": 27.93006181716919, "step": 951}
{"train_info/time_between_train_steps": 0.005506992340087891, "step": 951}
{"info/global_step": 952, "train_info/time_within_train_step": 27.88629961013794, "step": 952}
{"train_info/time_between_train_steps": 0.009310483932495117, "step": 952}
{"info/global_step": 953, "train_info/time_within_train_step": 27.82680892944336, "step": 953}
{"train_info/time_between_train_steps": 0.005295991897583008, "step": 953}
{"info/global_step": 954, "train_info/time_within_train_step": 27.94121766090393, "step": 954}
{"train_info/time_between_train_steps": 0.018523216247558594, "step": 954}
{"info/global_step": 955, "train_info/time_within_train_step": 27.943815231323242, "step": 955}
{"train_info/time_between_train_steps": 0.005396842956542969, "step": 955}
{"info/global_step": 956, "train_info/time_within_train_step": 27.859354496002197, "step": 956}
{"train_info/time_between_train_steps": 0.005617618560791016, "step": 956}
{"info/global_step": 957, "train_info/time_within_train_step": 27.888511180877686, "step": 957}
{"train_info/time_between_train_steps": 0.00799703598022461, "step": 957}
{"info/global_step": 958, "train_info/time_within_train_step": 27.889397382736206, "step": 958}
{"train_info/time_between_train_steps": 0.009823799133300781, "step": 958}
{"info/global_step": 959, "train_info/time_within_train_step": 27.882930755615234, "step": 959}
{"train_info/time_between_train_steps": 0.006162405014038086, "step": 959}
{"info/global_step": 960, "train_info/time_within_train_step": 27.8966166973114, "step": 960}
{"train_info/time_between_train_steps": 0.005913734436035156, "step": 960}
{"train_info/time_between_train_steps": 5.191656589508057, "step": 960}
{"info/global_step": 961, "train_info/time_within_train_step": 27.789000511169434, "step": 961}
{"train_info/time_between_train_steps": 0.005738973617553711, "step": 961}
{"info/global_step": 962, "train_info/time_within_train_step": 28.052489519119263, "step": 962}
{"train_info/time_between_train_steps": 0.005551815032958984, "step": 962}
{"info/global_step": 963, "train_info/time_within_train_step": 27.9151771068573, "step": 963}
{"train_info/time_between_train_steps": 0.005597114562988281, "step": 963}
{"info/global_step": 964, "train_info/time_within_train_step": 28.411425828933716, "step": 964}
{"train_info/time_between_train_steps": 0.0050678253173828125, "step": 964}
{"info/global_step": 965, "train_info/time_within_train_step": 27.83763360977173, "step": 965}
{"train_info/time_between_train_steps": 0.0058650970458984375, "step": 965}
{"info/global_step": 966, "train_info/time_within_train_step": 27.977898597717285, "step": 966}
{"train_info/time_between_train_steps": 0.005273580551147461, "step": 966}
{"info/global_step": 967, "train_info/time_within_train_step": 27.887017965316772, "step": 967}
{"train_info/time_between_train_steps": 0.0051593780517578125, "step": 967}
{"info/global_step": 968, "train_info/time_within_train_step": 27.821566343307495, "step": 968}
{"train_info/time_between_train_steps": 0.005392551422119141, "step": 968}
{"info/global_step": 969, "train_info/time_within_train_step": 27.810842275619507, "step": 969}
{"train_info/time_between_train_steps": 0.005220651626586914, "step": 969}
{"info/global_step": 970, "train_info/time_within_train_step": 27.844110012054443, "step": 970}
{"train_info/time_between_train_steps": 0.0054836273193359375, "step": 970}
{"info/global_step": 971, "train_info/time_within_train_step": 27.80595374107361, "step": 971}
{"train_info/time_between_train_steps": 0.005359649658203125, "step": 971}
{"info/global_step": 972, "train_info/time_within_train_step": 27.851890802383423, "step": 972}
{"train_info/time_between_train_steps": 0.011244535446166992, "step": 972}
{"info/global_step": 973, "train_info/time_within_train_step": 27.857337474822998, "step": 973}
{"train_info/time_between_train_steps": 0.0053637027740478516, "step": 973}
{"info/global_step": 974, "train_info/time_within_train_step": 27.86637592315674, "step": 974}
{"train_info/time_between_train_steps": 0.005276203155517578, "step": 974}
{"info/global_step": 975, "train_info/time_within_train_step": 27.866991758346558, "step": 975}
{"train_info/time_between_train_steps": 0.010159492492675781, "step": 975}
{"info/global_step": 976, "train_info/time_within_train_step": 27.831337451934814, "step": 976}
{"train_info/time_between_train_steps": 0.00559544563293457, "step": 976}
{"info/global_step": 977, "train_info/time_within_train_step": 27.88849663734436, "step": 977}
{"train_info/time_between_train_steps": 0.0051991939544677734, "step": 977}
{"info/global_step": 978, "train_info/time_within_train_step": 27.87962317466736, "step": 978}
{"train_info/time_between_train_steps": 0.005331993103027344, "step": 978}
{"info/global_step": 979, "train_info/time_within_train_step": 27.851089477539062, "step": 979}
{"train_info/time_between_train_steps": 0.011881589889526367, "step": 979}
{"info/global_step": 980, "train_info/time_within_train_step": 27.930831909179688, "step": 980}
{"train_info/time_between_train_steps": 0.01476740837097168, "step": 980}
{"info/global_step": 981, "train_info/time_within_train_step": 27.913533449172974, "step": 981}
{"train_info/time_between_train_steps": 0.007160663604736328, "step": 981}
{"info/global_step": 982, "train_info/time_within_train_step": 28.11786651611328, "step": 982}
{"train_info/time_between_train_steps": 0.013040781021118164, "step": 982}
{"info/global_step": 983, "train_info/time_within_train_step": 27.899564027786255, "step": 983}
{"train_info/time_between_train_steps": 0.011513471603393555, "step": 983}
{"info/global_step": 984, "train_info/time_within_train_step": 27.90519404411316, "step": 984}
{"train_info/time_between_train_steps": 0.006306886672973633, "step": 984}
{"train_info/time_between_train_steps": 5.3222222328186035, "step": 984}
{"info/global_step": 985, "train_info/time_within_train_step": 27.84534525871277, "step": 985}
{"train_info/time_between_train_steps": 0.005148172378540039, "step": 985}
{"info/global_step": 986, "train_info/time_within_train_step": 28.026160717010498, "step": 986}
{"train_info/time_between_train_steps": 0.0057599544525146484, "step": 986}
{"info/global_step": 987, "train_info/time_within_train_step": 27.87250852584839, "step": 987}
{"train_info/time_between_train_steps": 0.01073312759399414, "step": 987}
{"info/global_step": 988, "train_info/time_within_train_step": 27.89476466178894, "step": 988}
{"train_info/time_between_train_steps": 0.010852575302124023, "step": 988}
{"info/global_step": 989, "train_info/time_within_train_step": 27.911609411239624, "step": 989}
{"train_info/time_between_train_steps": 0.009978532791137695, "step": 989}
{"info/global_step": 990, "train_info/time_within_train_step": 27.848854780197144, "step": 990}
{"train_info/time_between_train_steps": 0.005465507507324219, "step": 990}
{"info/global_step": 991, "train_info/time_within_train_step": 27.806310892105103, "step": 991}
{"train_info/time_between_train_steps": 0.00540924072265625, "step": 991}
{"info/global_step": 992, "train_info/time_within_train_step": 27.85192632675171, "step": 992}
{"train_info/time_between_train_steps": 0.005357503890991211, "step": 992}
{"info/global_step": 993, "train_info/time_within_train_step": 27.83337712287903, "step": 993}
{"train_info/time_between_train_steps": 0.005525350570678711, "step": 993}
{"info/global_step": 994, "train_info/time_within_train_step": 27.934894323349, "step": 994}
{"train_info/time_between_train_steps": 0.009718179702758789, "step": 994}
{"info/global_step": 995, "train_info/time_within_train_step": 27.91450810432434, "step": 995}
{"train_info/time_between_train_steps": 0.005321025848388672, "step": 995}
{"info/global_step": 996, "train_info/time_within_train_step": 27.864219427108765, "step": 996}
{"train_info/time_between_train_steps": 0.005610942840576172, "step": 996}
{"info/global_step": 997, "train_info/time_within_train_step": 28.008266925811768, "step": 997}
{"train_info/time_between_train_steps": 0.010438680648803711, "step": 997}
{"info/global_step": 998, "train_info/time_within_train_step": 27.83282995223999, "step": 998}
{"train_info/time_between_train_steps": 0.010363101959228516, "step": 998}
{"info/global_step": 999, "train_info/time_within_train_step": 27.869904041290283, "step": 999}
{"train_info/time_between_train_steps": 0.005359649658203125, "step": 999}
{"info/global_step": 1000, "train_info/time_within_train_step": 27.885088682174683, "step": 1000}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22648.0, "train_info/memory_max_reserved": 22648.0, "_timestamp": 1733890487, "_runtime": 28799}, "step": 1000}
{"logs": {"train/loss": 3.8885, "train/learning_rate": 0.00011111111111111109, "train/epoch": 41.01, "_timestamp": 1733890487, "_runtime": 28799}, "step": 1000}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27358.0, "train_info/memory_max_reserved": 27358.0, "_timestamp": 1733890489, "_runtime": 28801}, "step": 1000}
{"logs": {"eval/loss": 5.021076202392578, "eval/runtime": 1.8249, "eval/samples_per_second": 50.963, "eval/steps_per_second": 3.288, "train/epoch": 41.01, "_timestamp": 1733890489, "_runtime": 28801}, "step": 1000}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27358.0, "train_info/memory_max_reserved": 27358.0, "_timestamp": 1733890489, "_runtime": 28801}, "step": 1000}
{"logs": {"eval//local/xiulyang/mission-impossible-language-models/training/babylm_dataset.py_loss": 5.021076202392578, "eval//local/xiulyang/mission-impossible-language-models/training/babylm_dataset.py_ppl": 151.57434071608614, "eval//local/xiulyang/mission-impossible-language-models/training/babylm_dataset.py_runtime": 1.8249, "eval//local/xiulyang/mission-impossible-language-models/training/babylm_dataset.py_samples_per_second": 50.963, "train/epoch": 41.01, "_timestamp": 1733890489, "_runtime": 28801}, "step": 1000}
{"train_info/time_between_train_steps": 4.208867788314819, "step": 1000}
{"info/global_step": 1001, "train_info/time_within_train_step": 27.871687650680542, "step": 1001}
{"train_info/time_between_train_steps": 0.010308265686035156, "step": 1001}
{"info/global_step": 1002, "train_info/time_within_train_step": 27.84255075454712, "step": 1002}
{"train_info/time_between_train_steps": 0.005226612091064453, "step": 1002}
{"info/global_step": 1003, "train_info/time_within_train_step": 27.873998403549194, "step": 1003}
{"train_info/time_between_train_steps": 0.005320310592651367, "step": 1003}
{"info/global_step": 1004, "train_info/time_within_train_step": 27.84050679206848, "step": 1004}
{"train_info/time_between_train_steps": 0.010746002197265625, "step": 1004}
{"info/global_step": 1005, "train_info/time_within_train_step": 27.91942071914673, "step": 1005}
{"train_info/time_between_train_steps": 0.005536317825317383, "step": 1005}
{"info/global_step": 1006, "train_info/time_within_train_step": 27.880692720413208, "step": 1006}
{"train_info/time_between_train_steps": 0.0062940120697021484, "step": 1006}
{"info/global_step": 1007, "train_info/time_within_train_step": 27.865641355514526, "step": 1007}
{"train_info/time_between_train_steps": 0.010835886001586914, "step": 1007}
{"info/global_step": 1008, "train_info/time_within_train_step": 27.99689292907715, "step": 1008}
{"train_info/time_between_train_steps": 0.010865449905395508, "step": 1008}
{"train_info/time_between_train_steps": 5.426269054412842, "step": 1008}
{"info/global_step": 1009, "train_info/time_within_train_step": 27.834061861038208, "step": 1009}
{"train_info/time_between_train_steps": 0.01191091537475586, "step": 1009}
{"info/global_step": 1010, "train_info/time_within_train_step": 27.97603130340576, "step": 1010}
{"train_info/time_between_train_steps": 0.005285024642944336, "step": 1010}
{"info/global_step": 1011, "train_info/time_within_train_step": 27.933807134628296, "step": 1011}
{"train_info/time_between_train_steps": 0.00547337532043457, "step": 1011}
{"info/global_step": 1012, "train_info/time_within_train_step": 27.945985794067383, "step": 1012}
{"train_info/time_between_train_steps": 0.005488157272338867, "step": 1012}
{"info/global_step": 1013, "train_info/time_within_train_step": 27.975032806396484, "step": 1013}
{"train_info/time_between_train_steps": 0.0052869319915771484, "step": 1013}
{"info/global_step": 1014, "train_info/time_within_train_step": 27.847171306610107, "step": 1014}
{"train_info/time_between_train_steps": 0.014146566390991211, "step": 1014}
{"info/global_step": 1015, "train_info/time_within_train_step": 27.91959023475647, "step": 1015}
{"train_info/time_between_train_steps": 0.009741067886352539, "step": 1015}
{"info/global_step": 1016, "train_info/time_within_train_step": 27.85541081428528, "step": 1016}
{"train_info/time_between_train_steps": 0.010186433792114258, "step": 1016}
{"info/global_step": 1017, "train_info/time_within_train_step": 27.88287615776062, "step": 1017}
{"train_info/time_between_train_steps": 0.005461692810058594, "step": 1017}
{"info/global_step": 1018, "train_info/time_within_train_step": 27.824490308761597, "step": 1018}
{"train_info/time_between_train_steps": 0.005400180816650391, "step": 1018}
{"info/global_step": 1019, "train_info/time_within_train_step": 27.83704400062561, "step": 1019}
{"train_info/time_between_train_steps": 0.005383491516113281, "step": 1019}
{"info/global_step": 1020, "train_info/time_within_train_step": 27.93085741996765, "step": 1020}
{"train_info/time_between_train_steps": 0.0072023868560791016, "step": 1020}
{"info/global_step": 1021, "train_info/time_within_train_step": 27.890251636505127, "step": 1021}
{"train_info/time_between_train_steps": 0.005392789840698242, "step": 1021}
{"info/global_step": 1022, "train_info/time_within_train_step": 27.814088106155396, "step": 1022}
{"train_info/time_between_train_steps": 0.005352973937988281, "step": 1022}
{"info/global_step": 1023, "train_info/time_within_train_step": 27.812724351882935, "step": 1023}
{"train_info/time_between_train_steps": 0.0053558349609375, "step": 1023}
{"info/global_step": 1024, "train_info/time_within_train_step": 27.879349946975708, "step": 1024}
{"train_info/time_between_train_steps": 0.005811214447021484, "step": 1024}
{"info/global_step": 1025, "train_info/time_within_train_step": 27.849042415618896, "step": 1025}
{"train_info/time_between_train_steps": 0.005323886871337891, "step": 1025}
{"info/global_step": 1026, "train_info/time_within_train_step": 27.816988945007324, "step": 1026}
{"train_info/time_between_train_steps": 0.00547480583190918, "step": 1026}
{"info/global_step": 1027, "train_info/time_within_train_step": 27.818432331085205, "step": 1027}
{"train_info/time_between_train_steps": 0.005283355712890625, "step": 1027}
{"info/global_step": 1028, "train_info/time_within_train_step": 28.04896569252014, "step": 1028}
{"train_info/time_between_train_steps": 0.00604248046875, "step": 1028}
{"info/global_step": 1029, "train_info/time_within_train_step": 27.856252193450928, "step": 1029}
{"train_info/time_between_train_steps": 0.005608081817626953, "step": 1029}
{"info/global_step": 1030, "train_info/time_within_train_step": 27.89925503730774, "step": 1030}
{"train_info/time_between_train_steps": 0.00982809066772461, "step": 1030}
{"info/global_step": 1031, "train_info/time_within_train_step": 27.8701491355896, "step": 1031}
{"train_info/time_between_train_steps": 0.011253118515014648, "step": 1031}
{"info/global_step": 1032, "train_info/time_within_train_step": 27.858869075775146, "step": 1032}
{"train_info/time_between_train_steps": 0.0070421695709228516, "step": 1032}
{"train_info/time_between_train_steps": 5.631202697753906, "step": 1032}
{"info/global_step": 1033, "train_info/time_within_train_step": 27.875207901000977, "step": 1033}
{"train_info/time_between_train_steps": 0.010218620300292969, "step": 1033}
{"info/global_step": 1034, "train_info/time_within_train_step": 28.023854732513428, "step": 1034}
{"train_info/time_between_train_steps": 0.005663156509399414, "step": 1034}
{"info/global_step": 1035, "train_info/time_within_train_step": 27.858847856521606, "step": 1035}
{"train_info/time_between_train_steps": 0.010233640670776367, "step": 1035}
{"info/global_step": 1036, "train_info/time_within_train_step": 27.96044635772705, "step": 1036}
{"train_info/time_between_train_steps": 0.005649089813232422, "step": 1036}
{"info/global_step": 1037, "train_info/time_within_train_step": 27.82658886909485, "step": 1037}
{"train_info/time_between_train_steps": 0.0054895877838134766, "step": 1037}
{"info/global_step": 1038, "train_info/time_within_train_step": 27.847219467163086, "step": 1038}
{"train_info/time_between_train_steps": 0.0050258636474609375, "step": 1038}
{"info/global_step": 1039, "train_info/time_within_train_step": 27.800825357437134, "step": 1039}
{"train_info/time_between_train_steps": 0.005166530609130859, "step": 1039}
{"info/global_step": 1040, "train_info/time_within_train_step": 27.850704193115234, "step": 1040}
{"train_info/time_between_train_steps": 0.005276918411254883, "step": 1040}
{"info/global_step": 1041, "train_info/time_within_train_step": 27.860581874847412, "step": 1041}
{"train_info/time_between_train_steps": 0.005258321762084961, "step": 1041}
{"info/global_step": 1042, "train_info/time_within_train_step": 27.894838094711304, "step": 1042}
{"train_info/time_between_train_steps": 0.009755373001098633, "step": 1042}
{"info/global_step": 1043, "train_info/time_within_train_step": 27.88935685157776, "step": 1043}
{"train_info/time_between_train_steps": 0.005264997482299805, "step": 1043}
{"info/global_step": 1044, "train_info/time_within_train_step": 27.943812370300293, "step": 1044}
{"train_info/time_between_train_steps": 0.005316495895385742, "step": 1044}
{"info/global_step": 1045, "train_info/time_within_train_step": 27.898627996444702, "step": 1045}
{"train_info/time_between_train_steps": 0.005282163619995117, "step": 1045}
{"info/global_step": 1046, "train_info/time_within_train_step": 27.890408039093018, "step": 1046}
{"train_info/time_between_train_steps": 0.005305767059326172, "step": 1046}
{"info/global_step": 1047, "train_info/time_within_train_step": 27.83865213394165, "step": 1047}
{"train_info/time_between_train_steps": 0.010326147079467773, "step": 1047}
{"info/global_step": 1048, "train_info/time_within_train_step": 27.825844526290894, "step": 1048}
{"train_info/time_between_train_steps": 0.005569934844970703, "step": 1048}
{"info/global_step": 1049, "train_info/time_within_train_step": 27.864558696746826, "step": 1049}
{"train_info/time_between_train_steps": 0.009278297424316406, "step": 1049}
{"info/global_step": 1050, "train_info/time_within_train_step": 27.882912635803223, "step": 1050}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27358.0, "train_info/memory_max_reserved": 27358.0, "_timestamp": 1733891897, "_runtime": 30209}, "step": 1050}
{"logs": {"train/loss": 3.8378, "train/learning_rate": 8.333333333333333e-05, "train/epoch": 43.02, "_timestamp": 1733891897, "_runtime": 30209}, "step": 1050}
{"train_info/time_between_train_steps": 0.010396003723144531, "step": 1050}
{"info/global_step": 1051, "train_info/time_within_train_step": 27.870380401611328, "step": 1051}
{"train_info/time_between_train_steps": 0.009507894515991211, "step": 1051}
{"info/global_step": 1052, "train_info/time_within_train_step": 27.832257747650146, "step": 1052}
{"train_info/time_between_train_steps": 0.009567975997924805, "step": 1052}
{"info/global_step": 1053, "train_info/time_within_train_step": 27.935939073562622, "step": 1053}
{"train_info/time_between_train_steps": 0.0055081844329833984, "step": 1053}
{"info/global_step": 1054, "train_info/time_within_train_step": 27.880056619644165, "step": 1054}
{"train_info/time_between_train_steps": 0.010406494140625, "step": 1054}
{"info/global_step": 1055, "train_info/time_within_train_step": 27.860008001327515, "step": 1055}
{"train_info/time_between_train_steps": 0.00567317008972168, "step": 1055}
{"info/global_step": 1056, "train_info/time_within_train_step": 27.90692710876465, "step": 1056}
{"train_info/time_between_train_steps": 0.00601959228515625, "step": 1056}
{"train_info/time_between_train_steps": 5.076283693313599, "step": 1056}
{"info/global_step": 1057, "train_info/time_within_train_step": 27.840405225753784, "step": 1057}
{"train_info/time_between_train_steps": 0.005169391632080078, "step": 1057}
{"info/global_step": 1058, "train_info/time_within_train_step": 28.035789966583252, "step": 1058}
{"train_info/time_between_train_steps": 0.005443096160888672, "step": 1058}
{"info/global_step": 1059, "train_info/time_within_train_step": 27.889871835708618, "step": 1059}
{"train_info/time_between_train_steps": 0.005475044250488281, "step": 1059}
{"info/global_step": 1060, "train_info/time_within_train_step": 28.028029918670654, "step": 1060}
{"train_info/time_between_train_steps": 0.005610942840576172, "step": 1060}
{"info/global_step": 1061, "train_info/time_within_train_step": 27.823429107666016, "step": 1061}
{"train_info/time_between_train_steps": 0.005183219909667969, "step": 1061}
{"info/global_step": 1062, "train_info/time_within_train_step": 27.829499006271362, "step": 1062}
{"train_info/time_between_train_steps": 0.005187034606933594, "step": 1062}
{"info/global_step": 1063, "train_info/time_within_train_step": 27.781425952911377, "step": 1063}
{"train_info/time_between_train_steps": 0.005378246307373047, "step": 1063}
{"info/global_step": 1064, "train_info/time_within_train_step": 27.827489137649536, "step": 1064}
{"train_info/time_between_train_steps": 0.005195140838623047, "step": 1064}
{"info/global_step": 1065, "train_info/time_within_train_step": 27.831575632095337, "step": 1065}
{"train_info/time_between_train_steps": 0.005433797836303711, "step": 1065}
{"info/global_step": 1066, "train_info/time_within_train_step": 27.86000967025757, "step": 1066}
{"train_info/time_between_train_steps": 0.005422830581665039, "step": 1066}
{"info/global_step": 1067, "train_info/time_within_train_step": 27.841500282287598, "step": 1067}
{"train_info/time_between_train_steps": 0.005216360092163086, "step": 1067}
{"info/global_step": 1068, "train_info/time_within_train_step": 27.848201990127563, "step": 1068}
{"train_info/time_between_train_steps": 0.005240917205810547, "step": 1068}
{"info/global_step": 1069, "train_info/time_within_train_step": 27.81586480140686, "step": 1069}
{"train_info/time_between_train_steps": 0.00553584098815918, "step": 1069}
{"info/global_step": 1070, "train_info/time_within_train_step": 27.87034583091736, "step": 1070}
{"train_info/time_between_train_steps": 0.010185480117797852, "step": 1070}
{"info/global_step": 1071, "train_info/time_within_train_step": 27.8208429813385, "step": 1071}
{"train_info/time_between_train_steps": 0.005502939224243164, "step": 1071}
{"info/global_step": 1072, "train_info/time_within_train_step": 27.8571138381958, "step": 1072}
{"train_info/time_between_train_steps": 0.005479574203491211, "step": 1072}
{"info/global_step": 1073, "train_info/time_within_train_step": 27.901679754257202, "step": 1073}
{"train_info/time_between_train_steps": 0.0064699649810791016, "step": 1073}
{"info/global_step": 1074, "train_info/time_within_train_step": 27.861160039901733, "step": 1074}
{"train_info/time_between_train_steps": 0.005468606948852539, "step": 1074}
{"info/global_step": 1075, "train_info/time_within_train_step": 28.04956865310669, "step": 1075}
{"train_info/time_between_train_steps": 0.0055484771728515625, "step": 1075}
{"info/global_step": 1076, "train_info/time_within_train_step": 27.876789331436157, "step": 1076}
{"train_info/time_between_train_steps": 0.0059244632720947266, "step": 1076}
{"info/global_step": 1077, "train_info/time_within_train_step": 27.894335746765137, "step": 1077}
{"train_info/time_between_train_steps": 0.005440235137939453, "step": 1077}
{"info/global_step": 1078, "train_info/time_within_train_step": 27.837372541427612, "step": 1078}
{"train_info/time_between_train_steps": 0.00574803352355957, "step": 1078}
{"info/global_step": 1079, "train_info/time_within_train_step": 27.862847328186035, "step": 1079}
{"train_info/time_between_train_steps": 0.0058135986328125, "step": 1079}
{"info/global_step": 1080, "train_info/time_within_train_step": 27.939833164215088, "step": 1080}
{"train_info/time_between_train_steps": 0.006144285202026367, "step": 1080}
{"train_info/time_between_train_steps": 5.433382272720337, "step": 1080}
{"info/global_step": 1081, "train_info/time_within_train_step": 27.86947202682495, "step": 1081}
{"train_info/time_between_train_steps": 0.01010751724243164, "step": 1081}
{"info/global_step": 1082, "train_info/time_within_train_step": 28.01881718635559, "step": 1082}
{"train_info/time_between_train_steps": 0.005396604537963867, "step": 1082}
{"info/global_step": 1083, "train_info/time_within_train_step": 27.928024291992188, "step": 1083}
{"train_info/time_between_train_steps": 0.005327701568603516, "step": 1083}
{"info/global_step": 1084, "train_info/time_within_train_step": 27.879897832870483, "step": 1084}
{"train_info/time_between_train_steps": 0.005597829818725586, "step": 1084}
{"info/global_step": 1085, "train_info/time_within_train_step": 27.84545636177063, "step": 1085}
{"train_info/time_between_train_steps": 0.00518035888671875, "step": 1085}
{"info/global_step": 1086, "train_info/time_within_train_step": 27.820013761520386, "step": 1086}
{"train_info/time_between_train_steps": 0.005136013031005859, "step": 1086}
{"info/global_step": 1087, "train_info/time_within_train_step": 27.82221007347107, "step": 1087}
{"train_info/time_between_train_steps": 0.00972437858581543, "step": 1087}
{"info/global_step": 1088, "train_info/time_within_train_step": 27.811971187591553, "step": 1088}
{"train_info/time_between_train_steps": 0.005386829376220703, "step": 1088}
{"info/global_step": 1089, "train_info/time_within_train_step": 27.79498600959778, "step": 1089}
{"train_info/time_between_train_steps": 0.005358219146728516, "step": 1089}
{"info/global_step": 1090, "train_info/time_within_train_step": 27.800930976867676, "step": 1090}
{"train_info/time_between_train_steps": 0.005383491516113281, "step": 1090}
{"info/global_step": 1091, "train_info/time_within_train_step": 27.90198254585266, "step": 1091}
{"train_info/time_between_train_steps": 0.009496688842773438, "step": 1091}
{"info/global_step": 1092, "train_info/time_within_train_step": 27.837273836135864, "step": 1092}
{"train_info/time_between_train_steps": 0.006284952163696289, "step": 1092}
{"info/global_step": 1093, "train_info/time_within_train_step": 27.8120756149292, "step": 1093}
{"train_info/time_between_train_steps": 0.0055468082427978516, "step": 1093}
{"info/global_step": 1094, "train_info/time_within_train_step": 27.841538190841675, "step": 1094}
{"train_info/time_between_train_steps": 0.005209922790527344, "step": 1094}
{"info/global_step": 1095, "train_info/time_within_train_step": 27.830973625183105, "step": 1095}
{"train_info/time_between_train_steps": 0.0053424835205078125, "step": 1095}
{"info/global_step": 1096, "train_info/time_within_train_step": 27.84394598007202, "step": 1096}
{"train_info/time_between_train_steps": 0.0053327083587646484, "step": 1096}
{"info/global_step": 1097, "train_info/time_within_train_step": 27.92316508293152, "step": 1097}
{"train_info/time_between_train_steps": 0.0055446624755859375, "step": 1097}
{"info/global_step": 1098, "train_info/time_within_train_step": 27.883422374725342, "step": 1098}
{"train_info/time_between_train_steps": 0.005305290222167969, "step": 1098}
{"info/global_step": 1099, "train_info/time_within_train_step": 27.865355730056763, "step": 1099}
{"train_info/time_between_train_steps": 0.005285024642944336, "step": 1099}
{"info/global_step": 1100, "train_info/time_within_train_step": 27.873096704483032, "step": 1100}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27358.0, "train_info/memory_max_reserved": 27358.0, "_timestamp": 1733893302, "_runtime": 31614}, "step": 1100}
{"logs": {"train/loss": 3.795, "train/learning_rate": 5.5555555555555545e-05, "train/epoch": 45.02, "_timestamp": 1733893302, "_runtime": 31614}, "step": 1100}
{"train_info/time_between_train_steps": 2.3480334281921387, "step": 1100}
{"info/global_step": 1101, "train_info/time_within_train_step": 27.819809436798096, "step": 1101}
{"train_info/time_between_train_steps": 0.005479574203491211, "step": 1101}
{"info/global_step": 1102, "train_info/time_within_train_step": 27.82911515235901, "step": 1102}
{"train_info/time_between_train_steps": 0.005760908126831055, "step": 1102}
{"info/global_step": 1103, "train_info/time_within_train_step": 27.89913821220398, "step": 1103}
{"train_info/time_between_train_steps": 0.006544589996337891, "step": 1103}
{"info/global_step": 1104, "train_info/time_within_train_step": 27.878231287002563, "step": 1104}
{"train_info/time_between_train_steps": 0.00638127326965332, "step": 1104}
{"train_info/time_between_train_steps": 5.429275035858154, "step": 1104}
{"info/global_step": 1105, "train_info/time_within_train_step": 27.801952600479126, "step": 1105}
{"train_info/time_between_train_steps": 0.00572657585144043, "step": 1105}
{"info/global_step": 1106, "train_info/time_within_train_step": 28.12136435508728, "step": 1106}
{"train_info/time_between_train_steps": 0.005679607391357422, "step": 1106}
{"info/global_step": 1107, "train_info/time_within_train_step": 27.84022045135498, "step": 1107}
{"train_info/time_between_train_steps": 0.005803108215332031, "step": 1107}
{"info/global_step": 1108, "train_info/time_within_train_step": 27.927231311798096, "step": 1108}
{"train_info/time_between_train_steps": 0.00576329231262207, "step": 1108}
{"info/global_step": 1109, "train_info/time_within_train_step": 27.82115125656128, "step": 1109}
{"train_info/time_between_train_steps": 0.009726524353027344, "step": 1109}
{"info/global_step": 1110, "train_info/time_within_train_step": 27.84475016593933, "step": 1110}
{"train_info/time_between_train_steps": 0.005287647247314453, "step": 1110}
{"info/global_step": 1111, "train_info/time_within_train_step": 27.821574926376343, "step": 1111}
{"train_info/time_between_train_steps": 0.005259513854980469, "step": 1111}
{"info/global_step": 1112, "train_info/time_within_train_step": 27.83818030357361, "step": 1112}
{"train_info/time_between_train_steps": 0.0053670406341552734, "step": 1112}
{"info/global_step": 1113, "train_info/time_within_train_step": 27.871209621429443, "step": 1113}
{"train_info/time_between_train_steps": 0.005872011184692383, "step": 1113}
{"info/global_step": 1114, "train_info/time_within_train_step": 27.851113319396973, "step": 1114}
{"train_info/time_between_train_steps": 0.005345582962036133, "step": 1114}
{"info/global_step": 1115, "train_info/time_within_train_step": 27.8630211353302, "step": 1115}
{"train_info/time_between_train_steps": 0.009368658065795898, "step": 1115}
{"info/global_step": 1116, "train_info/time_within_train_step": 27.82919931411743, "step": 1116}
{"train_info/time_between_train_steps": 0.005470991134643555, "step": 1116}
{"info/global_step": 1117, "train_info/time_within_train_step": 27.795893669128418, "step": 1117}
{"train_info/time_between_train_steps": 0.005371570587158203, "step": 1117}
{"info/global_step": 1118, "train_info/time_within_train_step": 27.81351399421692, "step": 1118}
{"train_info/time_between_train_steps": 0.005371809005737305, "step": 1118}
{"info/global_step": 1119, "train_info/time_within_train_step": 27.87670087814331, "step": 1119}
{"train_info/time_between_train_steps": 0.005535602569580078, "step": 1119}
{"info/global_step": 1120, "train_info/time_within_train_step": 27.8546245098114, "step": 1120}
{"train_info/time_between_train_steps": 0.005479335784912109, "step": 1120}
{"info/global_step": 1121, "train_info/time_within_train_step": 27.780725955963135, "step": 1121}
{"train_info/time_between_train_steps": 0.005257606506347656, "step": 1121}
{"info/global_step": 1122, "train_info/time_within_train_step": 27.91702675819397, "step": 1122}
{"train_info/time_between_train_steps": 0.005615711212158203, "step": 1122}
{"info/global_step": 1123, "train_info/time_within_train_step": 27.83725619316101, "step": 1123}
{"train_info/time_between_train_steps": 0.005323886871337891, "step": 1123}
{"info/global_step": 1124, "train_info/time_within_train_step": 27.790276288986206, "step": 1124}
{"train_info/time_between_train_steps": 0.005994558334350586, "step": 1124}
{"info/global_step": 1125, "train_info/time_within_train_step": 27.972107410430908, "step": 1125}
{"train_info/time_between_train_steps": 0.005520820617675781, "step": 1125}
{"info/global_step": 1126, "train_info/time_within_train_step": 27.920991897583008, "step": 1126}
{"train_info/time_between_train_steps": 0.0057659149169921875, "step": 1126}
{"info/global_step": 1127, "train_info/time_within_train_step": 27.863704442977905, "step": 1127}
{"train_info/time_between_train_steps": 0.005798816680908203, "step": 1127}
{"info/global_step": 1128, "train_info/time_within_train_step": 27.84405493736267, "step": 1128}
{"train_info/time_between_train_steps": 0.010540008544921875, "step": 1128}
{"train_info/time_between_train_steps": 5.095949172973633, "step": 1128}
{"info/global_step": 1129, "train_info/time_within_train_step": 27.899057149887085, "step": 1129}
{"train_info/time_between_train_steps": 0.005826473236083984, "step": 1129}
{"info/global_step": 1130, "train_info/time_within_train_step": 28.023507356643677, "step": 1130}
{"train_info/time_between_train_steps": 0.005648374557495117, "step": 1130}
{"info/global_step": 1131, "train_info/time_within_train_step": 27.80763292312622, "step": 1131}
{"train_info/time_between_train_steps": 0.006804943084716797, "step": 1131}
{"info/global_step": 1132, "train_info/time_within_train_step": 27.906848192214966, "step": 1132}
{"train_info/time_between_train_steps": 0.0055999755859375, "step": 1132}
{"info/global_step": 1133, "train_info/time_within_train_step": 27.797048568725586, "step": 1133}
{"train_info/time_between_train_steps": 0.005110025405883789, "step": 1133}
{"info/global_step": 1134, "train_info/time_within_train_step": 27.830748319625854, "step": 1134}
{"train_info/time_between_train_steps": 0.010213136672973633, "step": 1134}
{"info/global_step": 1135, "train_info/time_within_train_step": 27.767333269119263, "step": 1135}
{"train_info/time_between_train_steps": 0.010088443756103516, "step": 1135}
{"info/global_step": 1136, "train_info/time_within_train_step": 27.76253867149353, "step": 1136}
{"train_info/time_between_train_steps": 0.00527644157409668, "step": 1136}
{"info/global_step": 1137, "train_info/time_within_train_step": 27.88440203666687, "step": 1137}
{"train_info/time_between_train_steps": 0.005332469940185547, "step": 1137}
{"info/global_step": 1138, "train_info/time_within_train_step": 27.78595805168152, "step": 1138}
{"train_info/time_between_train_steps": 0.0051119327545166016, "step": 1138}
{"info/global_step": 1139, "train_info/time_within_train_step": 27.79640483856201, "step": 1139}
{"train_info/time_between_train_steps": 0.005146503448486328, "step": 1139}
{"info/global_step": 1140, "train_info/time_within_train_step": 27.97141933441162, "step": 1140}
{"train_info/time_between_train_steps": 0.009627103805541992, "step": 1140}
{"info/global_step": 1141, "train_info/time_within_train_step": 27.777838230133057, "step": 1141}
{"train_info/time_between_train_steps": 0.006667375564575195, "step": 1141}
{"info/global_step": 1142, "train_info/time_within_train_step": 27.77028489112854, "step": 1142}
{"train_info/time_between_train_steps": 0.005158662796020508, "step": 1142}
{"info/global_step": 1143, "train_info/time_within_train_step": 27.782121658325195, "step": 1143}
{"train_info/time_between_train_steps": 0.005317211151123047, "step": 1143}
{"info/global_step": 1144, "train_info/time_within_train_step": 27.75640892982483, "step": 1144}
{"train_info/time_between_train_steps": 0.005335092544555664, "step": 1144}
{"info/global_step": 1145, "train_info/time_within_train_step": 27.747837781906128, "step": 1145}
{"train_info/time_between_train_steps": 0.00524592399597168, "step": 1145}
{"info/global_step": 1146, "train_info/time_within_train_step": 27.794943809509277, "step": 1146}
{"train_info/time_between_train_steps": 0.00536656379699707, "step": 1146}
{"info/global_step": 1147, "train_info/time_within_train_step": 27.789411783218384, "step": 1147}
{"train_info/time_between_train_steps": 0.005321979522705078, "step": 1147}
{"info/global_step": 1148, "train_info/time_within_train_step": 27.785889863967896, "step": 1148}
{"train_info/time_between_train_steps": 0.005522012710571289, "step": 1148}
{"info/global_step": 1149, "train_info/time_within_train_step": 27.779873847961426, "step": 1149}
{"train_info/time_between_train_steps": 0.01063680648803711, "step": 1149}
{"info/global_step": 1150, "train_info/time_within_train_step": 27.966851949691772, "step": 1150}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27358.0, "train_info/memory_max_reserved": 27358.0, "_timestamp": 1733894707, "_runtime": 33019}, "step": 1150}
{"logs": {"train/loss": 3.759, "train/learning_rate": 2.7777777777777772e-05, "train/epoch": 47.02, "_timestamp": 1733894707, "_runtime": 33019}, "step": 1150}
{"train_info/time_between_train_steps": 0.007906436920166016, "step": 1150}
{"info/global_step": 1151, "train_info/time_within_train_step": 27.835726022720337, "step": 1151}
{"train_info/time_between_train_steps": 0.011323690414428711, "step": 1151}
{"info/global_step": 1152, "train_info/time_within_train_step": 27.824504137039185, "step": 1152}
{"train_info/time_between_train_steps": 0.005723237991333008, "step": 1152}
{"train_info/time_between_train_steps": 5.2894017696380615, "step": 1152}
{"info/global_step": 1153, "train_info/time_within_train_step": 27.985440492630005, "step": 1153}
{"train_info/time_between_train_steps": 0.005067110061645508, "step": 1153}
{"info/global_step": 1154, "train_info/time_within_train_step": 27.958593368530273, "step": 1154}
{"train_info/time_between_train_steps": 0.005697965621948242, "step": 1154}
{"info/global_step": 1155, "train_info/time_within_train_step": 27.82355284690857, "step": 1155}
{"train_info/time_between_train_steps": 0.005614042282104492, "step": 1155}
{"info/global_step": 1156, "train_info/time_within_train_step": 27.937049865722656, "step": 1156}
{"train_info/time_between_train_steps": 0.0055696964263916016, "step": 1156}
{"info/global_step": 1157, "train_info/time_within_train_step": 27.911148071289062, "step": 1157}
{"train_info/time_between_train_steps": 0.010195493698120117, "step": 1157}
{"info/global_step": 1158, "train_info/time_within_train_step": 27.859436988830566, "step": 1158}
{"train_info/time_between_train_steps": 0.00612187385559082, "step": 1158}
{"info/global_step": 1159, "train_info/time_within_train_step": 27.848834991455078, "step": 1159}
{"train_info/time_between_train_steps": 0.0053653717041015625, "step": 1159}
{"info/global_step": 1160, "train_info/time_within_train_step": 27.8270845413208, "step": 1160}
{"train_info/time_between_train_steps": 0.005553483963012695, "step": 1160}
{"info/global_step": 1161, "train_info/time_within_train_step": 27.937666654586792, "step": 1161}
{"train_info/time_between_train_steps": 0.009557247161865234, "step": 1161}
{"info/global_step": 1162, "train_info/time_within_train_step": 27.889426469802856, "step": 1162}
{"train_info/time_between_train_steps": 0.005408048629760742, "step": 1162}
{"info/global_step": 1163, "train_info/time_within_train_step": 27.807403087615967, "step": 1163}
{"train_info/time_between_train_steps": 0.0055408477783203125, "step": 1163}
{"info/global_step": 1164, "train_info/time_within_train_step": 27.82313847541809, "step": 1164}
{"train_info/time_between_train_steps": 0.005788564682006836, "step": 1164}
{"info/global_step": 1165, "train_info/time_within_train_step": 27.812424182891846, "step": 1165}
{"train_info/time_between_train_steps": 0.005278825759887695, "step": 1165}
{"info/global_step": 1166, "train_info/time_within_train_step": 27.809709787368774, "step": 1166}
{"train_info/time_between_train_steps": 0.009994983673095703, "step": 1166}
{"info/global_step": 1167, "train_info/time_within_train_step": 27.82848834991455, "step": 1167}
{"train_info/time_between_train_steps": 0.005500316619873047, "step": 1167}
{"info/global_step": 1168, "train_info/time_within_train_step": 27.817094564437866, "step": 1168}
{"train_info/time_between_train_steps": 0.010876178741455078, "step": 1168}
{"info/global_step": 1169, "train_info/time_within_train_step": 28.011725902557373, "step": 1169}
{"train_info/time_between_train_steps": 0.005517721176147461, "step": 1169}
{"info/global_step": 1170, "train_info/time_within_train_step": 27.841821432113647, "step": 1170}
{"train_info/time_between_train_steps": 0.00686335563659668, "step": 1170}
{"info/global_step": 1171, "train_info/time_within_train_step": 27.825981616973877, "step": 1171}
{"train_info/time_between_train_steps": 0.005440235137939453, "step": 1171}
{"info/global_step": 1172, "train_info/time_within_train_step": 27.810929775238037, "step": 1172}
{"train_info/time_between_train_steps": 0.005632638931274414, "step": 1172}
{"info/global_step": 1173, "train_info/time_within_train_step": 27.806205987930298, "step": 1173}
{"train_info/time_between_train_steps": 0.005555629730224609, "step": 1173}
{"info/global_step": 1174, "train_info/time_within_train_step": 27.86811661720276, "step": 1174}
{"train_info/time_between_train_steps": 0.005770683288574219, "step": 1174}
{"info/global_step": 1175, "train_info/time_within_train_step": 27.852508068084717, "step": 1175}
{"train_info/time_between_train_steps": 0.005838632583618164, "step": 1175}
{"info/global_step": 1176, "train_info/time_within_train_step": 27.874561309814453, "step": 1176}
{"train_info/time_between_train_steps": 0.006274700164794922, "step": 1176}
{"train_info/time_between_train_steps": 5.651469469070435, "step": 1176}
{"info/global_step": 1177, "train_info/time_within_train_step": 27.818220615386963, "step": 1177}
{"train_info/time_between_train_steps": 0.0054509639739990234, "step": 1177}
{"info/global_step": 1178, "train_info/time_within_train_step": 27.972622394561768, "step": 1178}
{"train_info/time_between_train_steps": 0.010340690612792969, "step": 1178}
{"info/global_step": 1179, "train_info/time_within_train_step": 27.805202960968018, "step": 1179}
{"train_info/time_between_train_steps": 0.0056116580963134766, "step": 1179}
{"info/global_step": 1180, "train_info/time_within_train_step": 27.895092010498047, "step": 1180}
{"train_info/time_between_train_steps": 0.005451679229736328, "step": 1180}
{"info/global_step": 1181, "train_info/time_within_train_step": 27.863542079925537, "step": 1181}
{"train_info/time_between_train_steps": 0.005273342132568359, "step": 1181}
{"info/global_step": 1182, "train_info/time_within_train_step": 27.808309316635132, "step": 1182}
{"train_info/time_between_train_steps": 0.0073893070220947266, "step": 1182}
{"info/global_step": 1183, "train_info/time_within_train_step": 27.802002906799316, "step": 1183}
{"train_info/time_between_train_steps": 0.005164623260498047, "step": 1183}
{"info/global_step": 1184, "train_info/time_within_train_step": 27.897860527038574, "step": 1184}
{"train_info/time_between_train_steps": 0.005354166030883789, "step": 1184}
{"info/global_step": 1185, "train_info/time_within_train_step": 27.824500799179077, "step": 1185}
{"train_info/time_between_train_steps": 0.0053369998931884766, "step": 1185}
{"info/global_step": 1186, "train_info/time_within_train_step": 27.798107385635376, "step": 1186}
{"train_info/time_between_train_steps": 0.005399942398071289, "step": 1186}
{"info/global_step": 1187, "train_info/time_within_train_step": 27.82336711883545, "step": 1187}
{"train_info/time_between_train_steps": 0.0055332183837890625, "step": 1187}
{"info/global_step": 1188, "train_info/time_within_train_step": 27.878303050994873, "step": 1188}
{"train_info/time_between_train_steps": 0.005467414855957031, "step": 1188}
{"info/global_step": 1189, "train_info/time_within_train_step": 27.82072401046753, "step": 1189}
{"train_info/time_between_train_steps": 0.0052378177642822266, "step": 1189}
{"info/global_step": 1190, "train_info/time_within_train_step": 27.812041521072388, "step": 1190}
{"train_info/time_between_train_steps": 0.005345582962036133, "step": 1190}
{"info/global_step": 1191, "train_info/time_within_train_step": 27.769029140472412, "step": 1191}
{"train_info/time_between_train_steps": 0.005259990692138672, "step": 1191}
{"info/global_step": 1192, "train_info/time_within_train_step": 27.788742542266846, "step": 1192}
{"train_info/time_between_train_steps": 0.006676197052001953, "step": 1192}
{"info/global_step": 1193, "train_info/time_within_train_step": 27.83833622932434, "step": 1193}
{"train_info/time_between_train_steps": 0.005631208419799805, "step": 1193}
{"info/global_step": 1194, "train_info/time_within_train_step": 27.80966806411743, "step": 1194}
{"train_info/time_between_train_steps": 0.005423784255981445, "step": 1194}
{"info/global_step": 1195, "train_info/time_within_train_step": 27.84249782562256, "step": 1195}
{"train_info/time_between_train_steps": 0.011593818664550781, "step": 1195}
{"info/global_step": 1196, "train_info/time_within_train_step": 27.849767208099365, "step": 1196}
{"train_info/time_between_train_steps": 0.010730266571044922, "step": 1196}
{"info/global_step": 1197, "train_info/time_within_train_step": 27.838176727294922, "step": 1197}
{"train_info/time_between_train_steps": 0.008304357528686523, "step": 1197}
{"info/global_step": 1198, "train_info/time_within_train_step": 27.835001945495605, "step": 1198}
{"train_info/time_between_train_steps": 0.011017560958862305, "step": 1198}
{"info/global_step": 1199, "train_info/time_within_train_step": 27.881232976913452, "step": 1199}
{"train_info/time_between_train_steps": 0.011040687561035156, "step": 1199}
{"info/global_step": 1200, "train_info/time_within_train_step": 27.97308039665222, "step": 1200}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27358.0, "train_info/memory_max_reserved": 27358.0, "_timestamp": 1733896111, "_runtime": 34423}, "step": 1200}
{"logs": {"train/loss": 3.7334, "train/learning_rate": 0.0, "train/epoch": 49.02, "_timestamp": 1733896111, "_runtime": 34423}, "step": 1200}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27358.0, "train_info/memory_max_reserved": 27358.0, "_timestamp": 1733896114, "_runtime": 34426}, "step": 1200}
{"logs": {"train/train_runtime": 34426.6186, "train/train_samples_per_second": 17.847, "train/train_steps_per_second": 0.035, "train/total_flos": 3.21920667353088e+17, "train/train_loss": 4.8886952106157935, "train/epoch": 49.02, "_timestamp": 1733896114, "_runtime": 34426}, "step": 1200}
{"train_info": {"train_info/memory_allocated": 1922.4453125, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27358.0, "train_info/memory_max_reserved": 27358.0, "_timestamp": 1733896116, "_runtime": 34428}, "step": 1200}
{"logs": {"eval/loss": 5.034140110015869, "eval/runtime": 1.8285, "eval/samples_per_second": 50.861, "eval/steps_per_second": 3.281, "train/epoch": 49.02, "_timestamp": 1733896116, "_runtime": 34428}, "step": 1200}
{"train_info": {"train_info/memory_allocated": 1922.4453125, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27358.0, "train_info/memory_max_reserved": 27358.0, "_timestamp": 1733896116, "_runtime": 34428}, "step": 1200}
{"logs": {"eval//local/xiulyang/mission-impossible-language-models/training/babylm_dataset.py_loss": 5.034140110015869, "eval//local/xiulyang/mission-impossible-language-models/training/babylm_dataset.py_ppl": 153.567484678875, "eval//local/xiulyang/mission-impossible-language-models/training/babylm_dataset.py_runtime": 1.8285, "eval//local/xiulyang/mission-impossible-language-models/training/babylm_dataset.py_samples_per_second": 50.861, "train/epoch": 49.02, "_timestamp": 1733896116, "_runtime": 34428}, "step": 1200}