{"num_parameters": 108882432, "trainable_parameters": 108882432, "step": 0} {"train_info/time_between_train_steps": 2.5562856197357178, "step": 0} {"info/global_step": 1, "train_info/time_within_train_step": 6.218926906585693, "step": 1} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 3648.16943359375, "train_info/memory_reserved": 4092.0, "train_info/memory_max_reserved": 4092.0, "_timestamp": 1746252215, "_runtime": 34}, "step": 1} {"logs": {"train/loss": 10.3975, "train/learning_rate": 2e-06, "train/epoch": 0.0, "_timestamp": 1746252215, "_runtime": 34}, "step": 1} {"train_info/time_between_train_steps": 0.02504563331604004, "step": 1} {"info/global_step": 2, "train_info/time_within_train_step": 2.1660308837890625, "step": 2} {"train_info/time_between_train_steps": 0.0036873817443847656, "step": 2} {"info/global_step": 3, "train_info/time_within_train_step": 2.1711604595184326, "step": 3} {"train_info/time_between_train_steps": 0.003687620162963867, "step": 3} {"info/global_step": 4, "train_info/time_within_train_step": 2.171112060546875, "step": 4} {"train_info/time_between_train_steps": 0.003957986831665039, "step": 4} {"info/global_step": 5, "train_info/time_within_train_step": 2.1719939708709717, "step": 5} {"train_info/time_between_train_steps": 0.0036468505859375, "step": 5} {"info/global_step": 6, "train_info/time_within_train_step": 2.1748015880584717, "step": 6} {"train_info/time_between_train_steps": 0.003797769546508789, "step": 6} {"info/global_step": 7, "train_info/time_within_train_step": 2.1750102043151855, "step": 7} {"train_info/time_between_train_steps": 0.0037031173706054688, "step": 7} {"info/global_step": 8, "train_info/time_within_train_step": 2.1741299629211426, "step": 8} {"train_info/time_between_train_steps": 0.003702402114868164, "step": 8} {"info/global_step": 9, "train_info/time_within_train_step": 2.1706855297088623, "step": 9} {"train_info/time_between_train_steps": 0.0036482810974121094, "step": 9} {"info/global_step": 10, "train_info/time_within_train_step": 2.173098087310791, "step": 10} {"train_info/time_between_train_steps": 0.0037059783935546875, "step": 10} {"info/global_step": 11, "train_info/time_within_train_step": 2.1786398887634277, "step": 11} {"train_info/time_between_train_steps": 0.0036704540252685547, "step": 11} {"info/global_step": 12, "train_info/time_within_train_step": 2.2008121013641357, "step": 12} {"train_info/time_between_train_steps": 0.0038394927978515625, "step": 12} {"info/global_step": 13, "train_info/time_within_train_step": 2.278163194656372, "step": 13} {"train_info/time_between_train_steps": 0.0037894248962402344, "step": 13} {"info/global_step": 14, "train_info/time_within_train_step": 2.359151840209961, "step": 14} {"train_info/time_between_train_steps": 0.003903627395629883, "step": 14} {"info/global_step": 15, "train_info/time_within_train_step": 2.3585357666015625, "step": 15} {"train_info/time_between_train_steps": 0.0036427974700927734, "step": 15} {"info/global_step": 16, "train_info/time_within_train_step": 2.357976198196411, "step": 16} {"train_info/time_between_train_steps": 0.0036220550537109375, "step": 16} {"info/global_step": 17, "train_info/time_within_train_step": 2.358170986175537, "step": 17} {"train_info/time_between_train_steps": 0.003756284713745117, "step": 17} {"info/global_step": 18, "train_info/time_within_train_step": 2.3597633838653564, "step": 18} {"train_info/time_between_train_steps": 0.003701925277709961, "step": 18} {"info/global_step": 19, "train_info/time_within_train_step": 2.356710195541382, "step": 19} {"train_info/time_between_train_steps": 0.003506898880004883, "step": 19} {"info/global_step": 20, "train_info/time_within_train_step": 2.358927011489868, "step": 20} {"train_info/time_between_train_steps": 0.0036373138427734375, "step": 20} {"info/global_step": 21, "train_info/time_within_train_step": 2.3583486080169678, "step": 21} {"train_info/time_between_train_steps": 0.0036432743072509766, "step": 21} {"info/global_step": 22, "train_info/time_within_train_step": 2.358832836151123, "step": 22} {"train_info/time_between_train_steps": 0.003635883331298828, "step": 22} {"info/global_step": 23, "train_info/time_within_train_step": 2.3595216274261475, "step": 23} {"train_info/time_between_train_steps": 0.003796100616455078, "step": 23} {"info/global_step": 24, "train_info/time_within_train_step": 2.3596296310424805, "step": 24} {"train_info/time_between_train_steps": 0.0036857128143310547, "step": 24} {"info/global_step": 25, "train_info/time_within_train_step": 2.7242431640625, "step": 25} {"train_info/time_between_train_steps": 0.0035352706909179688, "step": 25} {"info/global_step": 26, "train_info/time_within_train_step": 2.3600566387176514, "step": 26} {"train_info/time_between_train_steps": 0.0034589767456054688, "step": 26} {"info/global_step": 27, "train_info/time_within_train_step": 2.3591721057891846, "step": 27} {"train_info/time_between_train_steps": 0.0034584999084472656, "step": 27} {"info/global_step": 28, "train_info/time_within_train_step": 2.37471342086792, "step": 28} {"train_info/time_between_train_steps": 0.0033376216888427734, "step": 28} {"info/global_step": 29, "train_info/time_within_train_step": 2.358891010284424, "step": 29} {"train_info/time_between_train_steps": 0.0034284591674804688, "step": 29} {"info/global_step": 30, "train_info/time_within_train_step": 2.3587961196899414, "step": 30} {"train_info/time_between_train_steps": 0.0033626556396484375, "step": 30} {"info/global_step": 31, "train_info/time_within_train_step": 2.3574225902557373, "step": 31} {"train_info/time_between_train_steps": 0.0035669803619384766, "step": 31} {"info/global_step": 32, "train_info/time_within_train_step": 2.3578569889068604, "step": 32} {"train_info/time_between_train_steps": 0.0033860206604003906, "step": 32} {"info/global_step": 33, "train_info/time_within_train_step": 2.3578715324401855, "step": 33} {"train_info/time_between_train_steps": 0.003470182418823242, "step": 33} {"info/global_step": 34, "train_info/time_within_train_step": 2.358719825744629, "step": 34} {"train_info/time_between_train_steps": 0.0033969879150390625, "step": 34} {"info/global_step": 35, "train_info/time_within_train_step": 2.3568410873413086, "step": 35} {"train_info/time_between_train_steps": 0.003292083740234375, "step": 35} {"info/global_step": 36, "train_info/time_within_train_step": 2.3567867279052734, "step": 36} {"train_info/time_between_train_steps": 0.0033173561096191406, "step": 36} {"info/global_step": 37, "train_info/time_within_train_step": 2.398298978805542, "step": 37} {"train_info/time_between_train_steps": 0.0032019615173339844, "step": 37} {"info/global_step": 38, "train_info/time_within_train_step": 2.357956886291504, "step": 38} {"train_info/time_between_train_steps": 0.0032660961151123047, "step": 38} {"info/global_step": 39, "train_info/time_within_train_step": 2.3582427501678467, "step": 39} {"train_info/time_between_train_steps": 0.0032198429107666016, "step": 39} {"info/global_step": 40, "train_info/time_within_train_step": 2.3565304279327393, "step": 40} {"train_info/time_between_train_steps": 0.0034019947052001953, "step": 40} {"info/global_step": 41, "train_info/time_within_train_step": 2.3580033779144287, "step": 41} {"train_info/time_between_train_steps": 0.0032911300659179688, "step": 41} {"info/global_step": 42, "train_info/time_within_train_step": 2.3597006797790527, "step": 42} {"train_info/time_between_train_steps": 0.0032873153686523438, "step": 42} {"info/global_step": 43, "train_info/time_within_train_step": 2.3565497398376465, "step": 43} {"train_info/time_between_train_steps": 0.003200531005859375, "step": 43} {"info/global_step": 44, "train_info/time_within_train_step": 2.3571279048919678, "step": 44} {"train_info/time_between_train_steps": 0.0032863616943359375, "step": 44} {"info/global_step": 45, "train_info/time_within_train_step": 2.359693765640259, "step": 45} {"train_info/time_between_train_steps": 0.0032875537872314453, "step": 45} {"info/global_step": 46, "train_info/time_within_train_step": 2.359010696411133, "step": 46} {"train_info/time_between_train_steps": 0.003412961959838867, "step": 46} {"info/global_step": 47, "train_info/time_within_train_step": 2.3592796325683594, "step": 47} {"train_info/time_between_train_steps": 0.0032880306243896484, "step": 47} {"info/global_step": 48, "train_info/time_within_train_step": 2.359915018081665, "step": 48} {"train_info/time_between_train_steps": 0.0035147666931152344, "step": 48} {"info/global_step": 49, "train_info/time_within_train_step": 2.538724899291992, "step": 49} {"train_info/time_between_train_steps": 0.003340005874633789, "step": 49} {"info/global_step": 50, "train_info/time_within_train_step": 2.3570311069488525, "step": 50} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 4918.0, "train_info/memory_max_reserved": 4918.0, "_timestamp": 1746252333, "_runtime": 152}, "step": 50} {"logs": {"train/loss": 8.2346, "train/learning_rate": 9.999999999999999e-05, "train/epoch": 0.02, "_timestamp": 1746252333, "_runtime": 152}, "step": 50} {"train_info/time_between_train_steps": 0.028275251388549805, "step": 50} {"info/global_step": 51, "train_info/time_within_train_step": 2.3586385250091553, "step": 51} {"train_info/time_between_train_steps": 0.0036869049072265625, "step": 51} {"info/global_step": 52, "train_info/time_within_train_step": 2.35776948928833, "step": 52} {"train_info/time_between_train_steps": 0.0032896995544433594, "step": 52} {"info/global_step": 53, "train_info/time_within_train_step": 2.358900308609009, "step": 53} {"train_info/time_between_train_steps": 0.003365755081176758, "step": 53} {"info/global_step": 54, "train_info/time_within_train_step": 2.3564250469207764, "step": 54} {"train_info/time_between_train_steps": 0.003409862518310547, "step": 54} {"info/global_step": 55, "train_info/time_within_train_step": 2.3614771366119385, "step": 55} {"train_info/time_between_train_steps": 0.003285646438598633, "step": 55} {"info/global_step": 56, "train_info/time_within_train_step": 2.356963872909546, "step": 56} {"train_info/time_between_train_steps": 0.003519296646118164, "step": 56} {"info/global_step": 57, "train_info/time_within_train_step": 2.3567886352539062, "step": 57} {"train_info/time_between_train_steps": 0.0033388137817382812, "step": 57} {"info/global_step": 58, "train_info/time_within_train_step": 2.358234167098999, "step": 58} {"train_info/time_between_train_steps": 0.0033075809478759766, "step": 58} {"info/global_step": 59, "train_info/time_within_train_step": 2.359684467315674, "step": 59} {"train_info/time_between_train_steps": 0.0033283233642578125, "step": 59} {"info/global_step": 60, "train_info/time_within_train_step": 2.357283592224121, "step": 60} {"train_info/time_between_train_steps": 0.0033254623413085938, "step": 60} {"info/global_step": 61, "train_info/time_within_train_step": 2.3575942516326904, "step": 61} {"train_info/time_between_train_steps": 0.003294706344604492, "step": 61} {"info/global_step": 62, "train_info/time_within_train_step": 2.357593059539795, "step": 62} {"train_info/time_between_train_steps": 0.003376007080078125, "step": 62} {"info/global_step": 63, "train_info/time_within_train_step": 2.4916725158691406, "step": 63} {"train_info/time_between_train_steps": 0.0032329559326171875, "step": 63} {"info/global_step": 64, "train_info/time_within_train_step": 2.358694314956665, "step": 64} {"train_info/time_between_train_steps": 0.003282308578491211, "step": 64} {"info/global_step": 65, "train_info/time_within_train_step": 2.358525514602661, "step": 65} {"train_info/time_between_train_steps": 0.0033409595489501953, "step": 65} {"info/global_step": 66, "train_info/time_within_train_step": 2.3558220863342285, "step": 66} {"train_info/time_between_train_steps": 0.00331878662109375, "step": 66} {"info/global_step": 67, "train_info/time_within_train_step": 2.3571419715881348, "step": 67} {"train_info/time_between_train_steps": 0.0034275054931640625, "step": 67} {"info/global_step": 68, "train_info/time_within_train_step": 2.3572885990142822, "step": 68} {"train_info/time_between_train_steps": 0.0034558773040771484, "step": 68} {"info/global_step": 69, "train_info/time_within_train_step": 2.3583250045776367, "step": 69} {"train_info/time_between_train_steps": 0.0033941268920898438, "step": 69} {"info/global_step": 70, "train_info/time_within_train_step": 2.3580381870269775, "step": 70} {"train_info/time_between_train_steps": 0.003459930419921875, "step": 70} {"info/global_step": 71, "train_info/time_within_train_step": 2.3575923442840576, "step": 71} {"train_info/time_between_train_steps": 0.0035059452056884766, "step": 71} {"info/global_step": 72, "train_info/time_within_train_step": 2.356790781021118, "step": 72} {"train_info/time_between_train_steps": 0.0032846927642822266, "step": 72} {"info/global_step": 73, "train_info/time_within_train_step": 2.562591552734375, "step": 73} {"train_info/time_between_train_steps": 0.0033485889434814453, "step": 73} {"info/global_step": 74, "train_info/time_within_train_step": 2.3580374717712402, "step": 74} {"train_info/time_between_train_steps": 0.0034127235412597656, "step": 74} {"info/global_step": 75, "train_info/time_within_train_step": 2.358046054840088, "step": 75} {"train_info/time_between_train_steps": 0.0032958984375, "step": 75} {"info/global_step": 76, "train_info/time_within_train_step": 2.359062671661377, "step": 76} {"train_info/time_between_train_steps": 0.0032885074615478516, "step": 76} {"info/global_step": 77, "train_info/time_within_train_step": 2.3609068393707275, "step": 77} {"train_info/time_between_train_steps": 0.0032923221588134766, "step": 77} {"info/global_step": 78, "train_info/time_within_train_step": 2.3596549034118652, "step": 78} {"train_info/time_between_train_steps": 0.003295421600341797, "step": 78} {"info/global_step": 79, "train_info/time_within_train_step": 2.363466262817383, "step": 79} {"train_info/time_between_train_steps": 0.0032739639282226562, "step": 79} {"info/global_step": 80, "train_info/time_within_train_step": 2.3595008850097656, "step": 80} {"train_info/time_between_train_steps": 0.003287076950073242, "step": 80} {"info/global_step": 81, "train_info/time_within_train_step": 2.3563828468322754, "step": 81} {"train_info/time_between_train_steps": 0.0033724308013916016, "step": 81} {"info/global_step": 82, "train_info/time_within_train_step": 2.3586714267730713, "step": 82} {"train_info/time_between_train_steps": 0.003451108932495117, "step": 82} {"info/global_step": 83, "train_info/time_within_train_step": 2.3598577976226807, "step": 83} {"train_info/time_between_train_steps": 0.003551006317138672, "step": 83} {"info/global_step": 84, "train_info/time_within_train_step": 2.3593568801879883, "step": 84} {"train_info/time_between_train_steps": 0.0034134387969970703, "step": 84} {"info/global_step": 85, "train_info/time_within_train_step": 2.3760030269622803, "step": 85} {"train_info/time_between_train_steps": 0.0037870407104492188, "step": 85} {"info/global_step": 86, "train_info/time_within_train_step": 2.36220645904541, "step": 86} {"train_info/time_between_train_steps": 0.0037550926208496094, "step": 86} {"info/global_step": 87, "train_info/time_within_train_step": 2.360752820968628, "step": 87} {"train_info/time_between_train_steps": 0.0037109851837158203, "step": 87} {"info/global_step": 88, "train_info/time_within_train_step": 2.3595099449157715, "step": 88} {"train_info/time_between_train_steps": 0.003762483596801758, "step": 88} {"info/global_step": 89, "train_info/time_within_train_step": 2.360595941543579, "step": 89} {"train_info/time_between_train_steps": 0.0038003921508789062, "step": 89} {"info/global_step": 90, "train_info/time_within_train_step": 2.360555410385132, "step": 90} {"train_info/time_between_train_steps": 0.0036895275115966797, "step": 90} {"info/global_step": 91, "train_info/time_within_train_step": 2.36079740524292, "step": 91} {"train_info/time_between_train_steps": 0.004001140594482422, "step": 91} {"info/global_step": 92, "train_info/time_within_train_step": 2.3612046241760254, "step": 92} {"train_info/time_between_train_steps": 0.003823995590209961, "step": 92} {"info/global_step": 93, "train_info/time_within_train_step": 2.3603813648223877, "step": 93} {"train_info/time_between_train_steps": 0.003645658493041992, "step": 93} {"info/global_step": 94, "train_info/time_within_train_step": 2.360269069671631, "step": 94} {"train_info/time_between_train_steps": 0.0037491321563720703, "step": 94} {"info/global_step": 95, "train_info/time_within_train_step": 2.3605387210845947, "step": 95} {"train_info/time_between_train_steps": 0.0036797523498535156, "step": 95} {"info/global_step": 96, "train_info/time_within_train_step": 2.3603734970092773, "step": 96} {"train_info/time_between_train_steps": 0.004075527191162109, "step": 96} {"info/global_step": 97, "train_info/time_within_train_step": 2.728877067565918, "step": 97} {"train_info/time_between_train_steps": 0.003408193588256836, "step": 97} {"info/global_step": 98, "train_info/time_within_train_step": 2.3615663051605225, "step": 98} {"train_info/time_between_train_steps": 0.0034410953521728516, "step": 98} {"info/global_step": 99, "train_info/time_within_train_step": 2.359947443008423, "step": 99} {"train_info/time_between_train_steps": 0.0034139156341552734, "step": 99} {"info/global_step": 100, "train_info/time_within_train_step": 2.358921527862549, "step": 100} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 4918.0, "train_info/memory_max_reserved": 4918.0, "_timestamp": 1746252457, "_runtime": 276}, "step": 100} {"logs": {"train/loss": 6.1398, "train/learning_rate": 0.00019999999999999998, "train/epoch": 0.03, "_timestamp": 1746252457, "_runtime": 276}, "step": 100} {"train_info/time_between_train_steps": 18.67257332801819, "step": 100} {"info/global_step": 101, "train_info/time_within_train_step": 2.2059874534606934, "step": 101} {"train_info/time_between_train_steps": 0.0033648014068603516, "step": 101} {"info/global_step": 102, "train_info/time_within_train_step": 2.1826255321502686, "step": 102} {"train_info/time_between_train_steps": 0.003467559814453125, "step": 102} {"info/global_step": 103, "train_info/time_within_train_step": 2.193572521209717, "step": 103} {"train_info/time_between_train_steps": 0.003621816635131836, "step": 103} {"info/global_step": 104, "train_info/time_within_train_step": 2.338738203048706, "step": 104} {"train_info/time_between_train_steps": 0.0038285255432128906, "step": 104} {"info/global_step": 105, "train_info/time_within_train_step": 2.360356330871582, "step": 105} {"train_info/time_between_train_steps": 0.0036911964416503906, "step": 105} {"info/global_step": 106, "train_info/time_within_train_step": 2.3589491844177246, "step": 106} {"train_info/time_between_train_steps": 0.003839254379272461, "step": 106} {"info/global_step": 107, "train_info/time_within_train_step": 2.360605478286743, "step": 107} {"train_info/time_between_train_steps": 0.0036420822143554688, "step": 107} {"info/global_step": 108, "train_info/time_within_train_step": 2.3625431060791016, "step": 108} {"train_info/time_between_train_steps": 0.0036461353302001953, "step": 108} {"info/global_step": 109, "train_info/time_within_train_step": 2.359623908996582, "step": 109} {"train_info/time_between_train_steps": 0.003646373748779297, "step": 109} {"info/global_step": 110, "train_info/time_within_train_step": 2.3580732345581055, "step": 110} {"train_info/time_between_train_steps": 0.0035512447357177734, "step": 110} {"info/global_step": 111, "train_info/time_within_train_step": 2.361424684524536, "step": 111} {"train_info/time_between_train_steps": 0.0034911632537841797, "step": 111} {"info/global_step": 112, "train_info/time_within_train_step": 2.3590712547302246, "step": 112} {"train_info/time_between_train_steps": 0.003815174102783203, "step": 112} {"info/global_step": 113, "train_info/time_within_train_step": 2.3600986003875732, "step": 113} {"train_info/time_between_train_steps": 0.003571748733520508, "step": 113} {"info/global_step": 114, "train_info/time_within_train_step": 2.3601365089416504, "step": 114} {"train_info/time_between_train_steps": 0.0035746097564697266, "step": 114} {"info/global_step": 115, "train_info/time_within_train_step": 2.3577699661254883, "step": 115} {"train_info/time_between_train_steps": 0.0035483837127685547, "step": 115} {"info/global_step": 116, "train_info/time_within_train_step": 2.3612005710601807, "step": 116} {"train_info/time_between_train_steps": 0.003669261932373047, "step": 116} {"info/global_step": 117, "train_info/time_within_train_step": 2.3596031665802, "step": 117} {"train_info/time_between_train_steps": 0.0034742355346679688, "step": 117} {"info/global_step": 118, "train_info/time_within_train_step": 2.360320806503296, "step": 118} {"train_info/time_between_train_steps": 0.003568887710571289, "step": 118} {"info/global_step": 119, "train_info/time_within_train_step": 2.3609910011291504, "step": 119} {"train_info/time_between_train_steps": 0.0035173892974853516, "step": 119} {"info/global_step": 120, "train_info/time_within_train_step": 2.3609743118286133, "step": 120} {"train_info/time_between_train_steps": 0.003685474395751953, "step": 120} {"info/global_step": 121, "train_info/time_within_train_step": 2.699951410293579, "step": 121} {"train_info/time_between_train_steps": 0.003281831741333008, "step": 121} {"info/global_step": 122, "train_info/time_within_train_step": 2.359464168548584, "step": 122} {"train_info/time_between_train_steps": 0.003361940383911133, "step": 122} {"info/global_step": 123, "train_info/time_within_train_step": 2.358849287033081, "step": 123} {"train_info/time_between_train_steps": 0.0034177303314208984, "step": 123} {"info/global_step": 124, "train_info/time_within_train_step": 2.358597755432129, "step": 124} {"train_info/time_between_train_steps": 0.003386259078979492, "step": 124} {"info/global_step": 125, "train_info/time_within_train_step": 2.357332706451416, "step": 125} {"train_info/time_between_train_steps": 0.1390533447265625, "step": 125} {"info/global_step": 126, "train_info/time_within_train_step": 2.3691930770874023, "step": 126} {"train_info/time_between_train_steps": 0.0033156871795654297, "step": 126} {"info/global_step": 127, "train_info/time_within_train_step": 2.3688626289367676, "step": 127} {"train_info/time_between_train_steps": 0.003267049789428711, "step": 127} {"info/global_step": 128, "train_info/time_within_train_step": 2.3585541248321533, "step": 128} {"train_info/time_between_train_steps": 0.0032379627227783203, "step": 128} {"info/global_step": 129, "train_info/time_within_train_step": 2.359004020690918, "step": 129} {"train_info/time_between_train_steps": 0.0031974315643310547, "step": 129} {"info/global_step": 130, "train_info/time_within_train_step": 2.3584036827087402, "step": 130} {"train_info/time_between_train_steps": 0.003270387649536133, "step": 130} {"info/global_step": 131, "train_info/time_within_train_step": 2.3590211868286133, "step": 131} {"train_info/time_between_train_steps": 0.0032906532287597656, "step": 131} {"info/global_step": 132, "train_info/time_within_train_step": 2.3570637702941895, "step": 132} {"train_info/time_between_train_steps": 0.0033922195434570312, "step": 132} {"info/global_step": 133, "train_info/time_within_train_step": 2.3584134578704834, "step": 133} {"train_info/time_between_train_steps": 0.0034127235412597656, "step": 133} {"info/global_step": 134, "train_info/time_within_train_step": 2.360975980758667, "step": 134} {"train_info/time_between_train_steps": 0.0033206939697265625, "step": 134} {"info/global_step": 135, "train_info/time_within_train_step": 2.359583616256714, "step": 135} {"train_info/time_between_train_steps": 0.003258228302001953, "step": 135} {"info/global_step": 136, "train_info/time_within_train_step": 2.360203266143799, "step": 136} {"train_info/time_between_train_steps": 0.0035219192504882812, "step": 136} {"info/global_step": 137, "train_info/time_within_train_step": 2.357349395751953, "step": 137} {"train_info/time_between_train_steps": 0.0031960010528564453, "step": 137} {"info/global_step": 138, "train_info/time_within_train_step": 2.3569600582122803, "step": 138} {"train_info/time_between_train_steps": 0.003374338150024414, "step": 138} {"info/global_step": 139, "train_info/time_within_train_step": 2.3560361862182617, "step": 139} {"train_info/time_between_train_steps": 0.003468751907348633, "step": 139} {"info/global_step": 140, "train_info/time_within_train_step": 2.357257604598999, "step": 140} {"train_info/time_between_train_steps": 0.003557443618774414, "step": 140} {"info/global_step": 141, "train_info/time_within_train_step": 2.358605146408081, "step": 141} {"train_info/time_between_train_steps": 0.003384828567504883, "step": 141} {"info/global_step": 142, "train_info/time_within_train_step": 2.358398675918579, "step": 142} {"train_info/time_between_train_steps": 0.003256559371948242, "step": 142} {"info/global_step": 143, "train_info/time_within_train_step": 2.357011556625366, "step": 143} {"train_info/time_between_train_steps": 0.0041162967681884766, "step": 143} {"info/global_step": 144, "train_info/time_within_train_step": 2.358851432800293, "step": 144} {"train_info/time_between_train_steps": 0.0034651756286621094, "step": 144} {"info/global_step": 145, "train_info/time_within_train_step": 2.6077442169189453, "step": 145} {"train_info/time_between_train_steps": 0.003582477569580078, "step": 145} {"info/global_step": 146, "train_info/time_within_train_step": 2.358902931213379, "step": 146} {"train_info/time_between_train_steps": 0.0036139488220214844, "step": 146} {"info/global_step": 147, "train_info/time_within_train_step": 2.359074592590332, "step": 147} {"train_info/time_between_train_steps": 0.003913402557373047, "step": 147} {"info/global_step": 148, "train_info/time_within_train_step": 2.3597326278686523, "step": 148} {"train_info/time_between_train_steps": 0.0036025047302246094, "step": 148} {"info/global_step": 149, "train_info/time_within_train_step": 2.3590002059936523, "step": 149} {"train_info/time_between_train_steps": 0.0037436485290527344, "step": 149} {"info/global_step": 150, "train_info/time_within_train_step": 2.358922243118286, "step": 150} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 4918.0, "train_info/memory_max_reserved": 4918.0, "_timestamp": 1746252596, "_runtime": 415}, "step": 150} {"logs": {"train/loss": 5.5284, "train/learning_rate": 0.0003, "train/epoch": 0.05, "_timestamp": 1746252596, "_runtime": 415}, "step": 150} {"train_info/time_between_train_steps": 0.40411972999572754, "step": 150} {"info/global_step": 151, "train_info/time_within_train_step": 2.3579585552215576, "step": 151} {"train_info/time_between_train_steps": 0.0035872459411621094, "step": 151} {"info/global_step": 152, "train_info/time_within_train_step": 2.495504856109619, "step": 152} {"train_info/time_between_train_steps": 0.0036339759826660156, "step": 152} {"info/global_step": 153, "train_info/time_within_train_step": 2.3585164546966553, "step": 153} {"train_info/time_between_train_steps": 0.003932476043701172, "step": 153} {"info/global_step": 154, "train_info/time_within_train_step": 2.357975959777832, "step": 154} {"train_info/time_between_train_steps": 0.003429889678955078, "step": 154} {"info/global_step": 155, "train_info/time_within_train_step": 2.3599584102630615, "step": 155} {"train_info/time_between_train_steps": 0.003664255142211914, "step": 155} {"info/global_step": 156, "train_info/time_within_train_step": 2.361062526702881, "step": 156} {"train_info/time_between_train_steps": 0.003946065902709961, "step": 156} {"info/global_step": 157, "train_info/time_within_train_step": 2.3576085567474365, "step": 157} {"train_info/time_between_train_steps": 0.0036504268646240234, "step": 157} {"info/global_step": 158, "train_info/time_within_train_step": 2.358046770095825, "step": 158} {"train_info/time_between_train_steps": 0.0035631656646728516, "step": 158} {"info/global_step": 159, "train_info/time_within_train_step": 2.3583202362060547, "step": 159} {"train_info/time_between_train_steps": 0.003697633743286133, "step": 159} {"info/global_step": 160, "train_info/time_within_train_step": 2.3574793338775635, "step": 160} {"train_info/time_between_train_steps": 0.003966093063354492, "step": 160} {"info/global_step": 161, "train_info/time_within_train_step": 2.3582420349121094, "step": 161} {"train_info/time_between_train_steps": 0.0038900375366210938, "step": 161} {"info/global_step": 162, "train_info/time_within_train_step": 2.354360580444336, "step": 162} {"train_info/time_between_train_steps": 0.0037860870361328125, "step": 162} {"info/global_step": 163, "train_info/time_within_train_step": 2.3561863899230957, "step": 163} {"train_info/time_between_train_steps": 0.0037755966186523438, "step": 163} {"info/global_step": 164, "train_info/time_within_train_step": 2.3577158451080322, "step": 164} {"train_info/time_between_train_steps": 0.003887176513671875, "step": 164} {"info/global_step": 165, "train_info/time_within_train_step": 2.358243227005005, "step": 165} {"train_info/time_between_train_steps": 0.0038299560546875, "step": 165} {"info/global_step": 166, "train_info/time_within_train_step": 2.3572421073913574, "step": 166} {"train_info/time_between_train_steps": 0.0038726329803466797, "step": 166} {"info/global_step": 167, "train_info/time_within_train_step": 2.357517957687378, "step": 167} {"train_info/time_between_train_steps": 0.003651142120361328, "step": 167} {"info/global_step": 168, "train_info/time_within_train_step": 2.35854434967041, "step": 168} {"train_info/time_between_train_steps": 0.003584146499633789, "step": 168} {"info/global_step": 169, "train_info/time_within_train_step": 2.6895506381988525, "step": 169} {"train_info/time_between_train_steps": 0.0033113956451416016, "step": 169} {"info/global_step": 170, "train_info/time_within_train_step": 2.3592827320098877, "step": 170} {"train_info/time_between_train_steps": 0.0033283233642578125, "step": 170} {"info/global_step": 171, "train_info/time_within_train_step": 2.358015298843384, "step": 171} {"train_info/time_between_train_steps": 0.0032622814178466797, "step": 171} {"info/global_step": 172, "train_info/time_within_train_step": 2.3584892749786377, "step": 172} {"train_info/time_between_train_steps": 0.0032949447631835938, "step": 172} {"info/global_step": 173, "train_info/time_within_train_step": 2.3588552474975586, "step": 173} {"train_info/time_between_train_steps": 0.003278970718383789, "step": 173} {"info/global_step": 174, "train_info/time_within_train_step": 2.355687379837036, "step": 174} {"train_info/time_between_train_steps": 0.0034351348876953125, "step": 174} {"info/global_step": 175, "train_info/time_within_train_step": 2.358598232269287, "step": 175} {"train_info/time_between_train_steps": 0.0034177303314208984, "step": 175} {"info/global_step": 176, "train_info/time_within_train_step": 2.3595690727233887, "step": 176} {"train_info/time_between_train_steps": 0.003384828567504883, "step": 176} {"info/global_step": 177, "train_info/time_within_train_step": 2.3597609996795654, "step": 177} {"train_info/time_between_train_steps": 0.0035452842712402344, "step": 177} {"info/global_step": 178, "train_info/time_within_train_step": 2.3644824028015137, "step": 178} {"train_info/time_between_train_steps": 0.0033235549926757812, "step": 178} {"info/global_step": 179, "train_info/time_within_train_step": 2.3605329990386963, "step": 179} {"train_info/time_between_train_steps": 0.003412961959838867, "step": 179} {"info/global_step": 180, "train_info/time_within_train_step": 2.3594319820404053, "step": 180} {"train_info/time_between_train_steps": 0.0034208297729492188, "step": 180} {"info/global_step": 181, "train_info/time_within_train_step": 2.3588616847991943, "step": 181} {"train_info/time_between_train_steps": 0.0035905838012695312, "step": 181} {"info/global_step": 182, "train_info/time_within_train_step": 2.4221067428588867, "step": 182} {"train_info/time_between_train_steps": 0.0032961368560791016, "step": 182} {"info/global_step": 183, "train_info/time_within_train_step": 2.360305070877075, "step": 183} {"train_info/time_between_train_steps": 0.003354787826538086, "step": 183} {"info/global_step": 184, "train_info/time_within_train_step": 2.3595564365386963, "step": 184} {"train_info/time_between_train_steps": 0.0033614635467529297, "step": 184} {"info/global_step": 185, "train_info/time_within_train_step": 2.3599138259887695, "step": 185} {"train_info/time_between_train_steps": 0.0034143924713134766, "step": 185} {"info/global_step": 186, "train_info/time_within_train_step": 2.359727621078491, "step": 186} {"train_info/time_between_train_steps": 0.0034036636352539062, "step": 186} {"info/global_step": 187, "train_info/time_within_train_step": 2.360011339187622, "step": 187} {"train_info/time_between_train_steps": 0.003515005111694336, "step": 187} {"info/global_step": 188, "train_info/time_within_train_step": 2.506488561630249, "step": 188} {"train_info/time_between_train_steps": 0.003432035446166992, "step": 188} {"info/global_step": 189, "train_info/time_within_train_step": 2.360107421875, "step": 189} {"train_info/time_between_train_steps": 0.0033197402954101562, "step": 189} {"info/global_step": 190, "train_info/time_within_train_step": 2.360276937484741, "step": 190} {"train_info/time_between_train_steps": 0.0032939910888671875, "step": 190} {"info/global_step": 191, "train_info/time_within_train_step": 2.3599064350128174, "step": 191} {"train_info/time_between_train_steps": 0.003282785415649414, "step": 191} {"info/global_step": 192, "train_info/time_within_train_step": 2.3640103340148926, "step": 192} {"train_info/time_between_train_steps": 0.0034711360931396484, "step": 192} {"info/global_step": 193, "train_info/time_within_train_step": 2.5512497425079346, "step": 193} {"train_info/time_between_train_steps": 0.0032498836517333984, "step": 193} {"info/global_step": 194, "train_info/time_within_train_step": 2.3595809936523438, "step": 194} {"train_info/time_between_train_steps": 0.0032968521118164062, "step": 194} {"info/global_step": 195, "train_info/time_within_train_step": 2.3603882789611816, "step": 195} {"train_info/time_between_train_steps": 0.003263711929321289, "step": 195} {"info/global_step": 196, "train_info/time_within_train_step": 2.356394052505493, "step": 196} {"train_info/time_between_train_steps": 0.003242015838623047, "step": 196} {"info/global_step": 197, "train_info/time_within_train_step": 2.358369827270508, "step": 197} {"train_info/time_between_train_steps": 0.003430604934692383, "step": 197} {"info/global_step": 198, "train_info/time_within_train_step": 2.361069917678833, "step": 198} {"train_info/time_between_train_steps": 0.0035240650177001953, "step": 198} {"info/global_step": 199, "train_info/time_within_train_step": 2.3603897094726562, "step": 199} {"train_info/time_between_train_steps": 0.0034084320068359375, "step": 199} {"info/global_step": 200, "train_info/time_within_train_step": 2.360145092010498, "step": 200} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 4918.0, "train_info/memory_max_reserved": 4918.0, "_timestamp": 1746252721, "_runtime": 540}, "step": 200} {"logs": {"train/loss": 5.2946, "train/learning_rate": 0.00039999999999999996, "train/epoch": 0.07, "_timestamp": 1746252721, "_runtime": 540}, "step": 200} {"train_info/time_between_train_steps": 22.969948291778564, "step": 200} {"info/global_step": 201, "train_info/time_within_train_step": 2.2107512950897217, "step": 201} {"train_info/time_between_train_steps": 0.003382444381713867, "step": 201} {"info/global_step": 202, "train_info/time_within_train_step": 2.191628932952881, "step": 202} {"train_info/time_between_train_steps": 0.0034542083740234375, "step": 202} {"info/global_step": 203, "train_info/time_within_train_step": 2.1814119815826416, "step": 203} {"train_info/time_between_train_steps": 0.0033593177795410156, "step": 203} {"info/global_step": 204, "train_info/time_within_train_step": 2.308715581893921, "step": 204} {"train_info/time_between_train_steps": 0.003142833709716797, "step": 204} {"info/global_step": 205, "train_info/time_within_train_step": 2.3486270904541016, "step": 205} {"train_info/time_between_train_steps": 0.003336191177368164, "step": 205} {"info/global_step": 206, "train_info/time_within_train_step": 2.3528428077697754, "step": 206} {"train_info/time_between_train_steps": 0.003402233123779297, "step": 206} {"info/global_step": 207, "train_info/time_within_train_step": 2.3610129356384277, "step": 207} {"train_info/time_between_train_steps": 0.003293275833129883, "step": 207} {"info/global_step": 208, "train_info/time_within_train_step": 2.356637477874756, "step": 208} {"train_info/time_between_train_steps": 0.0031909942626953125, "step": 208} {"info/global_step": 209, "train_info/time_within_train_step": 2.3708465099334717, "step": 209} {"train_info/time_between_train_steps": 0.003178834915161133, "step": 209} {"info/global_step": 210, "train_info/time_within_train_step": 2.3563029766082764, "step": 210} {"train_info/time_between_train_steps": 0.0031766891479492188, "step": 210} {"info/global_step": 211, "train_info/time_within_train_step": 2.3559114933013916, "step": 211} {"train_info/time_between_train_steps": 0.003186464309692383, "step": 211} {"info/global_step": 212, "train_info/time_within_train_step": 2.356658458709717, "step": 212} {"train_info/time_between_train_steps": 0.003260374069213867, "step": 212} {"info/global_step": 213, "train_info/time_within_train_step": 2.3567631244659424, "step": 213} {"train_info/time_between_train_steps": 0.003368377685546875, "step": 213} {"info/global_step": 214, "train_info/time_within_train_step": 2.3704464435577393, "step": 214} {"train_info/time_between_train_steps": 0.0034520626068115234, "step": 214} {"info/global_step": 215, "train_info/time_within_train_step": 2.3557851314544678, "step": 215} {"train_info/time_between_train_steps": 0.0032775402069091797, "step": 215} {"info/global_step": 216, "train_info/time_within_train_step": 2.3569960594177246, "step": 216} {"train_info/time_between_train_steps": 0.003517627716064453, "step": 216} {"info/global_step": 217, "train_info/time_within_train_step": 2.3573696613311768, "step": 217} {"train_info/time_between_train_steps": 0.003307342529296875, "step": 217} {"info/global_step": 218, "train_info/time_within_train_step": 2.5998523235321045, "step": 218} {"train_info/time_between_train_steps": 0.0036270618438720703, "step": 218} {"info/global_step": 219, "train_info/time_within_train_step": 2.3570499420166016, "step": 219} {"train_info/time_between_train_steps": 0.0034942626953125, "step": 219} {"info/global_step": 220, "train_info/time_within_train_step": 2.3575737476348877, "step": 220} {"train_info/time_between_train_steps": 0.0037856101989746094, "step": 220} {"info/global_step": 221, "train_info/time_within_train_step": 2.3584773540496826, "step": 221} {"train_info/time_between_train_steps": 0.0036623477935791016, "step": 221} {"info/global_step": 222, "train_info/time_within_train_step": 2.3570706844329834, "step": 222} {"train_info/time_between_train_steps": 0.0035889148712158203, "step": 222} {"info/global_step": 223, "train_info/time_within_train_step": 2.358114004135132, "step": 223} {"train_info/time_between_train_steps": 0.003552675247192383, "step": 223} {"info/global_step": 224, "train_info/time_within_train_step": 2.357825994491577, "step": 224} {"train_info/time_between_train_steps": 0.0037488937377929688, "step": 224} {"info/global_step": 225, "train_info/time_within_train_step": 2.356069326400757, "step": 225} {"train_info/time_between_train_steps": 0.0035400390625, "step": 225} {"info/global_step": 226, "train_info/time_within_train_step": 2.357100248336792, "step": 226} {"train_info/time_between_train_steps": 0.003669261932373047, "step": 226} {"info/global_step": 227, "train_info/time_within_train_step": 2.3569116592407227, "step": 227} {"train_info/time_between_train_steps": 0.0036611557006835938, "step": 227} {"info/global_step": 228, "train_info/time_within_train_step": 2.3586041927337646, "step": 228} {"train_info/time_between_train_steps": 0.003618001937866211, "step": 228} {"info/global_step": 229, "train_info/time_within_train_step": 2.3578574657440186, "step": 229} {"train_info/time_between_train_steps": 0.003806591033935547, "step": 229} {"info/global_step": 230, "train_info/time_within_train_step": 2.3573501110076904, "step": 230} {"train_info/time_between_train_steps": 0.003590822219848633, "step": 230} {"info/global_step": 231, "train_info/time_within_train_step": 2.357936143875122, "step": 231} {"train_info/time_between_train_steps": 0.0038127899169921875, "step": 231} {"info/global_step": 232, "train_info/time_within_train_step": 2.357916831970215, "step": 232} {"train_info/time_between_train_steps": 0.0037813186645507812, "step": 232} {"info/global_step": 233, "train_info/time_within_train_step": 2.3567423820495605, "step": 233} {"train_info/time_between_train_steps": 0.003750324249267578, "step": 233} {"info/global_step": 234, "train_info/time_within_train_step": 2.3566417694091797, "step": 234} {"train_info/time_between_train_steps": 0.0037648677825927734, "step": 234} {"info/global_step": 235, "train_info/time_within_train_step": 2.3566696643829346, "step": 235} {"train_info/time_between_train_steps": 0.003692150115966797, "step": 235} {"info/global_step": 236, "train_info/time_within_train_step": 2.356415271759033, "step": 236} {"train_info/time_between_train_steps": 0.0036873817443847656, "step": 236} {"info/global_step": 237, "train_info/time_within_train_step": 2.3568942546844482, "step": 237} {"train_info/time_between_train_steps": 0.003496885299682617, "step": 237} {"info/global_step": 238, "train_info/time_within_train_step": 2.357494831085205, "step": 238} {"train_info/time_between_train_steps": 0.003489255905151367, "step": 238} {"info/global_step": 239, "train_info/time_within_train_step": 2.3571207523345947, "step": 239} {"train_info/time_between_train_steps": 0.0037107467651367188, "step": 239} {"info/global_step": 240, "train_info/time_within_train_step": 2.3571619987487793, "step": 240} {"train_info/time_between_train_steps": 0.0037000179290771484, "step": 240} {"info/global_step": 241, "train_info/time_within_train_step": 2.357095718383789, "step": 241} {"train_info/time_between_train_steps": 0.003447294235229492, "step": 241} {"info/global_step": 242, "train_info/time_within_train_step": 2.689629077911377, "step": 242} {"train_info/time_between_train_steps": 0.0032835006713867188, "step": 242} {"info/global_step": 243, "train_info/time_within_train_step": 2.355384588241577, "step": 243} {"train_info/time_between_train_steps": 0.003239870071411133, "step": 243} {"info/global_step": 244, "train_info/time_within_train_step": 2.3551018238067627, "step": 244} {"train_info/time_between_train_steps": 0.003462076187133789, "step": 244} {"info/global_step": 245, "train_info/time_within_train_step": 2.3564255237579346, "step": 245} {"train_info/time_between_train_steps": 0.0033855438232421875, "step": 245} {"info/global_step": 246, "train_info/time_within_train_step": 2.3553457260131836, "step": 246} {"train_info/time_between_train_steps": 0.0032181739807128906, "step": 246} {"info/global_step": 247, "train_info/time_within_train_step": 2.3557305335998535, "step": 247} {"train_info/time_between_train_steps": 0.0031936168670654297, "step": 247} {"info/global_step": 248, "train_info/time_within_train_step": 2.3555328845977783, "step": 248} {"train_info/time_between_train_steps": 0.0034193992614746094, "step": 248} {"info/global_step": 249, "train_info/time_within_train_step": 2.3562960624694824, "step": 249} {"train_info/time_between_train_steps": 0.0032346248626708984, "step": 249} {"info/global_step": 250, "train_info/time_within_train_step": 3.140587329864502, "step": 250} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 4918.0, "train_info/memory_max_reserved": 4918.0, "_timestamp": 1746252864, "_runtime": 683}, "step": 250} {"logs": {"train/loss": 5.1821, "train/learning_rate": 0.0005, "train/epoch": 0.08, "_timestamp": 1746252864, "_runtime": 683}, "step": 250} {"train_info/time_between_train_steps": 0.1665053367614746, "step": 250} {"info/global_step": 251, "train_info/time_within_train_step": 2.3556275367736816, "step": 251} {"train_info/time_between_train_steps": 0.0032567977905273438, "step": 251} {"info/global_step": 252, "train_info/time_within_train_step": 2.355294942855835, "step": 252} {"train_info/time_between_train_steps": 0.003253936767578125, "step": 252} {"info/global_step": 253, "train_info/time_within_train_step": 2.3553929328918457, "step": 253} {"train_info/time_between_train_steps": 0.0031855106353759766, "step": 253} {"info/global_step": 254, "train_info/time_within_train_step": 2.3551881313323975, "step": 254} {"train_info/time_between_train_steps": 0.0032014846801757812, "step": 254} {"info/global_step": 255, "train_info/time_within_train_step": 2.3560259342193604, "step": 255} {"train_info/time_between_train_steps": 0.0031783580780029297, "step": 255} {"info/global_step": 256, "train_info/time_within_train_step": 2.3555548191070557, "step": 256} {"train_info/time_between_train_steps": 0.003219127655029297, "step": 256} {"info/global_step": 257, "train_info/time_within_train_step": 2.3566627502441406, "step": 257} {"train_info/time_between_train_steps": 0.003208637237548828, "step": 257} {"info/global_step": 258, "train_info/time_within_train_step": 2.35636830329895, "step": 258} {"train_info/time_between_train_steps": 0.003263235092163086, "step": 258} {"info/global_step": 259, "train_info/time_within_train_step": 2.356475353240967, "step": 259} {"train_info/time_between_train_steps": 0.0032470226287841797, "step": 259} {"info/global_step": 260, "train_info/time_within_train_step": 2.356205940246582, "step": 260} {"train_info/time_between_train_steps": 0.0031948089599609375, "step": 260} {"info/global_step": 261, "train_info/time_within_train_step": 2.361158847808838, "step": 261} {"train_info/time_between_train_steps": 0.0031921863555908203, "step": 261} {"info/global_step": 262, "train_info/time_within_train_step": 2.3553812503814697, "step": 262} {"train_info/time_between_train_steps": 0.003209829330444336, "step": 262} {"info/global_step": 263, "train_info/time_within_train_step": 2.3549718856811523, "step": 263} {"train_info/time_between_train_steps": 0.0032122135162353516, "step": 263} {"info/global_step": 264, "train_info/time_within_train_step": 2.354912281036377, "step": 264} {"train_info/time_between_train_steps": 0.0032765865325927734, "step": 264} {"info/global_step": 265, "train_info/time_within_train_step": 2.3557913303375244, "step": 265} {"train_info/time_between_train_steps": 0.003234386444091797, "step": 265} {"info/global_step": 266, "train_info/time_within_train_step": 2.5487351417541504, "step": 266} {"train_info/time_between_train_steps": 0.0032079219818115234, "step": 266} {"info/global_step": 267, "train_info/time_within_train_step": 2.355052947998047, "step": 267} {"train_info/time_between_train_steps": 0.003215312957763672, "step": 267} {"info/global_step": 268, "train_info/time_within_train_step": 2.355787515640259, "step": 268} {"train_info/time_between_train_steps": 0.0031576156616210938, "step": 268} {"info/global_step": 269, "train_info/time_within_train_step": 2.3550198078155518, "step": 269} {"train_info/time_between_train_steps": 0.0031881332397460938, "step": 269} {"info/global_step": 270, "train_info/time_within_train_step": 2.356394052505493, "step": 270} {"train_info/time_between_train_steps": 0.0031998157501220703, "step": 270} {"info/global_step": 271, "train_info/time_within_train_step": 2.3554954528808594, "step": 271} {"train_info/time_between_train_steps": 0.003188610076904297, "step": 271} {"info/global_step": 272, "train_info/time_within_train_step": 2.3553664684295654, "step": 272} {"train_info/time_between_train_steps": 0.0032193660736083984, "step": 272} {"info/global_step": 273, "train_info/time_within_train_step": 2.355125904083252, "step": 273} {"train_info/time_between_train_steps": 0.0032520294189453125, "step": 273} {"info/global_step": 274, "train_info/time_within_train_step": 2.3551859855651855, "step": 274} {"train_info/time_between_train_steps": 0.003192901611328125, "step": 274} {"info/global_step": 275, "train_info/time_within_train_step": 2.3568830490112305, "step": 275} {"train_info/time_between_train_steps": 0.0031447410583496094, "step": 275} {"info/global_step": 276, "train_info/time_within_train_step": 2.356086015701294, "step": 276} {"train_info/time_between_train_steps": 0.003299713134765625, "step": 276} {"info/global_step": 277, "train_info/time_within_train_step": 2.3558175563812256, "step": 277} {"train_info/time_between_train_steps": 0.003287076950073242, "step": 277} {"info/global_step": 278, "train_info/time_within_train_step": 2.355665683746338, "step": 278} {"train_info/time_between_train_steps": 0.0032317638397216797, "step": 278} {"info/global_step": 279, "train_info/time_within_train_step": 2.3565025329589844, "step": 279} {"train_info/time_between_train_steps": 0.003174304962158203, "step": 279} {"info/global_step": 280, "train_info/time_within_train_step": 2.3561553955078125, "step": 280} {"train_info/time_between_train_steps": 0.003162384033203125, "step": 280} {"info/global_step": 281, "train_info/time_within_train_step": 2.3551974296569824, "step": 281} {"train_info/time_between_train_steps": 0.0031714439392089844, "step": 281} {"info/global_step": 282, "train_info/time_within_train_step": 2.355022668838501, "step": 282} {"train_info/time_between_train_steps": 0.0032541751861572266, "step": 282} {"info/global_step": 283, "train_info/time_within_train_step": 2.355245351791382, "step": 283} {"train_info/time_between_train_steps": 0.0031900405883789062, "step": 283} {"info/global_step": 284, "train_info/time_within_train_step": 2.363325834274292, "step": 284} {"train_info/time_between_train_steps": 0.0032362937927246094, "step": 284} {"info/global_step": 285, "train_info/time_within_train_step": 2.3550360202789307, "step": 285} {"train_info/time_between_train_steps": 0.0032057762145996094, "step": 285} {"info/global_step": 286, "train_info/time_within_train_step": 2.355361223220825, "step": 286} {"train_info/time_between_train_steps": 0.0031914710998535156, "step": 286} {"info/global_step": 287, "train_info/time_within_train_step": 2.354797601699829, "step": 287} {"train_info/time_between_train_steps": 0.003166675567626953, "step": 287} {"info/global_step": 288, "train_info/time_within_train_step": 2.354448080062866, "step": 288} {"train_info/time_between_train_steps": 0.003212451934814453, "step": 288} {"info/global_step": 289, "train_info/time_within_train_step": 2.3548011779785156, "step": 289} {"train_info/time_between_train_steps": 0.003196239471435547, "step": 289} {"info/global_step": 290, "train_info/time_within_train_step": 2.5789074897766113, "step": 290} {"train_info/time_between_train_steps": 0.0032112598419189453, "step": 290} {"info/global_step": 291, "train_info/time_within_train_step": 2.354262590408325, "step": 291} {"train_info/time_between_train_steps": 0.003139495849609375, "step": 291} {"info/global_step": 292, "train_info/time_within_train_step": 2.3543994426727295, "step": 292} {"train_info/time_between_train_steps": 0.003369569778442383, "step": 292} {"info/global_step": 293, "train_info/time_within_train_step": 2.3541319370269775, "step": 293} {"train_info/time_between_train_steps": 0.0031452178955078125, "step": 293} {"info/global_step": 294, "train_info/time_within_train_step": 2.3550665378570557, "step": 294} {"train_info/time_between_train_steps": 0.003149747848510742, "step": 294} {"info/global_step": 295, "train_info/time_within_train_step": 2.3547980785369873, "step": 295} {"train_info/time_between_train_steps": 0.003203153610229492, "step": 295} {"info/global_step": 296, "train_info/time_within_train_step": 2.355646848678589, "step": 296} {"train_info/time_between_train_steps": 0.003233671188354492, "step": 296} {"info/global_step": 297, "train_info/time_within_train_step": 2.355276346206665, "step": 297} {"train_info/time_between_train_steps": 0.0031752586364746094, "step": 297} {"info/global_step": 298, "train_info/time_within_train_step": 2.355506420135498, "step": 298} {"train_info/time_between_train_steps": 0.0032432079315185547, "step": 298} {"info/global_step": 299, "train_info/time_within_train_step": 2.3550474643707275, "step": 299} {"train_info/time_between_train_steps": 0.0032711029052734375, "step": 299} {"info/global_step": 300, "train_info/time_within_train_step": 2.356130361557007, "step": 300} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 4918.0, "train_info/memory_max_reserved": 4918.0, "_timestamp": 1746252984, "_runtime": 803}, "step": 300} {"logs": {"train/loss": 5.1235, "train/learning_rate": 0.0006, "train/epoch": 0.1, "_timestamp": 1746252984, "_runtime": 803}, "step": 300} {"train_info/time_between_train_steps": 24.448526620864868, "step": 300} {"info/global_step": 301, "train_info/time_within_train_step": 2.1973490715026855, "step": 301} {"train_info/time_between_train_steps": 0.003413677215576172, "step": 301} {"info/global_step": 302, "train_info/time_within_train_step": 2.179757833480835, "step": 302} {"train_info/time_between_train_steps": 0.0031960010528564453, "step": 302} {"info/global_step": 303, "train_info/time_within_train_step": 2.1820871829986572, "step": 303} {"train_info/time_between_train_steps": 0.0031452178955078125, "step": 303} {"info/global_step": 304, "train_info/time_within_train_step": 2.276278495788574, "step": 304} {"train_info/time_between_train_steps": 0.003172636032104492, "step": 304} {"info/global_step": 305, "train_info/time_within_train_step": 2.3511393070220947, "step": 305} {"train_info/time_between_train_steps": 0.003217935562133789, "step": 305} {"info/global_step": 306, "train_info/time_within_train_step": 2.355412006378174, "step": 306} {"train_info/time_between_train_steps": 0.0032274723052978516, "step": 306} {"info/global_step": 307, "train_info/time_within_train_step": 2.3557817935943604, "step": 307} {"train_info/time_between_train_steps": 0.0031430721282958984, "step": 307} {"info/global_step": 308, "train_info/time_within_train_step": 2.358030319213867, "step": 308} {"train_info/time_between_train_steps": 0.0032224655151367188, "step": 308} {"info/global_step": 309, "train_info/time_within_train_step": 2.357048273086548, "step": 309} {"train_info/time_between_train_steps": 0.0031948089599609375, "step": 309} {"info/global_step": 310, "train_info/time_within_train_step": 2.357475519180298, "step": 310} {"train_info/time_between_train_steps": 0.003685474395751953, "step": 310} {"info/global_step": 311, "train_info/time_within_train_step": 2.359550714492798, "step": 311} {"train_info/time_between_train_steps": 0.0036554336547851562, "step": 311} {"info/global_step": 312, "train_info/time_within_train_step": 2.3581197261810303, "step": 312} {"train_info/time_between_train_steps": 0.0035774707794189453, "step": 312} {"info/global_step": 313, "train_info/time_within_train_step": 2.870840311050415, "step": 313} {"train_info/time_between_train_steps": 0.003225564956665039, "step": 313} {"info/global_step": 314, "train_info/time_within_train_step": 2.3577349185943604, "step": 314} {"train_info/time_between_train_steps": 0.0031762123107910156, "step": 314} {"info/global_step": 315, "train_info/time_within_train_step": 2.358799934387207, "step": 315} {"train_info/time_between_train_steps": 0.003184080123901367, "step": 315} {"info/global_step": 316, "train_info/time_within_train_step": 2.3575711250305176, "step": 316} {"train_info/time_between_train_steps": 0.0032286643981933594, "step": 316} {"info/global_step": 317, "train_info/time_within_train_step": 2.35746431350708, "step": 317} {"train_info/time_between_train_steps": 0.0032072067260742188, "step": 317} {"info/global_step": 318, "train_info/time_within_train_step": 2.358017921447754, "step": 318} {"train_info/time_between_train_steps": 0.003168344497680664, "step": 318} {"info/global_step": 319, "train_info/time_within_train_step": 2.3891549110412598, "step": 319} {"train_info/time_between_train_steps": 0.0031630992889404297, "step": 319} {"info/global_step": 320, "train_info/time_within_train_step": 2.3582239151000977, "step": 320} {"train_info/time_between_train_steps": 0.0031838417053222656, "step": 320} {"info/global_step": 321, "train_info/time_within_train_step": 2.3572444915771484, "step": 321} {"train_info/time_between_train_steps": 0.0031690597534179688, "step": 321} {"info/global_step": 322, "train_info/time_within_train_step": 2.358443021774292, "step": 322} {"train_info/time_between_train_steps": 0.003278017044067383, "step": 322} {"info/global_step": 323, "train_info/time_within_train_step": 2.3581016063690186, "step": 323} {"train_info/time_between_train_steps": 0.0033111572265625, "step": 323} {"info/global_step": 324, "train_info/time_within_train_step": 2.3591854572296143, "step": 324} {"train_info/time_between_train_steps": 0.0033986568450927734, "step": 324} {"info/global_step": 325, "train_info/time_within_train_step": 2.3577282428741455, "step": 325} {"train_info/time_between_train_steps": 0.003355741500854492, "step": 325} {"info/global_step": 326, "train_info/time_within_train_step": 2.359015464782715, "step": 326} {"train_info/time_between_train_steps": 0.0041959285736083984, "step": 326} {"info/global_step": 327, "train_info/time_within_train_step": 2.3586363792419434, "step": 327} {"train_info/time_between_train_steps": 0.003537416458129883, "step": 327} {"info/global_step": 328, "train_info/time_within_train_step": 2.3633739948272705, "step": 328} {"train_info/time_between_train_steps": 0.003634214401245117, "step": 328} {"info/global_step": 329, "train_info/time_within_train_step": 2.3583319187164307, "step": 329} {"train_info/time_between_train_steps": 0.003597259521484375, "step": 329} {"info/global_step": 330, "train_info/time_within_train_step": 2.357429265975952, "step": 330} {"train_info/time_between_train_steps": 0.003566741943359375, "step": 330} {"info/global_step": 331, "train_info/time_within_train_step": 2.359112024307251, "step": 331} {"train_info/time_between_train_steps": 0.0036468505859375, "step": 331} {"info/global_step": 332, "train_info/time_within_train_step": 2.3582510948181152, "step": 332} {"train_info/time_between_train_steps": 0.0035533905029296875, "step": 332} {"info/global_step": 333, "train_info/time_within_train_step": 2.3578264713287354, "step": 333} {"train_info/time_between_train_steps": 0.003530740737915039, "step": 333} {"info/global_step": 334, "train_info/time_within_train_step": 2.3587677478790283, "step": 334} {"train_info/time_between_train_steps": 0.003531932830810547, "step": 334} {"info/global_step": 335, "train_info/time_within_train_step": 2.3590941429138184, "step": 335} {"train_info/time_between_train_steps": 0.0036025047302246094, "step": 335} {"info/global_step": 336, "train_info/time_within_train_step": 2.3580260276794434, "step": 336} {"train_info/time_between_train_steps": 0.0035648345947265625, "step": 336} {"info/global_step": 337, "train_info/time_within_train_step": 2.7080514430999756, "step": 337} {"train_info/time_between_train_steps": 0.0032579898834228516, "step": 337} {"info/global_step": 338, "train_info/time_within_train_step": 2.357243537902832, "step": 338} {"train_info/time_between_train_steps": 0.003205537796020508, "step": 338} {"info/global_step": 339, "train_info/time_within_train_step": 2.356769561767578, "step": 339} {"train_info/time_between_train_steps": 0.003175973892211914, "step": 339} {"info/global_step": 340, "train_info/time_within_train_step": 2.3573458194732666, "step": 340} {"train_info/time_between_train_steps": 0.0032906532287597656, "step": 340} {"info/global_step": 341, "train_info/time_within_train_step": 2.3567392826080322, "step": 341} {"train_info/time_between_train_steps": 0.003242015838623047, "step": 341} {"info/global_step": 342, "train_info/time_within_train_step": 2.3571979999542236, "step": 342} {"train_info/time_between_train_steps": 0.003287076950073242, "step": 342} {"info/global_step": 343, "train_info/time_within_train_step": 2.357064723968506, "step": 343} {"train_info/time_between_train_steps": 0.003211498260498047, "step": 343} {"info/global_step": 344, "train_info/time_within_train_step": 2.3572654724121094, "step": 344} {"train_info/time_between_train_steps": 0.0032167434692382812, "step": 344} {"info/global_step": 345, "train_info/time_within_train_step": 2.3567914962768555, "step": 345} {"train_info/time_between_train_steps": 0.0032126903533935547, "step": 345} {"info/global_step": 346, "train_info/time_within_train_step": 2.3576855659484863, "step": 346} {"train_info/time_between_train_steps": 0.0031991004943847656, "step": 346} {"info/global_step": 347, "train_info/time_within_train_step": 2.358532667160034, "step": 347} {"train_info/time_between_train_steps": 0.0032591819763183594, "step": 347} {"info/global_step": 348, "train_info/time_within_train_step": 2.3570926189422607, "step": 348} {"train_info/time_between_train_steps": 0.003293275833129883, "step": 348} {"info/global_step": 349, "train_info/time_within_train_step": 2.3565051555633545, "step": 349} {"train_info/time_between_train_steps": 0.003282785415649414, "step": 349} {"info/global_step": 350, "train_info/time_within_train_step": 2.356931209564209, "step": 350} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 4918.0, "train_info/memory_max_reserved": 4918.0, "_timestamp": 1746253127, "_runtime": 946}, "step": 350} {"logs": {"train/loss": 5.0655, "train/learning_rate": 0.0005888888888888889, "train/epoch": 0.12, "_timestamp": 1746253127, "_runtime": 946}, "step": 350} {"train_info/time_between_train_steps": 0.02470541000366211, "step": 350} {"info/global_step": 351, "train_info/time_within_train_step": 2.356396198272705, "step": 351} {"train_info/time_between_train_steps": 0.003214120864868164, "step": 351} {"info/global_step": 352, "train_info/time_within_train_step": 2.357269287109375, "step": 352} {"train_info/time_between_train_steps": 0.0035822391510009766, "step": 352} {"info/global_step": 353, "train_info/time_within_train_step": 2.358261823654175, "step": 353} {"train_info/time_between_train_steps": 0.006582736968994141, "step": 353} {"info/global_step": 354, "train_info/time_within_train_step": 2.357457399368286, "step": 354} {"train_info/time_between_train_steps": 0.0066869258880615234, "step": 354} {"info/global_step": 355, "train_info/time_within_train_step": 2.3570141792297363, "step": 355} {"train_info/time_between_train_steps": 0.006720542907714844, "step": 355} {"info/global_step": 356, "train_info/time_within_train_step": 2.3690361976623535, "step": 356} {"train_info/time_between_train_steps": 0.0065691471099853516, "step": 356} {"info/global_step": 357, "train_info/time_within_train_step": 2.3569116592407227, "step": 357} {"train_info/time_between_train_steps": 0.006713151931762695, "step": 357} {"info/global_step": 358, "train_info/time_within_train_step": 2.3573596477508545, "step": 358} {"train_info/time_between_train_steps": 0.0065577030181884766, "step": 358} {"info/global_step": 359, "train_info/time_within_train_step": 2.357640504837036, "step": 359} {"train_info/time_between_train_steps": 0.006684303283691406, "step": 359} {"info/global_step": 360, "train_info/time_within_train_step": 2.3803510665893555, "step": 360} {"train_info/time_between_train_steps": 0.006700038909912109, "step": 360} {"info/global_step": 361, "train_info/time_within_train_step": 2.5860230922698975, "step": 361} {"train_info/time_between_train_steps": 0.006677150726318359, "step": 361} {"info/global_step": 362, "train_info/time_within_train_step": 2.3573338985443115, "step": 362} {"train_info/time_between_train_steps": 0.006616353988647461, "step": 362} {"info/global_step": 363, "train_info/time_within_train_step": 2.3577520847320557, "step": 363} {"train_info/time_between_train_steps": 0.006636142730712891, "step": 363} {"info/global_step": 364, "train_info/time_within_train_step": 2.3570332527160645, "step": 364} {"train_info/time_between_train_steps": 0.006678104400634766, "step": 364} {"info/global_step": 365, "train_info/time_within_train_step": 2.3576340675354004, "step": 365} {"train_info/time_between_train_steps": 0.006676912307739258, "step": 365} {"info/global_step": 366, "train_info/time_within_train_step": 2.3570351600646973, "step": 366} {"train_info/time_between_train_steps": 0.006705284118652344, "step": 366} {"info/global_step": 367, "train_info/time_within_train_step": 2.3574111461639404, "step": 367} {"train_info/time_between_train_steps": 0.0032117366790771484, "step": 367} {"info/global_step": 368, "train_info/time_within_train_step": 2.357043743133545, "step": 368} {"train_info/time_between_train_steps": 0.00661158561706543, "step": 368} {"info/global_step": 369, "train_info/time_within_train_step": 2.3570778369903564, "step": 369} {"train_info/time_between_train_steps": 0.003173828125, "step": 369} {"info/global_step": 370, "train_info/time_within_train_step": 2.3563711643218994, "step": 370} {"train_info/time_between_train_steps": 0.0031843185424804688, "step": 370} {"info/global_step": 371, "train_info/time_within_train_step": 2.3573715686798096, "step": 371} {"train_info/time_between_train_steps": 0.003287076950073242, "step": 371} {"info/global_step": 372, "train_info/time_within_train_step": 2.357391357421875, "step": 372} {"train_info/time_between_train_steps": 0.003202199935913086, "step": 372} {"info/global_step": 373, "train_info/time_within_train_step": 2.3572728633880615, "step": 373} {"train_info/time_between_train_steps": 0.003201723098754883, "step": 373} {"info/global_step": 374, "train_info/time_within_train_step": 2.3578250408172607, "step": 374} {"train_info/time_between_train_steps": 0.0031850337982177734, "step": 374} {"info/global_step": 375, "train_info/time_within_train_step": 2.3571183681488037, "step": 375} {"train_info/time_between_train_steps": 0.13300633430480957, "step": 375} {"info/global_step": 376, "train_info/time_within_train_step": 2.3570170402526855, "step": 376} {"train_info/time_between_train_steps": 0.006621837615966797, "step": 376} {"info/global_step": 377, "train_info/time_within_train_step": 2.3571619987487793, "step": 377} {"train_info/time_between_train_steps": 0.006598711013793945, "step": 377} {"info/global_step": 378, "train_info/time_within_train_step": 2.357114315032959, "step": 378} {"train_info/time_between_train_steps": 0.006600618362426758, "step": 378} {"info/global_step": 379, "train_info/time_within_train_step": 2.3577394485473633, "step": 379} {"train_info/time_between_train_steps": 0.00662541389465332, "step": 379} {"info/global_step": 380, "train_info/time_within_train_step": 2.357121706008911, "step": 380} {"train_info/time_between_train_steps": 0.0066280364990234375, "step": 380} {"info/global_step": 381, "train_info/time_within_train_step": 2.367525339126587, "step": 381} {"train_info/time_between_train_steps": 0.006563425064086914, "step": 381} {"info/global_step": 382, "train_info/time_within_train_step": 2.3569583892822266, "step": 382} {"train_info/time_between_train_steps": 0.006670951843261719, "step": 382} {"info/global_step": 383, "train_info/time_within_train_step": 2.3570969104766846, "step": 383} {"train_info/time_between_train_steps": 0.0031731128692626953, "step": 383} {"info/global_step": 384, "train_info/time_within_train_step": 2.356799602508545, "step": 384} {"train_info/time_between_train_steps": 0.0032529830932617188, "step": 384} {"info/global_step": 385, "train_info/time_within_train_step": 2.6052799224853516, "step": 385} {"train_info/time_between_train_steps": 0.003200054168701172, "step": 385} {"info/global_step": 386, "train_info/time_within_train_step": 2.356679916381836, "step": 386} {"train_info/time_between_train_steps": 0.003166675567626953, "step": 386} {"info/global_step": 387, "train_info/time_within_train_step": 2.357215642929077, "step": 387} {"train_info/time_between_train_steps": 0.003172636032104492, "step": 387} {"info/global_step": 388, "train_info/time_within_train_step": 2.3565189838409424, "step": 388} {"train_info/time_between_train_steps": 0.006568193435668945, "step": 388} {"info/global_step": 389, "train_info/time_within_train_step": 2.3570449352264404, "step": 389} {"train_info/time_between_train_steps": 0.006601572036743164, "step": 389} {"info/global_step": 390, "train_info/time_within_train_step": 2.357130527496338, "step": 390} {"train_info/time_between_train_steps": 0.006655216217041016, "step": 390} {"info/global_step": 391, "train_info/time_within_train_step": 2.357020854949951, "step": 391} {"train_info/time_between_train_steps": 0.00664210319519043, "step": 391} {"info/global_step": 392, "train_info/time_within_train_step": 2.3577215671539307, "step": 392} {"train_info/time_between_train_steps": 0.006585121154785156, "step": 392} {"info/global_step": 393, "train_info/time_within_train_step": 2.357785940170288, "step": 393} {"train_info/time_between_train_steps": 0.00316619873046875, "step": 393} {"info/global_step": 394, "train_info/time_within_train_step": 2.356865882873535, "step": 394} {"train_info/time_between_train_steps": 0.0031812191009521484, "step": 394} {"info/global_step": 395, "train_info/time_within_train_step": 2.3567588329315186, "step": 395} {"train_info/time_between_train_steps": 0.003215789794921875, "step": 395} {"info/global_step": 396, "train_info/time_within_train_step": 2.3569440841674805, "step": 396} {"train_info/time_between_train_steps": 0.003200531005859375, "step": 396} {"info/global_step": 397, "train_info/time_within_train_step": 2.357020616531372, "step": 397} {"train_info/time_between_train_steps": 0.003232717514038086, "step": 397} {"info/global_step": 398, "train_info/time_within_train_step": 2.357124090194702, "step": 398} {"train_info/time_between_train_steps": 0.0031588077545166016, "step": 398} {"info/global_step": 399, "train_info/time_within_train_step": 2.3566129207611084, "step": 399} {"train_info/time_between_train_steps": 0.003180980682373047, "step": 399} {"info/global_step": 400, "train_info/time_within_train_step": 2.3571977615356445, "step": 400} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 4918.0, "train_info/memory_max_reserved": 4918.0, "_timestamp": 1746253247, "_runtime": 1066}, "step": 400} {"logs": {"train/loss": 4.9774, "train/learning_rate": 0.0005777777777777776, "train/epoch": 0.13, "_timestamp": 1746253247, "_runtime": 1066}, "step": 400} {"train_info/time_between_train_steps": 21.93536901473999, "step": 400} {"info/global_step": 401, "train_info/time_within_train_step": 2.197704792022705, "step": 401} {"train_info/time_between_train_steps": 0.0031976699829101562, "step": 401} {"info/global_step": 402, "train_info/time_within_train_step": 2.182316541671753, "step": 402} {"train_info/time_between_train_steps": 0.003202676773071289, "step": 402} {"info/global_step": 403, "train_info/time_within_train_step": 2.1868581771850586, "step": 403} {"train_info/time_between_train_steps": 0.0032219886779785156, "step": 403} {"info/global_step": 404, "train_info/time_within_train_step": 2.318981409072876, "step": 404} {"train_info/time_between_train_steps": 0.003222942352294922, "step": 404} {"info/global_step": 405, "train_info/time_within_train_step": 2.3511765003204346, "step": 405} {"train_info/time_between_train_steps": 0.0031921863555908203, "step": 405} {"info/global_step": 406, "train_info/time_within_train_step": 2.3540642261505127, "step": 406} {"train_info/time_between_train_steps": 0.0032002925872802734, "step": 406} {"info/global_step": 407, "train_info/time_within_train_step": 2.356847047805786, "step": 407} {"train_info/time_between_train_steps": 0.0032804012298583984, "step": 407} {"info/global_step": 408, "train_info/time_within_train_step": 2.5605545043945312, "step": 408} {"train_info/time_between_train_steps": 0.0031888484954833984, "step": 408} {"info/global_step": 409, "train_info/time_within_train_step": 2.356926202774048, "step": 409} {"train_info/time_between_train_steps": 0.0032148361206054688, "step": 409} {"info/global_step": 410, "train_info/time_within_train_step": 2.3568074703216553, "step": 410} {"train_info/time_between_train_steps": 0.0031540393829345703, "step": 410} {"info/global_step": 411, "train_info/time_within_train_step": 2.357936382293701, "step": 411} {"train_info/time_between_train_steps": 0.0032122135162353516, "step": 411} {"info/global_step": 412, "train_info/time_within_train_step": 2.3577263355255127, "step": 412} {"train_info/time_between_train_steps": 0.0032193660736083984, "step": 412} {"info/global_step": 413, "train_info/time_within_train_step": 2.3585615158081055, "step": 413} {"train_info/time_between_train_steps": 0.003300189971923828, "step": 413} {"info/global_step": 414, "train_info/time_within_train_step": 2.357966661453247, "step": 414} {"train_info/time_between_train_steps": 0.00316619873046875, "step": 414} {"info/global_step": 415, "train_info/time_within_train_step": 2.357738733291626, "step": 415} {"train_info/time_between_train_steps": 0.0031647682189941406, "step": 415} {"info/global_step": 416, "train_info/time_within_train_step": 2.358107089996338, "step": 416} {"train_info/time_between_train_steps": 0.0031652450561523438, "step": 416} {"info/global_step": 417, "train_info/time_within_train_step": 2.3573806285858154, "step": 417} {"train_info/time_between_train_steps": 0.003229379653930664, "step": 417} {"info/global_step": 418, "train_info/time_within_train_step": 2.358295440673828, "step": 418} {"train_info/time_between_train_steps": 0.0032622814178466797, "step": 418} {"info/global_step": 419, "train_info/time_within_train_step": 2.356826066970825, "step": 419} {"train_info/time_between_train_steps": 0.003240346908569336, "step": 419} {"info/global_step": 420, "train_info/time_within_train_step": 2.356890916824341, "step": 420} {"train_info/time_between_train_steps": 0.0031976699829101562, "step": 420} {"info/global_step": 421, "train_info/time_within_train_step": 2.3570735454559326, "step": 421} {"train_info/time_between_train_steps": 0.0031671524047851562, "step": 421} {"info/global_step": 422, "train_info/time_within_train_step": 2.356862783432007, "step": 422} {"train_info/time_between_train_steps": 0.003181934356689453, "step": 422} {"info/global_step": 423, "train_info/time_within_train_step": 2.3566083908081055, "step": 423} {"train_info/time_between_train_steps": 0.0031638145446777344, "step": 423} {"info/global_step": 424, "train_info/time_within_train_step": 2.3558976650238037, "step": 424} {"train_info/time_between_train_steps": 0.0031757354736328125, "step": 424} {"info/global_step": 425, "train_info/time_within_train_step": 2.3579022884368896, "step": 425} {"train_info/time_between_train_steps": 0.0032744407653808594, "step": 425} {"info/global_step": 426, "train_info/time_within_train_step": 2.356956958770752, "step": 426} {"train_info/time_between_train_steps": 0.0032875537872314453, "step": 426} {"info/global_step": 427, "train_info/time_within_train_step": 2.3573720455169678, "step": 427} {"train_info/time_between_train_steps": 0.003187894821166992, "step": 427} {"info/global_step": 428, "train_info/time_within_train_step": 2.3567798137664795, "step": 428} {"train_info/time_between_train_steps": 0.003220796585083008, "step": 428} {"info/global_step": 429, "train_info/time_within_train_step": 2.356782913208008, "step": 429} {"train_info/time_between_train_steps": 0.0031795501708984375, "step": 429} {"info/global_step": 430, "train_info/time_within_train_step": 2.3572046756744385, "step": 430} {"train_info/time_between_train_steps": 0.003220081329345703, "step": 430} {"info/global_step": 431, "train_info/time_within_train_step": 2.3572657108306885, "step": 431} {"train_info/time_between_train_steps": 0.0032491683959960938, "step": 431} {"info/global_step": 432, "train_info/time_within_train_step": 2.5686004161834717, "step": 432} {"train_info/time_between_train_steps": 0.0031821727752685547, "step": 432} {"info/global_step": 433, "train_info/time_within_train_step": 2.3575806617736816, "step": 433} {"train_info/time_between_train_steps": 0.0031561851501464844, "step": 433} {"info/global_step": 434, "train_info/time_within_train_step": 2.3578710556030273, "step": 434} {"train_info/time_between_train_steps": 0.0031630992889404297, "step": 434} {"info/global_step": 435, "train_info/time_within_train_step": 2.3573131561279297, "step": 435} {"train_info/time_between_train_steps": 0.0031766891479492188, "step": 435} {"info/global_step": 436, "train_info/time_within_train_step": 2.3900392055511475, "step": 436} {"train_info/time_between_train_steps": 0.003184080123901367, "step": 436} {"info/global_step": 437, "train_info/time_within_train_step": 2.35603404045105, "step": 437} {"train_info/time_between_train_steps": 0.0032248497009277344, "step": 437} {"info/global_step": 438, "train_info/time_within_train_step": 2.4789211750030518, "step": 438} {"train_info/time_between_train_steps": 0.0031905174255371094, "step": 438} {"info/global_step": 439, "train_info/time_within_train_step": 2.35679292678833, "step": 439} {"train_info/time_between_train_steps": 0.0031528472900390625, "step": 439} {"info/global_step": 440, "train_info/time_within_train_step": 2.3568742275238037, "step": 440} {"train_info/time_between_train_steps": 0.0031821727752685547, "step": 440} {"info/global_step": 441, "train_info/time_within_train_step": 2.357295513153076, "step": 441} {"train_info/time_between_train_steps": 0.0032262802124023438, "step": 441} {"info/global_step": 442, "train_info/time_within_train_step": 2.3565006256103516, "step": 442} {"train_info/time_between_train_steps": 0.0031774044036865234, "step": 442} {"info/global_step": 443, "train_info/time_within_train_step": 2.3564329147338867, "step": 443} {"train_info/time_between_train_steps": 0.0033228397369384766, "step": 443} {"info/global_step": 444, "train_info/time_within_train_step": 2.3575339317321777, "step": 444} {"train_info/time_between_train_steps": 0.0032198429107666016, "step": 444} {"info/global_step": 445, "train_info/time_within_train_step": 2.3807175159454346, "step": 445} {"train_info/time_between_train_steps": 0.0031898021697998047, "step": 445} {"info/global_step": 446, "train_info/time_within_train_step": 2.356621265411377, "step": 446} {"train_info/time_between_train_steps": 0.0032198429107666016, "step": 446} {"info/global_step": 447, "train_info/time_within_train_step": 2.3562076091766357, "step": 447} {"train_info/time_between_train_steps": 0.003194570541381836, "step": 447} {"info/global_step": 448, "train_info/time_within_train_step": 2.357675790786743, "step": 448} {"train_info/time_between_train_steps": 0.003169536590576172, "step": 448} {"info/global_step": 449, "train_info/time_within_train_step": 2.356933116912842, "step": 449} {"train_info/time_between_train_steps": 0.0032720565795898438, "step": 449} {"info/global_step": 450, "train_info/time_within_train_step": 2.3572964668273926, "step": 450} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 4918.0, "train_info/memory_max_reserved": 4918.0, "_timestamp": 1746253388, "_runtime": 1207}, "step": 450} {"logs": {"train/loss": 4.9059, "train/learning_rate": 0.0005666666666666666, "train/epoch": 0.15, "_timestamp": 1746253388, "_runtime": 1207}, "step": 450} {"train_info/time_between_train_steps": 0.02466750144958496, "step": 450} {"info/global_step": 451, "train_info/time_within_train_step": 2.357658863067627, "step": 451} {"train_info/time_between_train_steps": 0.0031747817993164062, "step": 451} {"info/global_step": 452, "train_info/time_within_train_step": 2.3571784496307373, "step": 452} {"train_info/time_between_train_steps": 0.003186464309692383, "step": 452} {"info/global_step": 453, "train_info/time_within_train_step": 2.3570396900177, "step": 453} {"train_info/time_between_train_steps": 0.0031807422637939453, "step": 453} {"info/global_step": 454, "train_info/time_within_train_step": 2.356884002685547, "step": 454} {"train_info/time_between_train_steps": 0.003168344497680664, "step": 454} {"info/global_step": 455, "train_info/time_within_train_step": 2.3580005168914795, "step": 455} {"train_info/time_between_train_steps": 0.0031909942626953125, "step": 455} {"info/global_step": 456, "train_info/time_within_train_step": 2.5645318031311035, "step": 456} {"train_info/time_between_train_steps": 0.0032215118408203125, "step": 456} {"info/global_step": 457, "train_info/time_within_train_step": 2.356419324874878, "step": 457} {"train_info/time_between_train_steps": 0.0031633377075195312, "step": 457} {"info/global_step": 458, "train_info/time_within_train_step": 2.356980800628662, "step": 458} {"train_info/time_between_train_steps": 0.00316619873046875, "step": 458} {"info/global_step": 459, "train_info/time_within_train_step": 2.3559486865997314, "step": 459} {"train_info/time_between_train_steps": 0.0031538009643554688, "step": 459} {"info/global_step": 460, "train_info/time_within_train_step": 2.357095956802368, "step": 460} {"train_info/time_between_train_steps": 0.003221750259399414, "step": 460} {"info/global_step": 461, "train_info/time_within_train_step": 2.3566339015960693, "step": 461} {"train_info/time_between_train_steps": 0.0032150745391845703, "step": 461} {"info/global_step": 462, "train_info/time_within_train_step": 2.3564183712005615, "step": 462} {"train_info/time_between_train_steps": 0.003203153610229492, "step": 462} {"info/global_step": 463, "train_info/time_within_train_step": 2.35613751411438, "step": 463} {"train_info/time_between_train_steps": 0.0031752586364746094, "step": 463} {"info/global_step": 464, "train_info/time_within_train_step": 2.3558053970336914, "step": 464} {"train_info/time_between_train_steps": 0.0031671524047851562, "step": 464} {"info/global_step": 465, "train_info/time_within_train_step": 2.3572864532470703, "step": 465} {"train_info/time_between_train_steps": 0.0031991004943847656, "step": 465} {"info/global_step": 466, "train_info/time_within_train_step": 2.356215715408325, "step": 466} {"train_info/time_between_train_steps": 0.0031752586364746094, "step": 466} {"info/global_step": 467, "train_info/time_within_train_step": 2.356961965560913, "step": 467} {"train_info/time_between_train_steps": 0.0031604766845703125, "step": 467} {"info/global_step": 468, "train_info/time_within_train_step": 2.356412649154663, "step": 468} {"train_info/time_between_train_steps": 0.00319671630859375, "step": 468} {"info/global_step": 469, "train_info/time_within_train_step": 2.3565056324005127, "step": 469} {"train_info/time_between_train_steps": 0.003250598907470703, "step": 469} {"info/global_step": 470, "train_info/time_within_train_step": 2.357489824295044, "step": 470} {"train_info/time_between_train_steps": 0.0031731128692626953, "step": 470} {"info/global_step": 471, "train_info/time_within_train_step": 2.3565971851348877, "step": 471} {"train_info/time_between_train_steps": 0.0032012462615966797, "step": 471} {"info/global_step": 472, "train_info/time_within_train_step": 2.357210397720337, "step": 472} {"train_info/time_between_train_steps": 0.003162860870361328, "step": 472} {"info/global_step": 473, "train_info/time_within_train_step": 2.35599946975708, "step": 473} {"train_info/time_between_train_steps": 0.0031969547271728516, "step": 473} {"info/global_step": 474, "train_info/time_within_train_step": 2.3561184406280518, "step": 474} {"train_info/time_between_train_steps": 0.0032117366790771484, "step": 474} {"info/global_step": 475, "train_info/time_within_train_step": 2.35654878616333, "step": 475} {"train_info/time_between_train_steps": 0.003198385238647461, "step": 475} {"info/global_step": 476, "train_info/time_within_train_step": 2.356110095977783, "step": 476} {"train_info/time_between_train_steps": 0.00315093994140625, "step": 476} {"info/global_step": 477, "train_info/time_within_train_step": 2.380182981491089, "step": 477} {"train_info/time_between_train_steps": 0.003210306167602539, "step": 477} {"info/global_step": 478, "train_info/time_within_train_step": 2.356463670730591, "step": 478} {"train_info/time_between_train_steps": 0.003168344497680664, "step": 478} {"info/global_step": 479, "train_info/time_within_train_step": 2.355207920074463, "step": 479} {"train_info/time_between_train_steps": 0.0031499862670898438, "step": 479} {"info/global_step": 480, "train_info/time_within_train_step": 2.5582141876220703, "step": 480} {"train_info/time_between_train_steps": 0.0031795501708984375, "step": 480} {"info/global_step": 481, "train_info/time_within_train_step": 2.3561394214630127, "step": 481} {"train_info/time_between_train_steps": 0.0032210350036621094, "step": 481} {"info/global_step": 482, "train_info/time_within_train_step": 2.3561854362487793, "step": 482} {"train_info/time_between_train_steps": 0.003175497055053711, "step": 482} {"info/global_step": 483, "train_info/time_within_train_step": 2.3554317951202393, "step": 483} {"train_info/time_between_train_steps": 0.0031583309173583984, "step": 483} {"info/global_step": 484, "train_info/time_within_train_step": 2.3561856746673584, "step": 484} {"train_info/time_between_train_steps": 0.003172636032104492, "step": 484} {"info/global_step": 485, "train_info/time_within_train_step": 2.356071710586548, "step": 485} {"train_info/time_between_train_steps": 0.0031800270080566406, "step": 485} {"info/global_step": 486, "train_info/time_within_train_step": 2.355473279953003, "step": 486} {"train_info/time_between_train_steps": 0.003219127655029297, "step": 486} {"info/global_step": 487, "train_info/time_within_train_step": 2.3569979667663574, "step": 487} {"train_info/time_between_train_steps": 0.0031969547271728516, "step": 487} {"info/global_step": 488, "train_info/time_within_train_step": 2.355344295501709, "step": 488} {"train_info/time_between_train_steps": 0.003232717514038086, "step": 488} {"info/global_step": 489, "train_info/time_within_train_step": 2.355853319168091, "step": 489} {"train_info/time_between_train_steps": 0.003214597702026367, "step": 489} {"info/global_step": 490, "train_info/time_within_train_step": 2.3559579849243164, "step": 490} {"train_info/time_between_train_steps": 0.003170013427734375, "step": 490} {"info/global_step": 491, "train_info/time_within_train_step": 2.355513334274292, "step": 491} {"train_info/time_between_train_steps": 0.0031332969665527344, "step": 491} {"info/global_step": 492, "train_info/time_within_train_step": 2.3557238578796387, "step": 492} {"train_info/time_between_train_steps": 0.0032176971435546875, "step": 492} {"info/global_step": 493, "train_info/time_within_train_step": 2.356391668319702, "step": 493} {"train_info/time_between_train_steps": 0.0031821727752685547, "step": 493} {"info/global_step": 494, "train_info/time_within_train_step": 2.355652093887329, "step": 494} {"train_info/time_between_train_steps": 0.0031709671020507812, "step": 494} {"info/global_step": 495, "train_info/time_within_train_step": 2.3562188148498535, "step": 495} {"train_info/time_between_train_steps": 0.0031697750091552734, "step": 495} {"info/global_step": 496, "train_info/time_within_train_step": 2.356562376022339, "step": 496} {"train_info/time_between_train_steps": 0.0032930374145507812, "step": 496} {"info/global_step": 497, "train_info/time_within_train_step": 2.3562099933624268, "step": 497} {"train_info/time_between_train_steps": 0.0031709671020507812, "step": 497} {"info/global_step": 498, "train_info/time_within_train_step": 2.35617995262146, "step": 498} {"train_info/time_between_train_steps": 0.003141164779663086, "step": 498} {"info/global_step": 499, "train_info/time_within_train_step": 2.3565804958343506, "step": 499} {"train_info/time_between_train_steps": 0.0031883716583251953, "step": 499} {"info/global_step": 500, "train_info/time_within_train_step": 2.8562231063842773, "step": 500} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 4918.0, "train_info/memory_max_reserved": 4918.0, "_timestamp": 1746253508, "_runtime": 1327}, "step": 500} {"logs": {"train/loss": 4.822, "train/learning_rate": 0.0005555555555555556, "train/epoch": 0.17, "_timestamp": 1746253508, "_runtime": 1327}, "step": 500} {"train_info/time_between_train_steps": 13.89379620552063, "step": 500} {"info/global_step": 501, "train_info/time_within_train_step": 2.204705238342285, "step": 501} {"train_info/time_between_train_steps": 0.003265857696533203, "step": 501} {"info/global_step": 502, "train_info/time_within_train_step": 2.1842093467712402, "step": 502} {"train_info/time_between_train_steps": 0.0032591819763183594, "step": 502} {"info/global_step": 503, "train_info/time_within_train_step": 2.2605388164520264, "step": 503} {"train_info/time_between_train_steps": 0.003211498260498047, "step": 503} {"info/global_step": 504, "train_info/time_within_train_step": 2.579590082168579, "step": 504} {"train_info/time_between_train_steps": 0.003193378448486328, "step": 504} {"info/global_step": 505, "train_info/time_within_train_step": 2.352078914642334, "step": 505} {"train_info/time_between_train_steps": 0.003204345703125, "step": 505} {"info/global_step": 506, "train_info/time_within_train_step": 2.355168342590332, "step": 506} {"train_info/time_between_train_steps": 0.003241300582885742, "step": 506} {"info/global_step": 507, "train_info/time_within_train_step": 2.3542518615722656, "step": 507} {"train_info/time_between_train_steps": 0.003240346908569336, "step": 507} {"info/global_step": 508, "train_info/time_within_train_step": 2.3543128967285156, "step": 508} {"train_info/time_between_train_steps": 0.0031821727752685547, "step": 508} {"info/global_step": 509, "train_info/time_within_train_step": 2.3548521995544434, "step": 509} {"train_info/time_between_train_steps": 0.003463268280029297, "step": 509} {"info/global_step": 510, "train_info/time_within_train_step": 2.354132652282715, "step": 510} {"train_info/time_between_train_steps": 0.0031986236572265625, "step": 510} {"info/global_step": 511, "train_info/time_within_train_step": 2.357142925262451, "step": 511} {"train_info/time_between_train_steps": 0.003180265426635742, "step": 511} {"info/global_step": 512, "train_info/time_within_train_step": 2.3561244010925293, "step": 512} {"train_info/time_between_train_steps": 0.0032308101654052734, "step": 512} {"info/global_step": 513, "train_info/time_within_train_step": 2.355912446975708, "step": 513} {"train_info/time_between_train_steps": 0.0032236576080322266, "step": 513} {"info/global_step": 514, "train_info/time_within_train_step": 2.3566770553588867, "step": 514} {"train_info/time_between_train_steps": 0.003253936767578125, "step": 514} {"info/global_step": 515, "train_info/time_within_train_step": 2.35577654838562, "step": 515} {"train_info/time_between_train_steps": 0.003206491470336914, "step": 515} {"info/global_step": 516, "train_info/time_within_train_step": 2.355788230895996, "step": 516} {"train_info/time_between_train_steps": 0.003194570541381836, "step": 516} {"info/global_step": 517, "train_info/time_within_train_step": 2.355748176574707, "step": 517} {"train_info/time_between_train_steps": 0.003146648406982422, "step": 517} {"info/global_step": 518, "train_info/time_within_train_step": 2.3560431003570557, "step": 518} {"train_info/time_between_train_steps": 0.003204822540283203, "step": 518} {"info/global_step": 519, "train_info/time_within_train_step": 2.3554742336273193, "step": 519} {"train_info/time_between_train_steps": 0.0031890869140625, "step": 519} {"info/global_step": 520, "train_info/time_within_train_step": 2.3572237491607666, "step": 520} {"train_info/time_between_train_steps": 0.0031728744506835938, "step": 520} {"info/global_step": 521, "train_info/time_within_train_step": 2.356741189956665, "step": 521} {"train_info/time_between_train_steps": 0.003176450729370117, "step": 521} {"info/global_step": 522, "train_info/time_within_train_step": 2.3556432723999023, "step": 522} {"train_info/time_between_train_steps": 0.003176450729370117, "step": 522} {"info/global_step": 523, "train_info/time_within_train_step": 2.356794834136963, "step": 523} {"train_info/time_between_train_steps": 0.003167390823364258, "step": 523} {"info/global_step": 524, "train_info/time_within_train_step": 2.357314109802246, "step": 524} {"train_info/time_between_train_steps": 0.003152608871459961, "step": 524} {"info/global_step": 525, "train_info/time_within_train_step": 2.355621099472046, "step": 525} {"train_info/time_between_train_steps": 0.0031719207763671875, "step": 525} {"info/global_step": 526, "train_info/time_within_train_step": 2.3569700717926025, "step": 526} {"train_info/time_between_train_steps": 0.0032269954681396484, "step": 526} {"info/global_step": 527, "train_info/time_within_train_step": 2.562899589538574, "step": 527} {"train_info/time_between_train_steps": 0.00316619873046875, "step": 527} {"info/global_step": 528, "train_info/time_within_train_step": 2.355699062347412, "step": 528} {"train_info/time_between_train_steps": 0.003161191940307617, "step": 528} {"info/global_step": 529, "train_info/time_within_train_step": 2.3557121753692627, "step": 529} {"train_info/time_between_train_steps": 0.003167867660522461, "step": 529} {"info/global_step": 530, "train_info/time_within_train_step": 2.355804443359375, "step": 530} {"train_info/time_between_train_steps": 0.0031473636627197266, "step": 530} {"info/global_step": 531, "train_info/time_within_train_step": 2.3830363750457764, "step": 531} {"train_info/time_between_train_steps": 0.0031909942626953125, "step": 531} {"info/global_step": 532, "train_info/time_within_train_step": 2.356320858001709, "step": 532} {"train_info/time_between_train_steps": 0.0031871795654296875, "step": 532} {"info/global_step": 533, "train_info/time_within_train_step": 2.3557727336883545, "step": 533} {"train_info/time_between_train_steps": 0.003147602081298828, "step": 533} {"info/global_step": 534, "train_info/time_within_train_step": 2.355987310409546, "step": 534} {"train_info/time_between_train_steps": 0.0031745433807373047, "step": 534} {"info/global_step": 535, "train_info/time_within_train_step": 2.3558778762817383, "step": 535} {"train_info/time_between_train_steps": 0.0032029151916503906, "step": 535} {"info/global_step": 536, "train_info/time_within_train_step": 2.356564998626709, "step": 536} {"train_info/time_between_train_steps": 0.003147125244140625, "step": 536} {"info/global_step": 537, "train_info/time_within_train_step": 2.356592893600464, "step": 537} {"train_info/time_between_train_steps": 0.003172159194946289, "step": 537} {"info/global_step": 538, "train_info/time_within_train_step": 2.3555593490600586, "step": 538} {"train_info/time_between_train_steps": 0.003229379653930664, "step": 538} {"info/global_step": 539, "train_info/time_within_train_step": 2.3563125133514404, "step": 539} {"train_info/time_between_train_steps": 0.0032155513763427734, "step": 539} {"info/global_step": 540, "train_info/time_within_train_step": 2.379523515701294, "step": 540} {"train_info/time_between_train_steps": 0.0032215118408203125, "step": 540} {"info/global_step": 541, "train_info/time_within_train_step": 2.3557863235473633, "step": 541} {"train_info/time_between_train_steps": 0.0031692981719970703, "step": 541} {"info/global_step": 542, "train_info/time_within_train_step": 2.3561460971832275, "step": 542} {"train_info/time_between_train_steps": 0.0032148361206054688, "step": 542} {"info/global_step": 543, "train_info/time_within_train_step": 2.3569512367248535, "step": 543} {"train_info/time_between_train_steps": 0.0031805038452148438, "step": 543} {"info/global_step": 544, "train_info/time_within_train_step": 2.356872797012329, "step": 544} {"train_info/time_between_train_steps": 0.0032508373260498047, "step": 544} {"info/global_step": 545, "train_info/time_within_train_step": 2.3563878536224365, "step": 545} {"train_info/time_between_train_steps": 0.0032422542572021484, "step": 545} {"info/global_step": 546, "train_info/time_within_train_step": 2.3562209606170654, "step": 546} {"train_info/time_between_train_steps": 0.003229379653930664, "step": 546} {"info/global_step": 547, "train_info/time_within_train_step": 2.3560917377471924, "step": 547} {"train_info/time_between_train_steps": 0.003177642822265625, "step": 547} {"info/global_step": 548, "train_info/time_within_train_step": 2.373525381088257, "step": 548} {"train_info/time_between_train_steps": 0.002936840057373047, "step": 548} {"info/global_step": 549, "train_info/time_within_train_step": 2.356074094772339, "step": 549} {"train_info/time_between_train_steps": 0.002942323684692383, "step": 549} {"info/global_step": 550, "train_info/time_within_train_step": 2.3542771339416504, "step": 550} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 4918.0, "train_info/memory_max_reserved": 4918.0, "_timestamp": 1746253641, "_runtime": 1460}, "step": 550} {"logs": {"train/loss": 4.7381, "train/learning_rate": 0.0005444444444444444, "train/epoch": 0.18, "_timestamp": 1746253641, "_runtime": 1460}, "step": 550} {"train_info/time_between_train_steps": 0.0249483585357666, "step": 550} {"info/global_step": 551, "train_info/time_within_train_step": 2.354661703109741, "step": 551} {"train_info/time_between_train_steps": 0.0029315948486328125, "step": 551} {"info/global_step": 552, "train_info/time_within_train_step": 2.563169240951538, "step": 552} {"train_info/time_between_train_steps": 0.00287628173828125, "step": 552} {"info/global_step": 553, "train_info/time_within_train_step": 2.3545591831207275, "step": 553} {"train_info/time_between_train_steps": 0.0028634071350097656, "step": 553} {"info/global_step": 554, "train_info/time_within_train_step": 2.3549883365631104, "step": 554} {"train_info/time_between_train_steps": 0.002873659133911133, "step": 554} {"info/global_step": 555, "train_info/time_within_train_step": 2.3546347618103027, "step": 555} {"train_info/time_between_train_steps": 0.002863645553588867, "step": 555} {"info/global_step": 556, "train_info/time_within_train_step": 2.3546643257141113, "step": 556} {"train_info/time_between_train_steps": 0.002901792526245117, "step": 556} {"info/global_step": 557, "train_info/time_within_train_step": 2.354525089263916, "step": 557} {"train_info/time_between_train_steps": 0.0028929710388183594, "step": 557} {"info/global_step": 558, "train_info/time_within_train_step": 2.354557514190674, "step": 558} {"train_info/time_between_train_steps": 0.002879619598388672, "step": 558} {"info/global_step": 559, "train_info/time_within_train_step": 2.3544435501098633, "step": 559} {"train_info/time_between_train_steps": 0.002872467041015625, "step": 559} {"info/global_step": 560, "train_info/time_within_train_step": 2.3541767597198486, "step": 560} {"train_info/time_between_train_steps": 0.0028607845306396484, "step": 560} {"info/global_step": 561, "train_info/time_within_train_step": 2.3545424938201904, "step": 561} {"train_info/time_between_train_steps": 0.0029447078704833984, "step": 561} {"info/global_step": 562, "train_info/time_within_train_step": 2.3556673526763916, "step": 562} {"train_info/time_between_train_steps": 0.0029289722442626953, "step": 562} {"info/global_step": 563, "train_info/time_within_train_step": 2.3546571731567383, "step": 563} {"train_info/time_between_train_steps": 0.002978086471557617, "step": 563} {"info/global_step": 564, "train_info/time_within_train_step": 2.3545360565185547, "step": 564} {"train_info/time_between_train_steps": 0.002943277359008789, "step": 564} {"info/global_step": 565, "train_info/time_within_train_step": 2.3551623821258545, "step": 565} {"train_info/time_between_train_steps": 0.002902507781982422, "step": 565} {"info/global_step": 566, "train_info/time_within_train_step": 2.353788137435913, "step": 566} {"train_info/time_between_train_steps": 0.002904653549194336, "step": 566} {"info/global_step": 567, "train_info/time_within_train_step": 2.3547775745391846, "step": 567} {"train_info/time_between_train_steps": 0.0028944015502929688, "step": 567} {"info/global_step": 568, "train_info/time_within_train_step": 2.3547160625457764, "step": 568} {"train_info/time_between_train_steps": 0.0028853416442871094, "step": 568} {"info/global_step": 569, "train_info/time_within_train_step": 2.3537399768829346, "step": 569} {"train_info/time_between_train_steps": 0.0029146671295166016, "step": 569} {"info/global_step": 570, "train_info/time_within_train_step": 2.3535680770874023, "step": 570} {"train_info/time_between_train_steps": 0.002919435501098633, "step": 570} {"info/global_step": 571, "train_info/time_within_train_step": 2.354168653488159, "step": 571} {"train_info/time_between_train_steps": 0.002881288528442383, "step": 571} {"info/global_step": 572, "train_info/time_within_train_step": 2.3919124603271484, "step": 572} {"train_info/time_between_train_steps": 0.002935171127319336, "step": 572} {"info/global_step": 573, "train_info/time_within_train_step": 2.3542399406433105, "step": 573} {"train_info/time_between_train_steps": 0.0029211044311523438, "step": 573} {"info/global_step": 574, "train_info/time_within_train_step": 2.354093074798584, "step": 574} {"train_info/time_between_train_steps": 0.002894163131713867, "step": 574} {"info/global_step": 575, "train_info/time_within_train_step": 2.3553950786590576, "step": 575} {"train_info/time_between_train_steps": 0.0029273033142089844, "step": 575} {"info/global_step": 576, "train_info/time_within_train_step": 2.3550684452056885, "step": 576} {"train_info/time_between_train_steps": 0.0029082298278808594, "step": 576} {"info/global_step": 577, "train_info/time_within_train_step": 2.5521202087402344, "step": 577} {"train_info/time_between_train_steps": 0.002965688705444336, "step": 577} {"info/global_step": 578, "train_info/time_within_train_step": 2.353996515274048, "step": 578} {"train_info/time_between_train_steps": 0.002950906753540039, "step": 578} {"info/global_step": 579, "train_info/time_within_train_step": 2.3546688556671143, "step": 579} {"train_info/time_between_train_steps": 0.0028946399688720703, "step": 579} {"info/global_step": 580, "train_info/time_within_train_step": 2.355177402496338, "step": 580} {"train_info/time_between_train_steps": 0.002911090850830078, "step": 580} {"info/global_step": 581, "train_info/time_within_train_step": 2.354959726333618, "step": 581} {"train_info/time_between_train_steps": 0.002916574478149414, "step": 581} {"info/global_step": 582, "train_info/time_within_train_step": 2.3540945053100586, "step": 582} {"train_info/time_between_train_steps": 0.0029172897338867188, "step": 582} {"info/global_step": 583, "train_info/time_within_train_step": 2.3540658950805664, "step": 583} {"train_info/time_between_train_steps": 0.0030400753021240234, "step": 583} {"info/global_step": 584, "train_info/time_within_train_step": 2.35341215133667, "step": 584} {"train_info/time_between_train_steps": 0.0029087066650390625, "step": 584} {"info/global_step": 585, "train_info/time_within_train_step": 2.354247570037842, "step": 585} {"train_info/time_between_train_steps": 0.002958059310913086, "step": 585} {"info/global_step": 586, "train_info/time_within_train_step": 2.3555619716644287, "step": 586} {"train_info/time_between_train_steps": 0.0034461021423339844, "step": 586} {"info/global_step": 587, "train_info/time_within_train_step": 2.3545079231262207, "step": 587} {"train_info/time_between_train_steps": 0.002898693084716797, "step": 587} {"info/global_step": 588, "train_info/time_within_train_step": 2.354503631591797, "step": 588} {"train_info/time_between_train_steps": 0.002910137176513672, "step": 588} {"info/global_step": 589, "train_info/time_within_train_step": 2.3544819355010986, "step": 589} {"train_info/time_between_train_steps": 0.0029282569885253906, "step": 589} {"info/global_step": 590, "train_info/time_within_train_step": 2.3536407947540283, "step": 590} {"train_info/time_between_train_steps": 0.002966165542602539, "step": 590} {"info/global_step": 591, "train_info/time_within_train_step": 2.3557581901550293, "step": 591} {"train_info/time_between_train_steps": 0.0028781890869140625, "step": 591} {"info/global_step": 592, "train_info/time_within_train_step": 2.354753255844116, "step": 592} {"train_info/time_between_train_steps": 0.002871990203857422, "step": 592} {"info/global_step": 593, "train_info/time_within_train_step": 2.3547182083129883, "step": 593} {"train_info/time_between_train_steps": 0.0029256343841552734, "step": 593} {"info/global_step": 594, "train_info/time_within_train_step": 2.3542497158050537, "step": 594} {"train_info/time_between_train_steps": 0.0034193992614746094, "step": 594} {"info/global_step": 595, "train_info/time_within_train_step": 2.353118658065796, "step": 595} {"train_info/time_between_train_steps": 0.002960681915283203, "step": 595} {"info/global_step": 596, "train_info/time_within_train_step": 2.3535377979278564, "step": 596} {"train_info/time_between_train_steps": 0.002884387969970703, "step": 596} {"info/global_step": 597, "train_info/time_within_train_step": 2.354374885559082, "step": 597} {"train_info/time_between_train_steps": 0.002884387969970703, "step": 597} {"info/global_step": 598, "train_info/time_within_train_step": 2.353870391845703, "step": 598} {"train_info/time_between_train_steps": 0.0028884410858154297, "step": 598} {"info/global_step": 599, "train_info/time_within_train_step": 2.354689598083496, "step": 599} {"train_info/time_between_train_steps": 0.0029299259185791016, "step": 599} {"info/global_step": 600, "train_info/time_within_train_step": 2.3543572425842285, "step": 600} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 4918.0, "train_info/memory_max_reserved": 4918.0, "_timestamp": 1746253761, "_runtime": 1580}, "step": 600} {"logs": {"train/loss": 4.6677, "train/learning_rate": 0.0005333333333333333, "train/epoch": 0.2, "_timestamp": 1746253761, "_runtime": 1580}, "step": 600} {"train_info/time_between_train_steps": 15.736468076705933, "step": 600} {"info/global_step": 601, "train_info/time_within_train_step": 2.194194793701172, "step": 601} {"train_info/time_between_train_steps": 0.00289154052734375, "step": 601} {"info/global_step": 602, "train_info/time_within_train_step": 2.368257999420166, "step": 602} {"train_info/time_between_train_steps": 0.002898693084716797, "step": 602} {"info/global_step": 603, "train_info/time_within_train_step": 2.2415454387664795, "step": 603} {"train_info/time_between_train_steps": 0.0029449462890625, "step": 603} {"info/global_step": 604, "train_info/time_within_train_step": 2.3484654426574707, "step": 604} {"train_info/time_between_train_steps": 0.0029354095458984375, "step": 604} {"info/global_step": 605, "train_info/time_within_train_step": 2.351199150085449, "step": 605} {"train_info/time_between_train_steps": 0.0029211044311523438, "step": 605} {"info/global_step": 606, "train_info/time_within_train_step": 2.354276180267334, "step": 606} {"train_info/time_between_train_steps": 0.0029096603393554688, "step": 606} {"info/global_step": 607, "train_info/time_within_train_step": 2.3546884059906006, "step": 607} {"train_info/time_between_train_steps": 0.0029053688049316406, "step": 607} {"info/global_step": 608, "train_info/time_within_train_step": 2.3561792373657227, "step": 608} {"train_info/time_between_train_steps": 0.0029091835021972656, "step": 608} {"info/global_step": 609, "train_info/time_within_train_step": 2.3558990955352783, "step": 609} {"train_info/time_between_train_steps": 0.002912759780883789, "step": 609} {"info/global_step": 610, "train_info/time_within_train_step": 2.3556413650512695, "step": 610} {"train_info/time_between_train_steps": 0.0029854774475097656, "step": 610} {"info/global_step": 611, "train_info/time_within_train_step": 2.355879783630371, "step": 611} {"train_info/time_between_train_steps": 0.0029332637786865234, "step": 611} {"info/global_step": 612, "train_info/time_within_train_step": 2.356994390487671, "step": 612} {"train_info/time_between_train_steps": 0.002976655960083008, "step": 612} {"info/global_step": 613, "train_info/time_within_train_step": 2.357159376144409, "step": 613} {"train_info/time_between_train_steps": 0.002918243408203125, "step": 613} {"info/global_step": 614, "train_info/time_within_train_step": 2.3559255599975586, "step": 614} {"train_info/time_between_train_steps": 0.002947568893432617, "step": 614} {"info/global_step": 615, "train_info/time_within_train_step": 2.3563292026519775, "step": 615} {"train_info/time_between_train_steps": 0.0028786659240722656, "step": 615} {"info/global_step": 616, "train_info/time_within_train_step": 2.355403184890747, "step": 616} {"train_info/time_between_train_steps": 0.0029082298278808594, "step": 616} {"info/global_step": 617, "train_info/time_within_train_step": 2.356180191040039, "step": 617} {"train_info/time_between_train_steps": 0.0029363632202148438, "step": 617} {"info/global_step": 618, "train_info/time_within_train_step": 2.356203079223633, "step": 618} {"train_info/time_between_train_steps": 0.0029261112213134766, "step": 618} {"info/global_step": 619, "train_info/time_within_train_step": 2.354992389678955, "step": 619} {"train_info/time_between_train_steps": 0.002970457077026367, "step": 619} {"info/global_step": 620, "train_info/time_within_train_step": 2.3557257652282715, "step": 620} {"train_info/time_between_train_steps": 0.0028963088989257812, "step": 620} {"info/global_step": 621, "train_info/time_within_train_step": 2.3566086292266846, "step": 621} {"train_info/time_between_train_steps": 0.0028829574584960938, "step": 621} {"info/global_step": 622, "train_info/time_within_train_step": 2.356558084487915, "step": 622} {"train_info/time_between_train_steps": 0.002892732620239258, "step": 622} {"info/global_step": 623, "train_info/time_within_train_step": 2.355053663253784, "step": 623} {"train_info/time_between_train_steps": 0.0029151439666748047, "step": 623} {"info/global_step": 624, "train_info/time_within_train_step": 2.3559978008270264, "step": 624} {"train_info/time_between_train_steps": 0.002960681915283203, "step": 624} {"info/global_step": 625, "train_info/time_within_train_step": 2.356478214263916, "step": 625} {"train_info/time_between_train_steps": 0.0029115676879882812, "step": 625} {"info/global_step": 626, "train_info/time_within_train_step": 2.521113872528076, "step": 626} {"train_info/time_between_train_steps": 0.0029230117797851562, "step": 626} {"info/global_step": 627, "train_info/time_within_train_step": 2.3559656143188477, "step": 627} {"train_info/time_between_train_steps": 0.0028848648071289062, "step": 627} {"info/global_step": 628, "train_info/time_within_train_step": 2.356675863265991, "step": 628} {"train_info/time_between_train_steps": 0.0029065608978271484, "step": 628} {"info/global_step": 629, "train_info/time_within_train_step": 2.3554341793060303, "step": 629} {"train_info/time_between_train_steps": 0.002933979034423828, "step": 629} {"info/global_step": 630, "train_info/time_within_train_step": 2.355799674987793, "step": 630} {"train_info/time_between_train_steps": 0.0029358863830566406, "step": 630} {"info/global_step": 631, "train_info/time_within_train_step": 2.355651617050171, "step": 631} {"train_info/time_between_train_steps": 0.0029544830322265625, "step": 631} {"info/global_step": 632, "train_info/time_within_train_step": 2.3566296100616455, "step": 632} {"train_info/time_between_train_steps": 0.0029904842376708984, "step": 632} {"info/global_step": 633, "train_info/time_within_train_step": 2.3553683757781982, "step": 633} {"train_info/time_between_train_steps": 0.0029633045196533203, "step": 633} {"info/global_step": 634, "train_info/time_within_train_step": 2.3560030460357666, "step": 634} {"train_info/time_between_train_steps": 0.0028989315032958984, "step": 634} {"info/global_step": 635, "train_info/time_within_train_step": 2.355407238006592, "step": 635} {"train_info/time_between_train_steps": 0.0034453868865966797, "step": 635} {"info/global_step": 636, "train_info/time_within_train_step": 2.3553853034973145, "step": 636} {"train_info/time_between_train_steps": 0.0029382705688476562, "step": 636} {"info/global_step": 637, "train_info/time_within_train_step": 2.356508255004883, "step": 637} {"train_info/time_between_train_steps": 0.003153562545776367, "step": 637} {"info/global_step": 638, "train_info/time_within_train_step": 2.3553988933563232, "step": 638} {"train_info/time_between_train_steps": 0.002893209457397461, "step": 638} {"info/global_step": 639, "train_info/time_within_train_step": 2.3557684421539307, "step": 639} {"train_info/time_between_train_steps": 0.0028908252716064453, "step": 639} {"info/global_step": 640, "train_info/time_within_train_step": 2.355289936065674, "step": 640} {"train_info/time_between_train_steps": 0.0029091835021972656, "step": 640} {"info/global_step": 641, "train_info/time_within_train_step": 2.3549673557281494, "step": 641} {"train_info/time_between_train_steps": 0.0028998851776123047, "step": 641} {"info/global_step": 642, "train_info/time_within_train_step": 2.354161500930786, "step": 642} {"train_info/time_between_train_steps": 0.0028972625732421875, "step": 642} {"info/global_step": 643, "train_info/time_within_train_step": 2.3556010723114014, "step": 643} {"train_info/time_between_train_steps": 0.002915620803833008, "step": 643} {"info/global_step": 644, "train_info/time_within_train_step": 2.355743169784546, "step": 644} {"train_info/time_between_train_steps": 0.0029387474060058594, "step": 644} {"info/global_step": 645, "train_info/time_within_train_step": 2.3550896644592285, "step": 645} {"train_info/time_between_train_steps": 0.002900362014770508, "step": 645} {"info/global_step": 646, "train_info/time_within_train_step": 2.3560309410095215, "step": 646} {"train_info/time_between_train_steps": 0.00290679931640625, "step": 646} {"info/global_step": 647, "train_info/time_within_train_step": 2.3561859130859375, "step": 647} {"train_info/time_between_train_steps": 0.002887248992919922, "step": 647} {"info/global_step": 648, "train_info/time_within_train_step": 2.3553764820098877, "step": 648} {"train_info/time_between_train_steps": 0.002924203872680664, "step": 648} {"info/global_step": 649, "train_info/time_within_train_step": 2.355081558227539, "step": 649} {"train_info/time_between_train_steps": 0.00298309326171875, "step": 649} {"info/global_step": 650, "train_info/time_within_train_step": 2.515230655670166, "step": 650} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 4918.0, "train_info/memory_max_reserved": 4918.0, "_timestamp": 1746253895, "_runtime": 1714}, "step": 650} {"logs": {"train/loss": 4.6048, "train/learning_rate": 0.0005222222222222222, "train/epoch": 0.22, "_timestamp": 1746253895, "_runtime": 1714}, "step": 650} {"train_info/time_between_train_steps": 0.024241924285888672, "step": 650} {"info/global_step": 651, "train_info/time_within_train_step": 2.353912115097046, "step": 651} {"train_info/time_between_train_steps": 0.0028929710388183594, "step": 651} {"info/global_step": 652, "train_info/time_within_train_step": 2.354393720626831, "step": 652} {"train_info/time_between_train_steps": 0.00292205810546875, "step": 652} {"info/global_step": 653, "train_info/time_within_train_step": 2.3546810150146484, "step": 653} {"train_info/time_between_train_steps": 0.0028824806213378906, "step": 653} {"info/global_step": 654, "train_info/time_within_train_step": 2.3544015884399414, "step": 654} {"train_info/time_between_train_steps": 0.002904653549194336, "step": 654} {"info/global_step": 655, "train_info/time_within_train_step": 2.354173183441162, "step": 655} {"train_info/time_between_train_steps": 0.002899646759033203, "step": 655} {"info/global_step": 656, "train_info/time_within_train_step": 2.3550479412078857, "step": 656} {"train_info/time_between_train_steps": 0.002939462661743164, "step": 656} {"info/global_step": 657, "train_info/time_within_train_step": 2.354377269744873, "step": 657} {"train_info/time_between_train_steps": 0.0028908252716064453, "step": 657} {"info/global_step": 658, "train_info/time_within_train_step": 2.3555662631988525, "step": 658} {"train_info/time_between_train_steps": 0.002904176712036133, "step": 658} {"info/global_step": 659, "train_info/time_within_train_step": 2.3561348915100098, "step": 659} {"train_info/time_between_train_steps": 0.0029070377349853516, "step": 659} {"info/global_step": 660, "train_info/time_within_train_step": 2.3544375896453857, "step": 660} {"train_info/time_between_train_steps": 0.0029075145721435547, "step": 660} {"info/global_step": 661, "train_info/time_within_train_step": 2.354485273361206, "step": 661} {"train_info/time_between_train_steps": 0.0029430389404296875, "step": 661} {"info/global_step": 662, "train_info/time_within_train_step": 2.35495924949646, "step": 662} {"train_info/time_between_train_steps": 0.003482341766357422, "step": 662} {"info/global_step": 663, "train_info/time_within_train_step": 2.3552494049072266, "step": 663} {"train_info/time_between_train_steps": 0.002928495407104492, "step": 663} {"info/global_step": 664, "train_info/time_within_train_step": 2.3563385009765625, "step": 664} {"train_info/time_between_train_steps": 0.0029015541076660156, "step": 664} {"info/global_step": 665, "train_info/time_within_train_step": 2.3550193309783936, "step": 665} {"train_info/time_between_train_steps": 0.002893209457397461, "step": 665} {"info/global_step": 666, "train_info/time_within_train_step": 2.3561489582061768, "step": 666} {"train_info/time_between_train_steps": 0.002881288528442383, "step": 666} {"info/global_step": 667, "train_info/time_within_train_step": 2.3543694019317627, "step": 667} {"train_info/time_between_train_steps": 0.0029125213623046875, "step": 667} {"info/global_step": 668, "train_info/time_within_train_step": 2.3542964458465576, "step": 668} {"train_info/time_between_train_steps": 0.002900838851928711, "step": 668} {"info/global_step": 669, "train_info/time_within_train_step": 2.3543765544891357, "step": 669} {"train_info/time_between_train_steps": 0.002888202667236328, "step": 669} {"info/global_step": 670, "train_info/time_within_train_step": 2.354839563369751, "step": 670} {"train_info/time_between_train_steps": 0.0029146671295166016, "step": 670} {"info/global_step": 671, "train_info/time_within_train_step": 2.3548293113708496, "step": 671} {"train_info/time_between_train_steps": 0.002882242202758789, "step": 671} {"info/global_step": 672, "train_info/time_within_train_step": 2.3548460006713867, "step": 672} {"train_info/time_between_train_steps": 0.0028798580169677734, "step": 672} {"info/global_step": 673, "train_info/time_within_train_step": 2.3552560806274414, "step": 673} {"train_info/time_between_train_steps": 0.0028884410858154297, "step": 673} {"info/global_step": 674, "train_info/time_within_train_step": 2.354757070541382, "step": 674} {"train_info/time_between_train_steps": 0.0029058456420898438, "step": 674} {"info/global_step": 675, "train_info/time_within_train_step": 2.4918770790100098, "step": 675} {"train_info/time_between_train_steps": 0.0028891563415527344, "step": 675} {"info/global_step": 676, "train_info/time_within_train_step": 2.3537285327911377, "step": 676} {"train_info/time_between_train_steps": 0.0028769969940185547, "step": 676} {"info/global_step": 677, "train_info/time_within_train_step": 2.3546082973480225, "step": 677} {"train_info/time_between_train_steps": 0.002924680709838867, "step": 677} {"info/global_step": 678, "train_info/time_within_train_step": 2.3541359901428223, "step": 678} {"train_info/time_between_train_steps": 0.002886056900024414, "step": 678} {"info/global_step": 679, "train_info/time_within_train_step": 2.3547613620758057, "step": 679} {"train_info/time_between_train_steps": 0.0029375553131103516, "step": 679} {"info/global_step": 680, "train_info/time_within_train_step": 2.3552520275115967, "step": 680} {"train_info/time_between_train_steps": 0.0030019283294677734, "step": 680} {"info/global_step": 681, "train_info/time_within_train_step": 2.3547563552856445, "step": 681} {"train_info/time_between_train_steps": 0.0029189586639404297, "step": 681} {"info/global_step": 682, "train_info/time_within_train_step": 2.3552792072296143, "step": 682} {"train_info/time_between_train_steps": 0.002949953079223633, "step": 682} {"info/global_step": 683, "train_info/time_within_train_step": 2.3553249835968018, "step": 683} {"train_info/time_between_train_steps": 0.003171205520629883, "step": 683} {"info/global_step": 684, "train_info/time_within_train_step": 2.3545007705688477, "step": 684} {"train_info/time_between_train_steps": 0.0029196739196777344, "step": 684} {"info/global_step": 685, "train_info/time_within_train_step": 2.3548715114593506, "step": 685} {"train_info/time_between_train_steps": 0.0029153823852539062, "step": 685} {"info/global_step": 686, "train_info/time_within_train_step": 2.3547255992889404, "step": 686} {"train_info/time_between_train_steps": 0.0028913021087646484, "step": 686} {"info/global_step": 687, "train_info/time_within_train_step": 2.3547215461730957, "step": 687} {"train_info/time_between_train_steps": 0.0028846263885498047, "step": 687} {"info/global_step": 688, "train_info/time_within_train_step": 2.355076789855957, "step": 688} {"train_info/time_between_train_steps": 0.0028862953186035156, "step": 688} {"info/global_step": 689, "train_info/time_within_train_step": 2.3550214767456055, "step": 689} {"train_info/time_between_train_steps": 0.0028786659240722656, "step": 689} {"info/global_step": 690, "train_info/time_within_train_step": 2.3539655208587646, "step": 690} {"train_info/time_between_train_steps": 0.0028831958770751953, "step": 690} {"info/global_step": 691, "train_info/time_within_train_step": 2.3539934158325195, "step": 691} {"train_info/time_between_train_steps": 0.002859830856323242, "step": 691} {"info/global_step": 692, "train_info/time_within_train_step": 2.3538384437561035, "step": 692} {"train_info/time_between_train_steps": 0.0029184818267822266, "step": 692} {"info/global_step": 693, "train_info/time_within_train_step": 2.3546841144561768, "step": 693} {"train_info/time_between_train_steps": 0.002911090850830078, "step": 693} {"info/global_step": 694, "train_info/time_within_train_step": 2.3543784618377686, "step": 694} {"train_info/time_between_train_steps": 0.002892017364501953, "step": 694} {"info/global_step": 695, "train_info/time_within_train_step": 2.3544414043426514, "step": 695} {"train_info/time_between_train_steps": 0.0028908252716064453, "step": 695} {"info/global_step": 696, "train_info/time_within_train_step": 2.354379653930664, "step": 696} {"train_info/time_between_train_steps": 0.0028700828552246094, "step": 696} {"info/global_step": 697, "train_info/time_within_train_step": 2.354987382888794, "step": 697} {"train_info/time_between_train_steps": 0.002929210662841797, "step": 697} {"info/global_step": 698, "train_info/time_within_train_step": 2.4798624515533447, "step": 698} {"train_info/time_between_train_steps": 0.002941608428955078, "step": 698} {"info/global_step": 699, "train_info/time_within_train_step": 2.3540072441101074, "step": 699} {"train_info/time_between_train_steps": 0.0028874874114990234, "step": 699} {"info/global_step": 700, "train_info/time_within_train_step": 2.3545310497283936, "step": 700} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 4918.0, "train_info/memory_max_reserved": 4918.0, "_timestamp": 1746254015, "_runtime": 1834}, "step": 700} {"logs": {"train/loss": 4.5558, "train/learning_rate": 0.0005111111111111111, "train/epoch": 0.23, "_timestamp": 1746254015, "_runtime": 1834}, "step": 700} {"train_info/time_between_train_steps": 14.809498071670532, "step": 700} {"info/global_step": 701, "train_info/time_within_train_step": 2.1991019248962402, "step": 701} {"train_info/time_between_train_steps": 0.0028924942016601562, "step": 701} {"info/global_step": 702, "train_info/time_within_train_step": 2.182490348815918, "step": 702} {"train_info/time_between_train_steps": 0.0028913021087646484, "step": 702} {"info/global_step": 703, "train_info/time_within_train_step": 2.2748842239379883, "step": 703} {"train_info/time_between_train_steps": 0.0029082298278808594, "step": 703} {"info/global_step": 704, "train_info/time_within_train_step": 2.372001886367798, "step": 704} {"train_info/time_between_train_steps": 0.002952098846435547, "step": 704} {"info/global_step": 705, "train_info/time_within_train_step": 2.352996587753296, "step": 705} {"train_info/time_between_train_steps": 0.002930164337158203, "step": 705} {"info/global_step": 706, "train_info/time_within_train_step": 2.3552258014678955, "step": 706} {"train_info/time_between_train_steps": 0.002887248992919922, "step": 706} {"info/global_step": 707, "train_info/time_within_train_step": 2.355490207672119, "step": 707} {"train_info/time_between_train_steps": 0.0028734207153320312, "step": 707} {"info/global_step": 708, "train_info/time_within_train_step": 2.355750799179077, "step": 708} {"train_info/time_between_train_steps": 0.0031011104583740234, "step": 708} {"info/global_step": 709, "train_info/time_within_train_step": 2.3562207221984863, "step": 709} {"train_info/time_between_train_steps": 0.0029006004333496094, "step": 709} {"info/global_step": 710, "train_info/time_within_train_step": 2.3576865196228027, "step": 710} {"train_info/time_between_train_steps": 0.002925872802734375, "step": 710} {"info/global_step": 711, "train_info/time_within_train_step": 2.3565874099731445, "step": 711} {"train_info/time_between_train_steps": 0.0028905868530273438, "step": 711} {"info/global_step": 712, "train_info/time_within_train_step": 2.356884479522705, "step": 712} {"train_info/time_between_train_steps": 0.0029413700103759766, "step": 712} {"info/global_step": 713, "train_info/time_within_train_step": 2.3580610752105713, "step": 713} {"train_info/time_between_train_steps": 0.0029218196868896484, "step": 713} {"info/global_step": 714, "train_info/time_within_train_step": 2.3582258224487305, "step": 714} {"train_info/time_between_train_steps": 0.0029420852661132812, "step": 714} {"info/global_step": 715, "train_info/time_within_train_step": 2.3577961921691895, "step": 715} {"train_info/time_between_train_steps": 0.0029058456420898438, "step": 715} {"info/global_step": 716, "train_info/time_within_train_step": 2.3576698303222656, "step": 716} {"train_info/time_between_train_steps": 0.0028994083404541016, "step": 716} {"info/global_step": 717, "train_info/time_within_train_step": 2.3574788570404053, "step": 717} {"train_info/time_between_train_steps": 0.0029439926147460938, "step": 717} {"info/global_step": 718, "train_info/time_within_train_step": 2.35772442817688, "step": 718} {"train_info/time_between_train_steps": 0.002953052520751953, "step": 718} {"info/global_step": 719, "train_info/time_within_train_step": 2.3569602966308594, "step": 719} {"train_info/time_between_train_steps": 0.002925872802734375, "step": 719} {"info/global_step": 720, "train_info/time_within_train_step": 2.356898307800293, "step": 720} {"train_info/time_between_train_steps": 0.0029180049896240234, "step": 720} {"info/global_step": 721, "train_info/time_within_train_step": 2.4421961307525635, "step": 721} {"train_info/time_between_train_steps": 0.0028755664825439453, "step": 721} {"info/global_step": 722, "train_info/time_within_train_step": 2.357757568359375, "step": 722} {"train_info/time_between_train_steps": 0.0029022693634033203, "step": 722} {"info/global_step": 723, "train_info/time_within_train_step": 2.356189012527466, "step": 723} {"train_info/time_between_train_steps": 0.0028874874114990234, "step": 723} {"info/global_step": 724, "train_info/time_within_train_step": 2.3569531440734863, "step": 724} {"train_info/time_between_train_steps": 0.0029070377349853516, "step": 724} {"info/global_step": 725, "train_info/time_within_train_step": 2.357278823852539, "step": 725} {"train_info/time_between_train_steps": 0.002877473831176758, "step": 725} {"info/global_step": 726, "train_info/time_within_train_step": 2.3581316471099854, "step": 726} {"train_info/time_between_train_steps": 0.002932310104370117, "step": 726} {"info/global_step": 727, "train_info/time_within_train_step": 2.357642650604248, "step": 727} {"train_info/time_between_train_steps": 0.0028786659240722656, "step": 727} {"info/global_step": 728, "train_info/time_within_train_step": 2.3566017150878906, "step": 728} {"train_info/time_between_train_steps": 0.002880096435546875, "step": 728} {"info/global_step": 729, "train_info/time_within_train_step": 2.3577821254730225, "step": 729} {"train_info/time_between_train_steps": 0.0028688907623291016, "step": 729} {"info/global_step": 730, "train_info/time_within_train_step": 2.3566548824310303, "step": 730} {"train_info/time_between_train_steps": 0.0028848648071289062, "step": 730} {"info/global_step": 731, "train_info/time_within_train_step": 2.3579046726226807, "step": 731} {"train_info/time_between_train_steps": 0.0029108524322509766, "step": 731} {"info/global_step": 732, "train_info/time_within_train_step": 2.357100486755371, "step": 732} {"train_info/time_between_train_steps": 0.003037691116333008, "step": 732} {"info/global_step": 733, "train_info/time_within_train_step": 2.3573596477508545, "step": 733} {"train_info/time_between_train_steps": 0.0028989315032958984, "step": 733} {"info/global_step": 734, "train_info/time_within_train_step": 2.35913348197937, "step": 734} {"train_info/time_between_train_steps": 0.0029006004333496094, "step": 734} {"info/global_step": 735, "train_info/time_within_train_step": 2.3572473526000977, "step": 735} {"train_info/time_between_train_steps": 0.0028989315032958984, "step": 735} {"info/global_step": 736, "train_info/time_within_train_step": 2.357407331466675, "step": 736} {"train_info/time_between_train_steps": 0.0029256343841552734, "step": 736} {"info/global_step": 737, "train_info/time_within_train_step": 2.358076333999634, "step": 737} {"train_info/time_between_train_steps": 0.002928018569946289, "step": 737} {"info/global_step": 738, "train_info/time_within_train_step": 2.3577795028686523, "step": 738} {"train_info/time_between_train_steps": 0.0029518604278564453, "step": 738} {"info/global_step": 739, "train_info/time_within_train_step": 2.3579699993133545, "step": 739} {"train_info/time_between_train_steps": 0.002947092056274414, "step": 739} {"info/global_step": 740, "train_info/time_within_train_step": 2.3575918674468994, "step": 740} {"train_info/time_between_train_steps": 0.002913951873779297, "step": 740} {"info/global_step": 741, "train_info/time_within_train_step": 2.3566324710845947, "step": 741} {"train_info/time_between_train_steps": 0.0029206275939941406, "step": 741} {"info/global_step": 742, "train_info/time_within_train_step": 2.3573977947235107, "step": 742} {"train_info/time_between_train_steps": 0.003095388412475586, "step": 742} {"info/global_step": 743, "train_info/time_within_train_step": 2.357370376586914, "step": 743} {"train_info/time_between_train_steps": 0.0031392574310302734, "step": 743} {"info/global_step": 744, "train_info/time_within_train_step": 2.512799024581909, "step": 744} {"train_info/time_between_train_steps": 0.0029900074005126953, "step": 744} {"info/global_step": 745, "train_info/time_within_train_step": 2.3565733432769775, "step": 745} {"train_info/time_between_train_steps": 0.0029523372650146484, "step": 745} {"info/global_step": 746, "train_info/time_within_train_step": 2.356807231903076, "step": 746} {"train_info/time_between_train_steps": 0.002964019775390625, "step": 746} {"info/global_step": 747, "train_info/time_within_train_step": 2.3570053577423096, "step": 747} {"train_info/time_between_train_steps": 0.0029592514038085938, "step": 747} {"info/global_step": 748, "train_info/time_within_train_step": 2.357016086578369, "step": 748} {"train_info/time_between_train_steps": 0.002981901168823242, "step": 748} {"info/global_step": 749, "train_info/time_within_train_step": 2.357041597366333, "step": 749} {"train_info/time_between_train_steps": 0.006186008453369141, "step": 749} {"info/global_step": 750, "train_info/time_within_train_step": 2.8668360710144043, "step": 750} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 4918.0, "train_info/memory_max_reserved": 4918.0, "_timestamp": 1746254149, "_runtime": 1968}, "step": 750} {"logs": {"train/loss": 4.4897, "train/learning_rate": 0.0005, "train/epoch": 0.25, "_timestamp": 1746254149, "_runtime": 1968}, "step": 750} {"train_info/time_between_train_steps": 0.02770066261291504, "step": 750} {"info/global_step": 751, "train_info/time_within_train_step": 2.3592491149902344, "step": 751} {"train_info/time_between_train_steps": 0.0061588287353515625, "step": 751} {"info/global_step": 752, "train_info/time_within_train_step": 2.3567116260528564, "step": 752} {"train_info/time_between_train_steps": 0.00619196891784668, "step": 752} {"info/global_step": 753, "train_info/time_within_train_step": 2.3567054271698, "step": 753} {"train_info/time_between_train_steps": 0.0061492919921875, "step": 753} {"info/global_step": 754, "train_info/time_within_train_step": 2.3562099933624268, "step": 754} {"train_info/time_between_train_steps": 0.006140708923339844, "step": 754} {"info/global_step": 755, "train_info/time_within_train_step": 2.357231378555298, "step": 755} {"train_info/time_between_train_steps": 0.00616908073425293, "step": 755} {"info/global_step": 756, "train_info/time_within_train_step": 2.3562240600585938, "step": 756} {"train_info/time_between_train_steps": 0.006103992462158203, "step": 756} {"info/global_step": 757, "train_info/time_within_train_step": 2.3556299209594727, "step": 757} {"train_info/time_between_train_steps": 0.006083011627197266, "step": 757} {"info/global_step": 758, "train_info/time_within_train_step": 2.3558318614959717, "step": 758} {"train_info/time_between_train_steps": 0.006130218505859375, "step": 758} {"info/global_step": 759, "train_info/time_within_train_step": 2.3560492992401123, "step": 759} {"train_info/time_between_train_steps": 0.0061206817626953125, "step": 759} {"info/global_step": 760, "train_info/time_within_train_step": 2.3561270236968994, "step": 760} {"train_info/time_between_train_steps": 0.006152153015136719, "step": 760} {"info/global_step": 761, "train_info/time_within_train_step": 2.3567206859588623, "step": 761} {"train_info/time_between_train_steps": 0.006165981292724609, "step": 761} {"info/global_step": 762, "train_info/time_within_train_step": 2.3560638427734375, "step": 762} {"train_info/time_between_train_steps": 0.006151676177978516, "step": 762} {"info/global_step": 763, "train_info/time_within_train_step": 2.3554024696350098, "step": 763} {"train_info/time_between_train_steps": 0.0029306411743164062, "step": 763} {"info/global_step": 764, "train_info/time_within_train_step": 2.357182502746582, "step": 764} {"train_info/time_between_train_steps": 0.0029723644256591797, "step": 764} {"info/global_step": 765, "train_info/time_within_train_step": 2.355790853500366, "step": 765} {"train_info/time_between_train_steps": 0.0029153823852539062, "step": 765} {"info/global_step": 766, "train_info/time_within_train_step": 2.3563618659973145, "step": 766} {"train_info/time_between_train_steps": 0.0029587745666503906, "step": 766} {"info/global_step": 767, "train_info/time_within_train_step": 2.356477737426758, "step": 767} {"train_info/time_between_train_steps": 0.002975940704345703, "step": 767} {"info/global_step": 768, "train_info/time_within_train_step": 2.4390738010406494, "step": 768} {"train_info/time_between_train_steps": 0.0029044151306152344, "step": 768} {"info/global_step": 769, "train_info/time_within_train_step": 2.3557515144348145, "step": 769} {"train_info/time_between_train_steps": 0.0029523372650146484, "step": 769} {"info/global_step": 770, "train_info/time_within_train_step": 2.3572418689727783, "step": 770} {"train_info/time_between_train_steps": 0.0029277801513671875, "step": 770} {"info/global_step": 771, "train_info/time_within_train_step": 2.355807304382324, "step": 771} {"train_info/time_between_train_steps": 0.002916574478149414, "step": 771} {"info/global_step": 772, "train_info/time_within_train_step": 2.3565046787261963, "step": 772} {"train_info/time_between_train_steps": 0.002939462661743164, "step": 772} {"info/global_step": 773, "train_info/time_within_train_step": 2.3568801879882812, "step": 773} {"train_info/time_between_train_steps": 0.0029637813568115234, "step": 773} {"info/global_step": 774, "train_info/time_within_train_step": 2.356372356414795, "step": 774} {"train_info/time_between_train_steps": 0.0029048919677734375, "step": 774} {"info/global_step": 775, "train_info/time_within_train_step": 2.3554627895355225, "step": 775} {"train_info/time_between_train_steps": 0.0029592514038085938, "step": 775} {"info/global_step": 776, "train_info/time_within_train_step": 2.3556039333343506, "step": 776} {"train_info/time_between_train_steps": 0.0029358863830566406, "step": 776} {"info/global_step": 777, "train_info/time_within_train_step": 2.355332612991333, "step": 777} {"train_info/time_between_train_steps": 0.0029425621032714844, "step": 777} {"info/global_step": 778, "train_info/time_within_train_step": 2.357410430908203, "step": 778} {"train_info/time_between_train_steps": 0.0029985904693603516, "step": 778} {"info/global_step": 779, "train_info/time_within_train_step": 2.3570713996887207, "step": 779} {"train_info/time_between_train_steps": 0.002945423126220703, "step": 779} {"info/global_step": 780, "train_info/time_within_train_step": 2.356816053390503, "step": 780} {"train_info/time_between_train_steps": 0.002930879592895508, "step": 780} {"info/global_step": 781, "train_info/time_within_train_step": 2.3562512397766113, "step": 781} {"train_info/time_between_train_steps": 0.002908945083618164, "step": 781} {"info/global_step": 782, "train_info/time_within_train_step": 2.3559532165527344, "step": 782} {"train_info/time_between_train_steps": 0.0029315948486328125, "step": 782} {"info/global_step": 783, "train_info/time_within_train_step": 2.3574960231781006, "step": 783} {"train_info/time_between_train_steps": 0.002912759780883789, "step": 783} {"info/global_step": 784, "train_info/time_within_train_step": 2.3570947647094727, "step": 784} {"train_info/time_between_train_steps": 0.0029115676879882812, "step": 784} {"info/global_step": 785, "train_info/time_within_train_step": 2.358287811279297, "step": 785} {"train_info/time_between_train_steps": 0.0029311180114746094, "step": 785} {"info/global_step": 786, "train_info/time_within_train_step": 2.3564858436584473, "step": 786} {"train_info/time_between_train_steps": 0.002960681915283203, "step": 786} {"info/global_step": 787, "train_info/time_within_train_step": 2.3563098907470703, "step": 787} {"train_info/time_between_train_steps": 0.002958059310913086, "step": 787} {"info/global_step": 788, "train_info/time_within_train_step": 2.355792999267578, "step": 788} {"train_info/time_between_train_steps": 0.0029144287109375, "step": 788} {"info/global_step": 789, "train_info/time_within_train_step": 2.356506824493408, "step": 789} {"train_info/time_between_train_steps": 0.0029494762420654297, "step": 789} {"info/global_step": 790, "train_info/time_within_train_step": 2.3985016345977783, "step": 790} {"train_info/time_between_train_steps": 0.0028815269470214844, "step": 790} {"info/global_step": 791, "train_info/time_within_train_step": 2.3561110496520996, "step": 791} {"train_info/time_between_train_steps": 0.002916574478149414, "step": 791} {"info/global_step": 792, "train_info/time_within_train_step": 2.3570592403411865, "step": 792} {"train_info/time_between_train_steps": 0.0029954910278320312, "step": 792} {"info/global_step": 793, "train_info/time_within_train_step": 2.3566107749938965, "step": 793} {"train_info/time_between_train_steps": 0.0029723644256591797, "step": 793} {"info/global_step": 794, "train_info/time_within_train_step": 2.3577349185943604, "step": 794} {"train_info/time_between_train_steps": 0.002923727035522461, "step": 794} {"info/global_step": 795, "train_info/time_within_train_step": 2.3570094108581543, "step": 795} {"train_info/time_between_train_steps": 0.00290679931640625, "step": 795} {"info/global_step": 796, "train_info/time_within_train_step": 2.3562278747558594, "step": 796} {"train_info/time_between_train_steps": 0.0029151439666748047, "step": 796} {"info/global_step": 797, "train_info/time_within_train_step": 2.3570656776428223, "step": 797} {"train_info/time_between_train_steps": 0.002983570098876953, "step": 797} {"info/global_step": 798, "train_info/time_within_train_step": 2.3569881916046143, "step": 798} {"train_info/time_between_train_steps": 0.002985715866088867, "step": 798} {"info/global_step": 799, "train_info/time_within_train_step": 2.3584983348846436, "step": 799} {"train_info/time_between_train_steps": 0.003062725067138672, "step": 799} {"info/global_step": 800, "train_info/time_within_train_step": 2.356773614883423, "step": 800} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 4918.0, "train_info/memory_max_reserved": 4918.0, "_timestamp": 1746254268, "_runtime": 2087}, "step": 800} {"logs": {"train/loss": 4.4583, "train/learning_rate": 0.0004888888888888889, "train/epoch": 0.27, "_timestamp": 1746254268, "_runtime": 2087}, "step": 800} {"train_info/time_between_train_steps": 13.304758548736572, "step": 800} {"info/global_step": 801, "train_info/time_within_train_step": 2.200214385986328, "step": 801} {"train_info/time_between_train_steps": 0.0029649734497070312, "step": 801} {"info/global_step": 802, "train_info/time_within_train_step": 2.184270143508911, "step": 802} {"train_info/time_between_train_steps": 0.0029768943786621094, "step": 802} {"info/global_step": 803, "train_info/time_within_train_step": 2.2935128211975098, "step": 803} {"train_info/time_between_train_steps": 0.002950429916381836, "step": 803} {"info/global_step": 804, "train_info/time_within_train_step": 2.350538969039917, "step": 804} {"train_info/time_between_train_steps": 0.0029115676879882812, "step": 804} {"info/global_step": 805, "train_info/time_within_train_step": 2.354063034057617, "step": 805} {"train_info/time_between_train_steps": 0.002965211868286133, "step": 805} {"info/global_step": 806, "train_info/time_within_train_step": 2.3565921783447266, "step": 806} {"train_info/time_between_train_steps": 0.0029480457305908203, "step": 806} {"info/global_step": 807, "train_info/time_within_train_step": 2.354919910430908, "step": 807} {"train_info/time_between_train_steps": 0.0029573440551757812, "step": 807} {"info/global_step": 808, "train_info/time_within_train_step": 2.356710433959961, "step": 808} {"train_info/time_between_train_steps": 0.0029304027557373047, "step": 808} {"info/global_step": 809, "train_info/time_within_train_step": 2.3574981689453125, "step": 809} {"train_info/time_between_train_steps": 0.0029363632202148438, "step": 809} {"info/global_step": 810, "train_info/time_within_train_step": 2.356722354888916, "step": 810} {"train_info/time_between_train_steps": 0.0029458999633789062, "step": 810} {"info/global_step": 811, "train_info/time_within_train_step": 2.3564915657043457, "step": 811} {"train_info/time_between_train_steps": 0.002904176712036133, "step": 811} {"info/global_step": 812, "train_info/time_within_train_step": 2.415863513946533, "step": 812} {"train_info/time_between_train_steps": 0.0029740333557128906, "step": 812} {"info/global_step": 813, "train_info/time_within_train_step": 2.3567967414855957, "step": 813} {"train_info/time_between_train_steps": 0.002927541732788086, "step": 813} {"info/global_step": 814, "train_info/time_within_train_step": 2.3579111099243164, "step": 814} {"train_info/time_between_train_steps": 0.002907991409301758, "step": 814} {"info/global_step": 815, "train_info/time_within_train_step": 2.3568921089172363, "step": 815} {"train_info/time_between_train_steps": 0.0029306411743164062, "step": 815} {"info/global_step": 816, "train_info/time_within_train_step": 2.3577651977539062, "step": 816} {"train_info/time_between_train_steps": 0.0029489994049072266, "step": 816} {"info/global_step": 817, "train_info/time_within_train_step": 2.3912458419799805, "step": 817} {"train_info/time_between_train_steps": 0.0031507015228271484, "step": 817} {"info/global_step": 818, "train_info/time_within_train_step": 2.357539653778076, "step": 818} {"train_info/time_between_train_steps": 0.003318309783935547, "step": 818} {"info/global_step": 819, "train_info/time_within_train_step": 2.3581368923187256, "step": 819} {"train_info/time_between_train_steps": 0.0029239654541015625, "step": 819} {"info/global_step": 820, "train_info/time_within_train_step": 2.3580758571624756, "step": 820} {"train_info/time_between_train_steps": 0.002893209457397461, "step": 820} {"info/global_step": 821, "train_info/time_within_train_step": 2.357311487197876, "step": 821} {"train_info/time_between_train_steps": 0.0029916763305664062, "step": 821} {"info/global_step": 822, "train_info/time_within_train_step": 2.356553077697754, "step": 822} {"train_info/time_between_train_steps": 0.002933502197265625, "step": 822} {"info/global_step": 823, "train_info/time_within_train_step": 2.3571133613586426, "step": 823} {"train_info/time_between_train_steps": 0.002927064895629883, "step": 823} {"info/global_step": 824, "train_info/time_within_train_step": 2.357466697692871, "step": 824} {"train_info/time_between_train_steps": 0.002966642379760742, "step": 824} {"info/global_step": 825, "train_info/time_within_train_step": 2.35780930519104, "step": 825} {"train_info/time_between_train_steps": 0.002972126007080078, "step": 825} {"info/global_step": 826, "train_info/time_within_train_step": 2.3577651977539062, "step": 826} {"train_info/time_between_train_steps": 0.004042387008666992, "step": 826} {"info/global_step": 827, "train_info/time_within_train_step": 2.3587615489959717, "step": 827} {"train_info/time_between_train_steps": 0.0029420852661132812, "step": 827} {"info/global_step": 828, "train_info/time_within_train_step": 2.359025239944458, "step": 828} {"train_info/time_between_train_steps": 0.002997159957885742, "step": 828} {"info/global_step": 829, "train_info/time_within_train_step": 2.357618808746338, "step": 829} {"train_info/time_between_train_steps": 0.002928495407104492, "step": 829} {"info/global_step": 830, "train_info/time_within_train_step": 2.358415365219116, "step": 830} {"train_info/time_between_train_steps": 0.0029523372650146484, "step": 830} {"info/global_step": 831, "train_info/time_within_train_step": 2.3578827381134033, "step": 831} {"train_info/time_between_train_steps": 0.002955198287963867, "step": 831} {"info/global_step": 832, "train_info/time_within_train_step": 2.357222318649292, "step": 832} {"train_info/time_between_train_steps": 0.0029730796813964844, "step": 832} {"info/global_step": 833, "train_info/time_within_train_step": 2.358407497406006, "step": 833} {"train_info/time_between_train_steps": 0.003041505813598633, "step": 833} {"info/global_step": 834, "train_info/time_within_train_step": 2.402888059616089, "step": 834} {"train_info/time_between_train_steps": 0.003072023391723633, "step": 834} {"info/global_step": 835, "train_info/time_within_train_step": 2.358734130859375, "step": 835} {"train_info/time_between_train_steps": 0.0030150413513183594, "step": 835} {"info/global_step": 836, "train_info/time_within_train_step": 2.3576836585998535, "step": 836} {"train_info/time_between_train_steps": 0.0030138492584228516, "step": 836} {"info/global_step": 837, "train_info/time_within_train_step": 2.3580565452575684, "step": 837} {"train_info/time_between_train_steps": 0.0030057430267333984, "step": 837} {"info/global_step": 838, "train_info/time_within_train_step": 2.357844352722168, "step": 838} {"train_info/time_between_train_steps": 0.003034830093383789, "step": 838} {"info/global_step": 839, "train_info/time_within_train_step": 2.35823130607605, "step": 839} {"train_info/time_between_train_steps": 0.0030994415283203125, "step": 839} {"info/global_step": 840, "train_info/time_within_train_step": 2.358511209487915, "step": 840} {"train_info/time_between_train_steps": 0.003114938735961914, "step": 840} {"info/global_step": 841, "train_info/time_within_train_step": 2.358015775680542, "step": 841} {"train_info/time_between_train_steps": 0.0031480789184570312, "step": 841} {"info/global_step": 842, "train_info/time_within_train_step": 2.357320547103882, "step": 842} {"train_info/time_between_train_steps": 0.002967357635498047, "step": 842} {"info/global_step": 843, "train_info/time_within_train_step": 2.357208013534546, "step": 843} {"train_info/time_between_train_steps": 0.003123044967651367, "step": 843} {"info/global_step": 844, "train_info/time_within_train_step": 2.3574483394622803, "step": 844} {"train_info/time_between_train_steps": 0.003098011016845703, "step": 844} {"info/global_step": 845, "train_info/time_within_train_step": 2.3575868606567383, "step": 845} {"train_info/time_between_train_steps": 0.0034096240997314453, "step": 845} {"info/global_step": 846, "train_info/time_within_train_step": 2.35843563079834, "step": 846} {"train_info/time_between_train_steps": 0.003418445587158203, "step": 846} {"info/global_step": 847, "train_info/time_within_train_step": 2.358994960784912, "step": 847} {"train_info/time_between_train_steps": 0.0036253929138183594, "step": 847} {"info/global_step": 848, "train_info/time_within_train_step": 2.3599636554718018, "step": 848} {"train_info/time_between_train_steps": 0.0033304691314697266, "step": 848} {"info/global_step": 849, "train_info/time_within_train_step": 2.3597652912139893, "step": 849} {"train_info/time_between_train_steps": 0.0035305023193359375, "step": 849} {"info/global_step": 850, "train_info/time_within_train_step": 2.3607594966888428, "step": 850} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 4918.0, "train_info/memory_max_reserved": 4918.0, "_timestamp": 1746254400, "_runtime": 2219}, "step": 850} {"logs": {"train/loss": 4.4188, "train/learning_rate": 0.0004777777777777777, "train/epoch": 0.28, "_timestamp": 1746254400, "_runtime": 2219}, "step": 850} {"train_info/time_between_train_steps": 0.02497243881225586, "step": 850} {"info/global_step": 851, "train_info/time_within_train_step": 2.358534812927246, "step": 851} {"train_info/time_between_train_steps": 0.003407001495361328, "step": 851} {"info/global_step": 852, "train_info/time_within_train_step": 2.3599729537963867, "step": 852} {"train_info/time_between_train_steps": 0.003744363784790039, "step": 852} {"info/global_step": 853, "train_info/time_within_train_step": 2.3595705032348633, "step": 853} {"train_info/time_between_train_steps": 0.003932952880859375, "step": 853} {"info/global_step": 854, "train_info/time_within_train_step": 2.359409809112549, "step": 854} {"train_info/time_between_train_steps": 0.003544330596923828, "step": 854} {"info/global_step": 855, "train_info/time_within_train_step": 2.358534336090088, "step": 855} {"train_info/time_between_train_steps": 0.0035943984985351562, "step": 855} {"info/global_step": 856, "train_info/time_within_train_step": 2.393261432647705, "step": 856} {"train_info/time_between_train_steps": 0.003468751907348633, "step": 856} {"info/global_step": 857, "train_info/time_within_train_step": 2.359316825866699, "step": 857} {"train_info/time_between_train_steps": 0.003684520721435547, "step": 857} {"info/global_step": 858, "train_info/time_within_train_step": 2.3610663414001465, "step": 858} {"train_info/time_between_train_steps": 0.003663301467895508, "step": 858} {"info/global_step": 859, "train_info/time_within_train_step": 2.3607845306396484, "step": 859} {"train_info/time_between_train_steps": 0.004098415374755859, "step": 859} {"info/global_step": 860, "train_info/time_within_train_step": 2.360459089279175, "step": 860} {"train_info/time_between_train_steps": 0.003846406936645508, "step": 860} {"train_info/time_between_train_steps": 2.5900800228118896, "step": 860} {"info/global_step": 861, "train_info/time_within_train_step": 2.5976479053497314, "step": 861} {"train_info/time_between_train_steps": 0.0032858848571777344, "step": 861} {"info/global_step": 862, "train_info/time_within_train_step": 2.357499599456787, "step": 862} {"train_info/time_between_train_steps": 0.003790616989135742, "step": 862} {"info/global_step": 863, "train_info/time_within_train_step": 2.3593780994415283, "step": 863} {"train_info/time_between_train_steps": 0.0033364295959472656, "step": 863} {"info/global_step": 864, "train_info/time_within_train_step": 2.3583970069885254, "step": 864} {"train_info/time_between_train_steps": 0.0036573410034179688, "step": 864} {"info/global_step": 865, "train_info/time_within_train_step": 2.3576748371124268, "step": 865} {"train_info/time_between_train_steps": 0.0034551620483398438, "step": 865} {"info/global_step": 866, "train_info/time_within_train_step": 2.3588545322418213, "step": 866} {"train_info/time_between_train_steps": 0.0033681392669677734, "step": 866} {"info/global_step": 867, "train_info/time_within_train_step": 2.3580162525177, "step": 867} {"train_info/time_between_train_steps": 0.003506898880004883, "step": 867} {"info/global_step": 868, "train_info/time_within_train_step": 2.3582029342651367, "step": 868} {"train_info/time_between_train_steps": 0.003332376480102539, "step": 868} {"info/global_step": 869, "train_info/time_within_train_step": 2.3583710193634033, "step": 869} {"train_info/time_between_train_steps": 0.0033969879150390625, "step": 869} {"info/global_step": 870, "train_info/time_within_train_step": 2.3580222129821777, "step": 870} {"train_info/time_between_train_steps": 0.0034029483795166016, "step": 870} {"info/global_step": 871, "train_info/time_within_train_step": 2.3569512367248535, "step": 871} {"train_info/time_between_train_steps": 0.0033659934997558594, "step": 871} {"info/global_step": 872, "train_info/time_within_train_step": 2.3588876724243164, "step": 872} {"train_info/time_between_train_steps": 0.0033719539642333984, "step": 872} {"info/global_step": 873, "train_info/time_within_train_step": 2.357377529144287, "step": 873} {"train_info/time_between_train_steps": 0.0033893585205078125, "step": 873} {"info/global_step": 874, "train_info/time_within_train_step": 2.3581316471099854, "step": 874} {"train_info/time_between_train_steps": 0.0034482479095458984, "step": 874} {"info/global_step": 875, "train_info/time_within_train_step": 2.3590493202209473, "step": 875} {"train_info/time_between_train_steps": 0.0034379959106445312, "step": 875} {"info/global_step": 876, "train_info/time_within_train_step": 2.3567593097686768, "step": 876} {"train_info/time_between_train_steps": 0.0034825801849365234, "step": 876} {"info/global_step": 877, "train_info/time_within_train_step": 2.3584394454956055, "step": 877} {"train_info/time_between_train_steps": 0.003447294235229492, "step": 877} {"info/global_step": 878, "train_info/time_within_train_step": 2.3580479621887207, "step": 878} {"train_info/time_between_train_steps": 0.003396749496459961, "step": 878} {"info/global_step": 879, "train_info/time_within_train_step": 2.3570873737335205, "step": 879} {"train_info/time_between_train_steps": 0.0033991336822509766, "step": 879} {"info/global_step": 880, "train_info/time_within_train_step": 2.3578290939331055, "step": 880} {"train_info/time_between_train_steps": 0.0034203529357910156, "step": 880} {"info/global_step": 881, "train_info/time_within_train_step": 2.358398914337158, "step": 881} {"train_info/time_between_train_steps": 0.003342866897583008, "step": 881} {"info/global_step": 882, "train_info/time_within_train_step": 2.3587191104888916, "step": 882} {"train_info/time_between_train_steps": 0.0034720897674560547, "step": 882} {"info/global_step": 883, "train_info/time_within_train_step": 2.3577797412872314, "step": 883} {"train_info/time_between_train_steps": 0.00342559814453125, "step": 883} {"info/global_step": 884, "train_info/time_within_train_step": 2.6522834300994873, "step": 884} {"train_info/time_between_train_steps": 0.0032262802124023438, "step": 884} {"info/global_step": 885, "train_info/time_within_train_step": 2.357734441757202, "step": 885} {"train_info/time_between_train_steps": 0.003178834915161133, "step": 885} {"info/global_step": 886, "train_info/time_within_train_step": 2.358318567276001, "step": 886} {"train_info/time_between_train_steps": 0.003171682357788086, "step": 886} {"info/global_step": 887, "train_info/time_within_train_step": 2.3624258041381836, "step": 887} {"train_info/time_between_train_steps": 0.0032715797424316406, "step": 887} {"info/global_step": 888, "train_info/time_within_train_step": 2.3571383953094482, "step": 888} {"train_info/time_between_train_steps": 0.003219127655029297, "step": 888} {"info/global_step": 889, "train_info/time_within_train_step": 2.3573338985443115, "step": 889} {"train_info/time_between_train_steps": 0.003233671188354492, "step": 889} {"info/global_step": 890, "train_info/time_within_train_step": 2.3566195964813232, "step": 890} {"train_info/time_between_train_steps": 0.0031850337982177734, "step": 890} {"info/global_step": 891, "train_info/time_within_train_step": 2.3568685054779053, "step": 891} {"train_info/time_between_train_steps": 0.0031859874725341797, "step": 891} {"info/global_step": 892, "train_info/time_within_train_step": 2.3577842712402344, "step": 892} {"train_info/time_between_train_steps": 0.0031385421752929688, "step": 892} {"info/global_step": 893, "train_info/time_within_train_step": 2.3583719730377197, "step": 893} {"train_info/time_between_train_steps": 0.0031914710998535156, "step": 893} {"info/global_step": 894, "train_info/time_within_train_step": 2.3582794666290283, "step": 894} {"train_info/time_between_train_steps": 0.0031995773315429688, "step": 894} {"info/global_step": 895, "train_info/time_within_train_step": 2.3574655055999756, "step": 895} {"train_info/time_between_train_steps": 0.0032396316528320312, "step": 895} {"info/global_step": 896, "train_info/time_within_train_step": 2.3580658435821533, "step": 896} {"train_info/time_between_train_steps": 0.0031669139862060547, "step": 896} {"info/global_step": 897, "train_info/time_within_train_step": 2.3569085597991943, "step": 897} {"train_info/time_between_train_steps": 0.003156900405883789, "step": 897} {"info/global_step": 898, "train_info/time_within_train_step": 2.357248067855835, "step": 898} {"train_info/time_between_train_steps": 0.0031490325927734375, "step": 898} {"info/global_step": 899, "train_info/time_within_train_step": 2.357816219329834, "step": 899} {"train_info/time_between_train_steps": 0.0031898021697998047, "step": 899} {"info/global_step": 900, "train_info/time_within_train_step": 2.357839822769165, "step": 900} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 4958.0, "train_info/memory_max_reserved": 4958.0, "_timestamp": 1746254522, "_runtime": 2341}, "step": 900} {"logs": {"train/loss": 4.4305, "train/learning_rate": 0.0004666666666666666, "train/epoch": 1.01, "_timestamp": 1746254522, "_runtime": 2341}, "step": 900} {"train_info/time_between_train_steps": 13.468150854110718, "step": 900} {"info/global_step": 901, "train_info/time_within_train_step": 2.199777841567993, "step": 901} {"train_info/time_between_train_steps": 0.0031452178955078125, "step": 901} {"info/global_step": 902, "train_info/time_within_train_step": 2.1833157539367676, "step": 902} {"train_info/time_between_train_steps": 0.003185272216796875, "step": 902} {"info/global_step": 903, "train_info/time_within_train_step": 2.2951979637145996, "step": 903} {"train_info/time_between_train_steps": 0.0031523704528808594, "step": 903} {"info/global_step": 904, "train_info/time_within_train_step": 2.34971284866333, "step": 904} {"train_info/time_between_train_steps": 0.003178834915161133, "step": 904} {"info/global_step": 905, "train_info/time_within_train_step": 2.3529090881347656, "step": 905} {"train_info/time_between_train_steps": 0.003185749053955078, "step": 905} {"info/global_step": 906, "train_info/time_within_train_step": 2.3554749488830566, "step": 906} {"train_info/time_between_train_steps": 0.0031685829162597656, "step": 906} {"info/global_step": 907, "train_info/time_within_train_step": 2.355008602142334, "step": 907} {"train_info/time_between_train_steps": 0.003148794174194336, "step": 907} {"info/global_step": 908, "train_info/time_within_train_step": 2.544687032699585, "step": 908} {"train_info/time_between_train_steps": 0.0031633377075195312, "step": 908} {"info/global_step": 909, "train_info/time_within_train_step": 2.355862855911255, "step": 909} {"train_info/time_between_train_steps": 0.0031545162200927734, "step": 909} {"info/global_step": 910, "train_info/time_within_train_step": 2.3567728996276855, "step": 910} {"train_info/time_between_train_steps": 0.003180980682373047, "step": 910} {"info/global_step": 911, "train_info/time_within_train_step": 2.3560738563537598, "step": 911} {"train_info/time_between_train_steps": 0.003219127655029297, "step": 911} {"info/global_step": 912, "train_info/time_within_train_step": 2.356494426727295, "step": 912} {"train_info/time_between_train_steps": 0.003159046173095703, "step": 912} {"info/global_step": 913, "train_info/time_within_train_step": 2.3569843769073486, "step": 913} {"train_info/time_between_train_steps": 0.0031752586364746094, "step": 913} {"info/global_step": 914, "train_info/time_within_train_step": 2.3562004566192627, "step": 914} {"train_info/time_between_train_steps": 0.003165721893310547, "step": 914} {"info/global_step": 915, "train_info/time_within_train_step": 2.35697340965271, "step": 915} {"train_info/time_between_train_steps": 0.0031359195709228516, "step": 915} {"info/global_step": 916, "train_info/time_within_train_step": 2.3567843437194824, "step": 916} {"train_info/time_between_train_steps": 0.0031986236572265625, "step": 916} {"info/global_step": 917, "train_info/time_within_train_step": 2.3575901985168457, "step": 917} {"train_info/time_between_train_steps": 0.003166675567626953, "step": 917} {"info/global_step": 918, "train_info/time_within_train_step": 2.355915069580078, "step": 918} {"train_info/time_between_train_steps": 0.00648951530456543, "step": 918} {"info/global_step": 919, "train_info/time_within_train_step": 2.356506109237671, "step": 919} {"train_info/time_between_train_steps": 0.006513118743896484, "step": 919} {"info/global_step": 920, "train_info/time_within_train_step": 2.3568427562713623, "step": 920} {"train_info/time_between_train_steps": 0.006412506103515625, "step": 920} {"info/global_step": 921, "train_info/time_within_train_step": 2.356724739074707, "step": 921} {"train_info/time_between_train_steps": 0.006402254104614258, "step": 921} {"info/global_step": 922, "train_info/time_within_train_step": 2.3559563159942627, "step": 922} {"train_info/time_between_train_steps": 0.006467342376708984, "step": 922} {"info/global_step": 923, "train_info/time_within_train_step": 2.479090690612793, "step": 923} {"train_info/time_between_train_steps": 0.0032269954681396484, "step": 923} {"info/global_step": 924, "train_info/time_within_train_step": 2.357285976409912, "step": 924} {"train_info/time_between_train_steps": 0.003173828125, "step": 924} {"info/global_step": 925, "train_info/time_within_train_step": 2.3567850589752197, "step": 925} {"train_info/time_between_train_steps": 0.0031557083129882812, "step": 925} {"info/global_step": 926, "train_info/time_within_train_step": 2.3569509983062744, "step": 926} {"train_info/time_between_train_steps": 0.003217935562133789, "step": 926} {"info/global_step": 927, "train_info/time_within_train_step": 2.356780529022217, "step": 927} {"train_info/time_between_train_steps": 0.0037071704864501953, "step": 927} {"info/global_step": 928, "train_info/time_within_train_step": 2.3560006618499756, "step": 928} {"train_info/time_between_train_steps": 0.0032079219818115234, "step": 928} {"info/global_step": 929, "train_info/time_within_train_step": 2.3567638397216797, "step": 929} {"train_info/time_between_train_steps": 0.0032088756561279297, "step": 929} {"info/global_step": 930, "train_info/time_within_train_step": 2.357656478881836, "step": 930} {"train_info/time_between_train_steps": 0.0031828880310058594, "step": 930} {"info/global_step": 931, "train_info/time_within_train_step": 2.356854200363159, "step": 931} {"train_info/time_between_train_steps": 0.0031647682189941406, "step": 931} {"info/global_step": 932, "train_info/time_within_train_step": 2.553896188735962, "step": 932} {"train_info/time_between_train_steps": 0.0031876564025878906, "step": 932} {"info/global_step": 933, "train_info/time_within_train_step": 2.356877088546753, "step": 933} {"train_info/time_between_train_steps": 0.003177642822265625, "step": 933} {"info/global_step": 934, "train_info/time_within_train_step": 2.3571715354919434, "step": 934} {"train_info/time_between_train_steps": 0.0032432079315185547, "step": 934} {"info/global_step": 935, "train_info/time_within_train_step": 2.3576416969299316, "step": 935} {"train_info/time_between_train_steps": 0.003186464309692383, "step": 935} {"info/global_step": 936, "train_info/time_within_train_step": 2.3567631244659424, "step": 936} {"train_info/time_between_train_steps": 0.0031795501708984375, "step": 936} {"info/global_step": 937, "train_info/time_within_train_step": 2.3563196659088135, "step": 937} {"train_info/time_between_train_steps": 0.003212451934814453, "step": 937} {"info/global_step": 938, "train_info/time_within_train_step": 2.3569936752319336, "step": 938} {"train_info/time_between_train_steps": 0.0033049583435058594, "step": 938} {"info/global_step": 939, "train_info/time_within_train_step": 2.356609582901001, "step": 939} {"train_info/time_between_train_steps": 0.003162384033203125, "step": 939} {"info/global_step": 940, "train_info/time_within_train_step": 2.356868267059326, "step": 940} {"train_info/time_between_train_steps": 0.0032198429107666016, "step": 940} {"info/global_step": 941, "train_info/time_within_train_step": 2.3561487197875977, "step": 941} {"train_info/time_between_train_steps": 0.0031914710998535156, "step": 941} {"info/global_step": 942, "train_info/time_within_train_step": 2.3567655086517334, "step": 942} {"train_info/time_between_train_steps": 0.0031948089599609375, "step": 942} {"info/global_step": 943, "train_info/time_within_train_step": 2.356553316116333, "step": 943} {"train_info/time_between_train_steps": 0.0031692981719970703, "step": 943} {"info/global_step": 944, "train_info/time_within_train_step": 2.356611490249634, "step": 944} {"train_info/time_between_train_steps": 0.003161907196044922, "step": 944} {"info/global_step": 945, "train_info/time_within_train_step": 2.357247829437256, "step": 945} {"train_info/time_between_train_steps": 0.003136873245239258, "step": 945} {"info/global_step": 946, "train_info/time_within_train_step": 2.356501817703247, "step": 946} {"train_info/time_between_train_steps": 0.003204822540283203, "step": 946} {"info/global_step": 947, "train_info/time_within_train_step": 2.356663942337036, "step": 947} {"train_info/time_between_train_steps": 0.0031914710998535156, "step": 947} {"info/global_step": 948, "train_info/time_within_train_step": 2.3565258979797363, "step": 948} {"train_info/time_between_train_steps": 0.0032913684844970703, "step": 948} {"info/global_step": 949, "train_info/time_within_train_step": 2.3562510013580322, "step": 949} {"train_info/time_between_train_steps": 0.00318145751953125, "step": 949} {"info/global_step": 950, "train_info/time_within_train_step": 2.355802297592163, "step": 950} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 4958.0, "train_info/memory_max_reserved": 4958.0, "_timestamp": 1746254655, "_runtime": 2474}, "step": 950} {"logs": {"train/loss": 4.3502, "train/learning_rate": 0.00045555555555555556, "train/epoch": 1.03, "_timestamp": 1746254655, "_runtime": 2474}, "step": 950} {"train_info/time_between_train_steps": 0.02841639518737793, "step": 950} {"info/global_step": 951, "train_info/time_within_train_step": 2.355912208557129, "step": 951} {"train_info/time_between_train_steps": 0.0032303333282470703, "step": 951} {"info/global_step": 952, "train_info/time_within_train_step": 2.3568103313446045, "step": 952} {"train_info/time_between_train_steps": 0.006558418273925781, "step": 952} {"info/global_step": 953, "train_info/time_within_train_step": 2.355600118637085, "step": 953} {"train_info/time_between_train_steps": 0.006587028503417969, "step": 953} {"info/global_step": 954, "train_info/time_within_train_step": 2.356191396713257, "step": 954} {"train_info/time_between_train_steps": 0.006500959396362305, "step": 954} {"info/global_step": 955, "train_info/time_within_train_step": 2.3563592433929443, "step": 955} {"train_info/time_between_train_steps": 0.0065364837646484375, "step": 955} {"info/global_step": 956, "train_info/time_within_train_step": 2.5559206008911133, "step": 956} {"train_info/time_between_train_steps": 0.00652313232421875, "step": 956} {"info/global_step": 957, "train_info/time_within_train_step": 2.3551406860351562, "step": 957} {"train_info/time_between_train_steps": 0.006530046463012695, "step": 957} {"info/global_step": 958, "train_info/time_within_train_step": 2.355541229248047, "step": 958} {"train_info/time_between_train_steps": 0.006494998931884766, "step": 958} {"info/global_step": 959, "train_info/time_within_train_step": 2.3546111583709717, "step": 959} {"train_info/time_between_train_steps": 0.006533622741699219, "step": 959} {"info/global_step": 960, "train_info/time_within_train_step": 2.354715585708618, "step": 960} {"train_info/time_between_train_steps": 0.006546735763549805, "step": 960} {"info/global_step": 961, "train_info/time_within_train_step": 2.3551509380340576, "step": 961} {"train_info/time_between_train_steps": 0.006531715393066406, "step": 961} {"info/global_step": 962, "train_info/time_within_train_step": 2.355811357498169, "step": 962} {"train_info/time_between_train_steps": 0.0065271854400634766, "step": 962} {"info/global_step": 963, "train_info/time_within_train_step": 2.3560471534729004, "step": 963} {"train_info/time_between_train_steps": 0.00648045539855957, "step": 963} {"info/global_step": 964, "train_info/time_within_train_step": 2.3572988510131836, "step": 964} {"train_info/time_between_train_steps": 0.005152225494384766, "step": 964} {"info/global_step": 965, "train_info/time_within_train_step": 2.3573293685913086, "step": 965} {"train_info/time_between_train_steps": 0.006514310836791992, "step": 965} {"info/global_step": 966, "train_info/time_within_train_step": 2.3557846546173096, "step": 966} {"train_info/time_between_train_steps": 0.006587028503417969, "step": 966} {"info/global_step": 967, "train_info/time_within_train_step": 2.3549132347106934, "step": 967} {"train_info/time_between_train_steps": 0.00648951530456543, "step": 967} {"info/global_step": 968, "train_info/time_within_train_step": 2.3559248447418213, "step": 968} {"train_info/time_between_train_steps": 0.0031909942626953125, "step": 968} {"info/global_step": 969, "train_info/time_within_train_step": 2.3551878929138184, "step": 969} {"train_info/time_between_train_steps": 0.0031566619873046875, "step": 969} {"info/global_step": 970, "train_info/time_within_train_step": 2.379556894302368, "step": 970} {"train_info/time_between_train_steps": 0.0032172203063964844, "step": 970} {"info/global_step": 971, "train_info/time_within_train_step": 2.3551480770111084, "step": 971} {"train_info/time_between_train_steps": 0.0031714439392089844, "step": 971} {"info/global_step": 972, "train_info/time_within_train_step": 2.3567442893981934, "step": 972} {"train_info/time_between_train_steps": 0.003168821334838867, "step": 972} {"info/global_step": 973, "train_info/time_within_train_step": 2.355743408203125, "step": 973} {"train_info/time_between_train_steps": 0.003154754638671875, "step": 973} {"info/global_step": 974, "train_info/time_within_train_step": 2.3555898666381836, "step": 974} {"train_info/time_between_train_steps": 0.0031495094299316406, "step": 974} {"info/global_step": 975, "train_info/time_within_train_step": 2.355790376663208, "step": 975} {"train_info/time_between_train_steps": 0.003226757049560547, "step": 975} {"info/global_step": 976, "train_info/time_within_train_step": 2.39369797706604, "step": 976} {"train_info/time_between_train_steps": 0.003158092498779297, "step": 976} {"info/global_step": 977, "train_info/time_within_train_step": 2.3553545475006104, "step": 977} {"train_info/time_between_train_steps": 0.0031549930572509766, "step": 977} {"info/global_step": 978, "train_info/time_within_train_step": 2.3543994426727295, "step": 978} {"train_info/time_between_train_steps": 0.006531715393066406, "step": 978} {"info/global_step": 979, "train_info/time_within_train_step": 2.3560166358947754, "step": 979} {"train_info/time_between_train_steps": 0.006581544876098633, "step": 979} {"info/global_step": 980, "train_info/time_within_train_step": 2.5590007305145264, "step": 980} {"train_info/time_between_train_steps": 0.003268718719482422, "step": 980} {"info/global_step": 981, "train_info/time_within_train_step": 2.3565807342529297, "step": 981} {"train_info/time_between_train_steps": 0.003148317337036133, "step": 981} {"info/global_step": 982, "train_info/time_within_train_step": 2.3557546138763428, "step": 982} {"train_info/time_between_train_steps": 0.0031280517578125, "step": 982} {"info/global_step": 983, "train_info/time_within_train_step": 2.3553221225738525, "step": 983} {"train_info/time_between_train_steps": 0.0031855106353759766, "step": 983} {"info/global_step": 984, "train_info/time_within_train_step": 2.3545687198638916, "step": 984} {"train_info/time_between_train_steps": 0.0031833648681640625, "step": 984} {"info/global_step": 985, "train_info/time_within_train_step": 2.355245590209961, "step": 985} {"train_info/time_between_train_steps": 0.12096643447875977, "step": 985} {"info/global_step": 986, "train_info/time_within_train_step": 2.355956554412842, "step": 986} {"train_info/time_between_train_steps": 0.003155946731567383, "step": 986} {"info/global_step": 987, "train_info/time_within_train_step": 2.3879573345184326, "step": 987} {"train_info/time_between_train_steps": 0.0031659603118896484, "step": 987} {"info/global_step": 988, "train_info/time_within_train_step": 2.356539011001587, "step": 988} {"train_info/time_between_train_steps": 0.0031578540802001953, "step": 988} {"info/global_step": 989, "train_info/time_within_train_step": 2.3563129901885986, "step": 989} {"train_info/time_between_train_steps": 0.0034177303314208984, "step": 989} {"info/global_step": 990, "train_info/time_within_train_step": 2.3562209606170654, "step": 990} {"train_info/time_between_train_steps": 0.003204345703125, "step": 990} {"info/global_step": 991, "train_info/time_within_train_step": 2.3565311431884766, "step": 991} {"train_info/time_between_train_steps": 0.0031843185424804688, "step": 991} {"info/global_step": 992, "train_info/time_within_train_step": 2.35532808303833, "step": 992} {"train_info/time_between_train_steps": 0.003200531005859375, "step": 992} {"info/global_step": 993, "train_info/time_within_train_step": 2.356018543243408, "step": 993} {"train_info/time_between_train_steps": 0.0031697750091552734, "step": 993} {"info/global_step": 994, "train_info/time_within_train_step": 2.3554179668426514, "step": 994} {"train_info/time_between_train_steps": 0.003148317337036133, "step": 994} {"info/global_step": 995, "train_info/time_within_train_step": 2.354851007461548, "step": 995} {"train_info/time_between_train_steps": 0.0031485557556152344, "step": 995} {"info/global_step": 996, "train_info/time_within_train_step": 2.355250835418701, "step": 996} {"train_info/time_between_train_steps": 0.003208637237548828, "step": 996} {"info/global_step": 997, "train_info/time_within_train_step": 2.364793539047241, "step": 997} {"train_info/time_between_train_steps": 0.0031974315643310547, "step": 997} {"info/global_step": 998, "train_info/time_within_train_step": 2.355097532272339, "step": 998} {"train_info/time_between_train_steps": 0.003162860870361328, "step": 998} {"info/global_step": 999, "train_info/time_within_train_step": 2.355659246444702, "step": 999} {"train_info/time_between_train_steps": 0.003155231475830078, "step": 999} {"info/global_step": 1000, "train_info/time_within_train_step": 2.898303270339966, "step": 1000} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 4958.0, "train_info/memory_max_reserved": 4958.0, "_timestamp": 1746254775, "_runtime": 2594}, "step": 1000} {"logs": {"train/loss": 4.3199, "train/learning_rate": 0.00044444444444444436, "train/epoch": 1.05, "_timestamp": 1746254775, "_runtime": 2594}, "step": 1000} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 8708.0, "train_info/memory_max_reserved": 8708.0, "_timestamp": 1746254780, "_runtime": 2599}, "step": 1000} {"logs": {"eval/loss": 4.684910774230957, "eval/runtime": 4.2134, "eval/samples_per_second": 47.468, "eval/steps_per_second": 1.187, "train/epoch": 1.05, "_timestamp": 1746254780, "_runtime": 2599}, "step": 1000} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 8708.0, "train_info/memory_max_reserved": 8708.0, "_timestamp": 1746254780, "_runtime": 2599}, "step": 1000} {"logs": {"eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_loss": 4.684910774230957, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_ppl": 108.30060867197095, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_runtime": 4.2134, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_samples_per_second": 47.468, "train/epoch": 1.05, "_timestamp": 1746254780, "_runtime": 2599}, "step": 1000} {"train_info/time_between_train_steps": 20.305423974990845, "step": 1000} {"info/global_step": 1001, "train_info/time_within_train_step": 2.193203926086426, "step": 1001} {"train_info/time_between_train_steps": 0.003194570541381836, "step": 1001} {"info/global_step": 1002, "train_info/time_within_train_step": 2.1833503246307373, "step": 1002} {"train_info/time_between_train_steps": 0.0032296180725097656, "step": 1002} {"info/global_step": 1003, "train_info/time_within_train_step": 2.4631073474884033, "step": 1003} {"train_info/time_between_train_steps": 0.003245115280151367, "step": 1003} {"info/global_step": 1004, "train_info/time_within_train_step": 2.3510560989379883, "step": 1004} {"train_info/time_between_train_steps": 0.0032067298889160156, "step": 1004} {"info/global_step": 1005, "train_info/time_within_train_step": 2.354206085205078, "step": 1005} {"train_info/time_between_train_steps": 0.003172636032104492, "step": 1005} {"info/global_step": 1006, "train_info/time_within_train_step": 2.356034517288208, "step": 1006} {"train_info/time_between_train_steps": 0.0031616687774658203, "step": 1006} {"info/global_step": 1007, "train_info/time_within_train_step": 2.356602191925049, "step": 1007} {"train_info/time_between_train_steps": 0.0032320022583007812, "step": 1007} {"info/global_step": 1008, "train_info/time_within_train_step": 2.3572092056274414, "step": 1008} {"train_info/time_between_train_steps": 0.003169536590576172, "step": 1008} {"info/global_step": 1009, "train_info/time_within_train_step": 2.358510732650757, "step": 1009} {"train_info/time_between_train_steps": 0.0031859874725341797, "step": 1009} {"info/global_step": 1010, "train_info/time_within_train_step": 2.3572757244110107, "step": 1010} {"train_info/time_between_train_steps": 0.0032303333282470703, "step": 1010} {"info/global_step": 1011, "train_info/time_within_train_step": 2.357902765274048, "step": 1011} {"train_info/time_between_train_steps": 0.0032258033752441406, "step": 1011} {"info/global_step": 1012, "train_info/time_within_train_step": 2.3590807914733887, "step": 1012} {"train_info/time_between_train_steps": 0.003185749053955078, "step": 1012} {"info/global_step": 1013, "train_info/time_within_train_step": 2.3594260215759277, "step": 1013} {"train_info/time_between_train_steps": 0.0031845569610595703, "step": 1013} {"info/global_step": 1014, "train_info/time_within_train_step": 2.358356237411499, "step": 1014} {"train_info/time_between_train_steps": 0.0031671524047851562, "step": 1014} {"info/global_step": 1015, "train_info/time_within_train_step": 2.358011484146118, "step": 1015} {"train_info/time_between_train_steps": 0.003205537796020508, "step": 1015} {"info/global_step": 1016, "train_info/time_within_train_step": 2.358607053756714, "step": 1016} {"train_info/time_between_train_steps": 0.0037746429443359375, "step": 1016} {"info/global_step": 1017, "train_info/time_within_train_step": 2.3591036796569824, "step": 1017} {"train_info/time_between_train_steps": 0.003179311752319336, "step": 1017} {"info/global_step": 1018, "train_info/time_within_train_step": 2.358334541320801, "step": 1018} {"train_info/time_between_train_steps": 0.003232240676879883, "step": 1018} {"info/global_step": 1019, "train_info/time_within_train_step": 2.357511281967163, "step": 1019} {"train_info/time_between_train_steps": 0.0032029151916503906, "step": 1019} {"info/global_step": 1020, "train_info/time_within_train_step": 2.357595682144165, "step": 1020} {"train_info/time_between_train_steps": 0.0031671524047851562, "step": 1020} {"info/global_step": 1021, "train_info/time_within_train_step": 2.3579394817352295, "step": 1021} {"train_info/time_between_train_steps": 0.0032596588134765625, "step": 1021} {"info/global_step": 1022, "train_info/time_within_train_step": 2.3583977222442627, "step": 1022} {"train_info/time_between_train_steps": 0.0032358169555664062, "step": 1022} {"info/global_step": 1023, "train_info/time_within_train_step": 2.3581550121307373, "step": 1023} {"train_info/time_between_train_steps": 0.0035288333892822266, "step": 1023} {"info/global_step": 1024, "train_info/time_within_train_step": 2.359494209289551, "step": 1024} {"train_info/time_between_train_steps": 0.003433704376220703, "step": 1024} {"info/global_step": 1025, "train_info/time_within_train_step": 2.360076427459717, "step": 1025} {"train_info/time_between_train_steps": 0.0034394264221191406, "step": 1025} {"info/global_step": 1026, "train_info/time_within_train_step": 2.3586015701293945, "step": 1026} {"train_info/time_between_train_steps": 0.0034074783325195312, "step": 1026} {"info/global_step": 1027, "train_info/time_within_train_step": 2.6694893836975098, "step": 1027} {"train_info/time_between_train_steps": 0.003287792205810547, "step": 1027} {"info/global_step": 1028, "train_info/time_within_train_step": 2.357044219970703, "step": 1028} {"train_info/time_between_train_steps": 0.003237485885620117, "step": 1028} {"info/global_step": 1029, "train_info/time_within_train_step": 2.3587419986724854, "step": 1029} {"train_info/time_between_train_steps": 0.0031862258911132812, "step": 1029} {"info/global_step": 1030, "train_info/time_within_train_step": 2.3583691120147705, "step": 1030} {"train_info/time_between_train_steps": 0.0032351016998291016, "step": 1030} {"info/global_step": 1031, "train_info/time_within_train_step": 2.3584463596343994, "step": 1031} {"train_info/time_between_train_steps": 0.0032041072845458984, "step": 1031} {"info/global_step": 1032, "train_info/time_within_train_step": 2.356891393661499, "step": 1032} {"train_info/time_between_train_steps": 0.0032129287719726562, "step": 1032} {"info/global_step": 1033, "train_info/time_within_train_step": 2.357654094696045, "step": 1033} {"train_info/time_between_train_steps": 0.003221750259399414, "step": 1033} {"info/global_step": 1034, "train_info/time_within_train_step": 2.3574752807617188, "step": 1034} {"train_info/time_between_train_steps": 0.003213167190551758, "step": 1034} {"info/global_step": 1035, "train_info/time_within_train_step": 2.357966184616089, "step": 1035} {"train_info/time_between_train_steps": 0.003206968307495117, "step": 1035} {"info/global_step": 1036, "train_info/time_within_train_step": 2.3576500415802, "step": 1036} {"train_info/time_between_train_steps": 0.0032176971435546875, "step": 1036} {"info/global_step": 1037, "train_info/time_within_train_step": 2.3808999061584473, "step": 1037} {"train_info/time_between_train_steps": 0.0031893253326416016, "step": 1037} {"info/global_step": 1038, "train_info/time_within_train_step": 2.3570919036865234, "step": 1038} {"train_info/time_between_train_steps": 0.0031957626342773438, "step": 1038} {"info/global_step": 1039, "train_info/time_within_train_step": 2.3575258255004883, "step": 1039} {"train_info/time_between_train_steps": 0.003265380859375, "step": 1039} {"info/global_step": 1040, "train_info/time_within_train_step": 2.35703182220459, "step": 1040} {"train_info/time_between_train_steps": 0.003215312957763672, "step": 1040} {"info/global_step": 1041, "train_info/time_within_train_step": 2.3574471473693848, "step": 1041} {"train_info/time_between_train_steps": 0.0032198429107666016, "step": 1041} {"info/global_step": 1042, "train_info/time_within_train_step": 2.358330726623535, "step": 1042} {"train_info/time_between_train_steps": 0.003209352493286133, "step": 1042} {"info/global_step": 1043, "train_info/time_within_train_step": 2.393939256668091, "step": 1043} {"train_info/time_between_train_steps": 0.003228902816772461, "step": 1043} {"info/global_step": 1044, "train_info/time_within_train_step": 2.3568131923675537, "step": 1044} {"train_info/time_between_train_steps": 0.0031981468200683594, "step": 1044} {"info/global_step": 1045, "train_info/time_within_train_step": 2.356255531311035, "step": 1045} {"train_info/time_between_train_steps": 0.0032444000244140625, "step": 1045} {"info/global_step": 1046, "train_info/time_within_train_step": 2.356637716293335, "step": 1046} {"train_info/time_between_train_steps": 0.0032300949096679688, "step": 1046} {"info/global_step": 1047, "train_info/time_within_train_step": 2.3572115898132324, "step": 1047} {"train_info/time_between_train_steps": 0.0032088756561279297, "step": 1047} {"info/global_step": 1048, "train_info/time_within_train_step": 2.490431785583496, "step": 1048} {"train_info/time_between_train_steps": 0.0031821727752685547, "step": 1048} {"info/global_step": 1049, "train_info/time_within_train_step": 2.3567728996276855, "step": 1049} {"train_info/time_between_train_steps": 0.003171205520629883, "step": 1049} {"info/global_step": 1050, "train_info/time_within_train_step": 2.35721755027771, "step": 1050} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 8708.0, "train_info/memory_max_reserved": 8708.0, "_timestamp": 1746254915, "_runtime": 2734}, "step": 1050} {"logs": {"train/loss": 4.2891, "train/learning_rate": 0.0004333333333333333, "train/epoch": 1.06, "_timestamp": 1746254915, "_runtime": 2734}, "step": 1050} {"train_info/time_between_train_steps": 0.02478170394897461, "step": 1050} {"info/global_step": 1051, "train_info/time_within_train_step": 2.5736842155456543, "step": 1051} {"train_info/time_between_train_steps": 0.0032281875610351562, "step": 1051} {"info/global_step": 1052, "train_info/time_within_train_step": 2.3574914932250977, "step": 1052} {"train_info/time_between_train_steps": 0.0032410621643066406, "step": 1052} {"info/global_step": 1053, "train_info/time_within_train_step": 2.357147216796875, "step": 1053} {"train_info/time_between_train_steps": 0.003247976303100586, "step": 1053} {"info/global_step": 1054, "train_info/time_within_train_step": 2.3912527561187744, "step": 1054} {"train_info/time_between_train_steps": 0.0031957626342773438, "step": 1054} {"info/global_step": 1055, "train_info/time_within_train_step": 2.3575024604797363, "step": 1055} {"train_info/time_between_train_steps": 0.003170490264892578, "step": 1055} {"info/global_step": 1056, "train_info/time_within_train_step": 2.357579231262207, "step": 1056} {"train_info/time_between_train_steps": 0.003168821334838867, "step": 1056} {"info/global_step": 1057, "train_info/time_within_train_step": 2.357332229614258, "step": 1057} {"train_info/time_between_train_steps": 0.0032150745391845703, "step": 1057} {"info/global_step": 1058, "train_info/time_within_train_step": 2.3567984104156494, "step": 1058} {"train_info/time_between_train_steps": 0.003256559371948242, "step": 1058} {"info/global_step": 1059, "train_info/time_within_train_step": 2.3570921421051025, "step": 1059} {"train_info/time_between_train_steps": 0.003184080123901367, "step": 1059} {"info/global_step": 1060, "train_info/time_within_train_step": 2.3566715717315674, "step": 1060} {"train_info/time_between_train_steps": 0.0032303333282470703, "step": 1060} {"info/global_step": 1061, "train_info/time_within_train_step": 2.357288122177124, "step": 1061} {"train_info/time_between_train_steps": 0.003168821334838867, "step": 1061} {"info/global_step": 1062, "train_info/time_within_train_step": 2.3802907466888428, "step": 1062} {"train_info/time_between_train_steps": 0.0031664371490478516, "step": 1062} {"info/global_step": 1063, "train_info/time_within_train_step": 2.357393264770508, "step": 1063} {"train_info/time_between_train_steps": 0.0032100677490234375, "step": 1063} {"info/global_step": 1064, "train_info/time_within_train_step": 2.356832265853882, "step": 1064} {"train_info/time_between_train_steps": 0.003184795379638672, "step": 1064} {"info/global_step": 1065, "train_info/time_within_train_step": 2.357773780822754, "step": 1065} {"train_info/time_between_train_steps": 0.003185749053955078, "step": 1065} {"info/global_step": 1066, "train_info/time_within_train_step": 2.356748342514038, "step": 1066} {"train_info/time_between_train_steps": 0.0031690597534179688, "step": 1066} {"info/global_step": 1067, "train_info/time_within_train_step": 2.357306957244873, "step": 1067} {"train_info/time_between_train_steps": 0.0032205581665039062, "step": 1067} {"info/global_step": 1068, "train_info/time_within_train_step": 2.3950345516204834, "step": 1068} {"train_info/time_between_train_steps": 0.0031697750091552734, "step": 1068} {"info/global_step": 1069, "train_info/time_within_train_step": 2.356645345687866, "step": 1069} {"train_info/time_between_train_steps": 0.0034308433532714844, "step": 1069} {"info/global_step": 1070, "train_info/time_within_train_step": 2.357945680618286, "step": 1070} {"train_info/time_between_train_steps": 0.0032415390014648438, "step": 1070} {"info/global_step": 1071, "train_info/time_within_train_step": 2.3572559356689453, "step": 1071} {"train_info/time_between_train_steps": 0.003193378448486328, "step": 1071} {"info/global_step": 1072, "train_info/time_within_train_step": 2.357382297515869, "step": 1072} {"train_info/time_between_train_steps": 0.0031838417053222656, "step": 1072} {"info/global_step": 1073, "train_info/time_within_train_step": 2.3579938411712646, "step": 1073} {"train_info/time_between_train_steps": 0.0031731128692626953, "step": 1073} {"info/global_step": 1074, "train_info/time_within_train_step": 2.3566298484802246, "step": 1074} {"train_info/time_between_train_steps": 0.003183603286743164, "step": 1074} {"info/global_step": 1075, "train_info/time_within_train_step": 2.571502685546875, "step": 1075} {"train_info/time_between_train_steps": 0.0032117366790771484, "step": 1075} {"info/global_step": 1076, "train_info/time_within_train_step": 2.3579275608062744, "step": 1076} {"train_info/time_between_train_steps": 0.003192901611328125, "step": 1076} {"info/global_step": 1077, "train_info/time_within_train_step": 2.3573460578918457, "step": 1077} {"train_info/time_between_train_steps": 0.003165006637573242, "step": 1077} {"info/global_step": 1078, "train_info/time_within_train_step": 2.356884241104126, "step": 1078} {"train_info/time_between_train_steps": 0.003175973892211914, "step": 1078} {"info/global_step": 1079, "train_info/time_within_train_step": 2.3568520545959473, "step": 1079} {"train_info/time_between_train_steps": 0.003221750259399414, "step": 1079} {"info/global_step": 1080, "train_info/time_within_train_step": 2.3570141792297363, "step": 1080} {"train_info/time_between_train_steps": 0.003167390823364258, "step": 1080} {"info/global_step": 1081, "train_info/time_within_train_step": 2.3579142093658447, "step": 1081} {"train_info/time_between_train_steps": 0.0031995773315429688, "step": 1081} {"info/global_step": 1082, "train_info/time_within_train_step": 2.3567142486572266, "step": 1082} {"train_info/time_between_train_steps": 0.003211498260498047, "step": 1082} {"info/global_step": 1083, "train_info/time_within_train_step": 2.3567955493927, "step": 1083} {"train_info/time_between_train_steps": 0.00321197509765625, "step": 1083} {"info/global_step": 1084, "train_info/time_within_train_step": 2.3580198287963867, "step": 1084} {"train_info/time_between_train_steps": 0.003180980682373047, "step": 1084} {"info/global_step": 1085, "train_info/time_within_train_step": 2.357299566268921, "step": 1085} {"train_info/time_between_train_steps": 0.0032444000244140625, "step": 1085} {"info/global_step": 1086, "train_info/time_within_train_step": 2.3574981689453125, "step": 1086} {"train_info/time_between_train_steps": 0.003162860870361328, "step": 1086} {"info/global_step": 1087, "train_info/time_within_train_step": 2.357100009918213, "step": 1087} {"train_info/time_between_train_steps": 0.0031762123107910156, "step": 1087} {"info/global_step": 1088, "train_info/time_within_train_step": 2.357750654220581, "step": 1088} {"train_info/time_between_train_steps": 0.0031976699829101562, "step": 1088} {"info/global_step": 1089, "train_info/time_within_train_step": 2.367081880569458, "step": 1089} {"train_info/time_between_train_steps": 0.0034525394439697266, "step": 1089} {"info/global_step": 1090, "train_info/time_within_train_step": 2.3575475215911865, "step": 1090} {"train_info/time_between_train_steps": 0.0031766891479492188, "step": 1090} {"info/global_step": 1091, "train_info/time_within_train_step": 2.3556129932403564, "step": 1091} {"train_info/time_between_train_steps": 0.0032498836517333984, "step": 1091} {"info/global_step": 1092, "train_info/time_within_train_step": 2.356548309326172, "step": 1092} {"train_info/time_between_train_steps": 0.0031549930572509766, "step": 1092} {"info/global_step": 1093, "train_info/time_within_train_step": 2.3572041988372803, "step": 1093} {"train_info/time_between_train_steps": 0.0031549930572509766, "step": 1093} {"info/global_step": 1094, "train_info/time_within_train_step": 2.356795310974121, "step": 1094} {"train_info/time_between_train_steps": 0.0032379627227783203, "step": 1094} {"info/global_step": 1095, "train_info/time_within_train_step": 2.3579413890838623, "step": 1095} {"train_info/time_between_train_steps": 0.0032291412353515625, "step": 1095} {"info/global_step": 1096, "train_info/time_within_train_step": 2.3571832180023193, "step": 1096} {"train_info/time_between_train_steps": 0.0031821727752685547, "step": 1096} {"info/global_step": 1097, "train_info/time_within_train_step": 2.357365608215332, "step": 1097} {"train_info/time_between_train_steps": 0.0031723976135253906, "step": 1097} {"info/global_step": 1098, "train_info/time_within_train_step": 2.355787515640259, "step": 1098} {"train_info/time_between_train_steps": 0.003153085708618164, "step": 1098} {"info/global_step": 1099, "train_info/time_within_train_step": 2.5739002227783203, "step": 1099} {"train_info/time_between_train_steps": 0.003152608871459961, "step": 1099} {"info/global_step": 1100, "train_info/time_within_train_step": 2.357027530670166, "step": 1100} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 8708.0, "train_info/memory_max_reserved": 8708.0, "_timestamp": 1746255035, "_runtime": 2854}, "step": 1100} {"logs": {"train/loss": 4.2595, "train/learning_rate": 0.0004222222222222222, "train/epoch": 1.08, "_timestamp": 1746255035, "_runtime": 2854}, "step": 1100} {"train_info/time_between_train_steps": 14.435771226882935, "step": 1100} {"info/global_step": 1101, "train_info/time_within_train_step": 2.2027974128723145, "step": 1101} {"train_info/time_between_train_steps": 0.003206014633178711, "step": 1101} {"info/global_step": 1102, "train_info/time_within_train_step": 2.1837551593780518, "step": 1102} {"train_info/time_between_train_steps": 0.003725290298461914, "step": 1102} {"info/global_step": 1103, "train_info/time_within_train_step": 2.264840602874756, "step": 1103} {"train_info/time_between_train_steps": 0.003165721893310547, "step": 1103} {"info/global_step": 1104, "train_info/time_within_train_step": 2.348726272583008, "step": 1104} {"train_info/time_between_train_steps": 0.0031859874725341797, "step": 1104} {"info/global_step": 1105, "train_info/time_within_train_step": 2.3536574840545654, "step": 1105} {"train_info/time_between_train_steps": 0.0032126903533935547, "step": 1105} {"info/global_step": 1106, "train_info/time_within_train_step": 2.3552355766296387, "step": 1106} {"train_info/time_between_train_steps": 0.0031638145446777344, "step": 1106} {"info/global_step": 1107, "train_info/time_within_train_step": 2.355372905731201, "step": 1107} {"train_info/time_between_train_steps": 0.0031976699829101562, "step": 1107} {"info/global_step": 1108, "train_info/time_within_train_step": 2.355717420578003, "step": 1108} {"train_info/time_between_train_steps": 0.003217458724975586, "step": 1108} {"info/global_step": 1109, "train_info/time_within_train_step": 2.3554017543792725, "step": 1109} {"train_info/time_between_train_steps": 0.0032405853271484375, "step": 1109} {"info/global_step": 1110, "train_info/time_within_train_step": 2.3557286262512207, "step": 1110} {"train_info/time_between_train_steps": 0.12474942207336426, "step": 1110} {"info/global_step": 1111, "train_info/time_within_train_step": 2.35683274269104, "step": 1111} {"train_info/time_between_train_steps": 0.0031821727752685547, "step": 1111} {"info/global_step": 1112, "train_info/time_within_train_step": 2.3555309772491455, "step": 1112} {"train_info/time_between_train_steps": 0.0031859874725341797, "step": 1112} {"info/global_step": 1113, "train_info/time_within_train_step": 2.3570752143859863, "step": 1113} {"train_info/time_between_train_steps": 0.0031905174255371094, "step": 1113} {"info/global_step": 1114, "train_info/time_within_train_step": 2.356893539428711, "step": 1114} {"train_info/time_between_train_steps": 0.0032079219818115234, "step": 1114} {"info/global_step": 1115, "train_info/time_within_train_step": 2.3563671112060547, "step": 1115} {"train_info/time_between_train_steps": 0.003273487091064453, "step": 1115} {"info/global_step": 1116, "train_info/time_within_train_step": 2.3564693927764893, "step": 1116} {"train_info/time_between_train_steps": 0.0032346248626708984, "step": 1116} {"info/global_step": 1117, "train_info/time_within_train_step": 2.3572142124176025, "step": 1117} {"train_info/time_between_train_steps": 0.0031778812408447266, "step": 1117} {"info/global_step": 1118, "train_info/time_within_train_step": 2.3582608699798584, "step": 1118} {"train_info/time_between_train_steps": 0.0031816959381103516, "step": 1118} {"info/global_step": 1119, "train_info/time_within_train_step": 2.3571598529815674, "step": 1119} {"train_info/time_between_train_steps": 0.0031783580780029297, "step": 1119} {"info/global_step": 1120, "train_info/time_within_train_step": 2.357327461242676, "step": 1120} {"train_info/time_between_train_steps": 0.003211498260498047, "step": 1120} {"info/global_step": 1121, "train_info/time_within_train_step": 2.3580822944641113, "step": 1121} {"train_info/time_between_train_steps": 0.003216266632080078, "step": 1121} {"info/global_step": 1122, "train_info/time_within_train_step": 2.547776460647583, "step": 1122} {"train_info/time_between_train_steps": 0.003236532211303711, "step": 1122} {"info/global_step": 1123, "train_info/time_within_train_step": 2.355741500854492, "step": 1123} {"train_info/time_between_train_steps": 0.003219127655029297, "step": 1123} {"info/global_step": 1124, "train_info/time_within_train_step": 2.3580615520477295, "step": 1124} {"train_info/time_between_train_steps": 0.004177570343017578, "step": 1124} {"info/global_step": 1125, "train_info/time_within_train_step": 2.357710599899292, "step": 1125} {"train_info/time_between_train_steps": 0.003460407257080078, "step": 1125} {"info/global_step": 1126, "train_info/time_within_train_step": 2.357748031616211, "step": 1126} {"train_info/time_between_train_steps": 0.0034914016723632812, "step": 1126} {"info/global_step": 1127, "train_info/time_within_train_step": 2.357952833175659, "step": 1127} {"train_info/time_between_train_steps": 0.0034911632537841797, "step": 1127} {"info/global_step": 1128, "train_info/time_within_train_step": 2.3579931259155273, "step": 1128} {"train_info/time_between_train_steps": 0.00347137451171875, "step": 1128} {"info/global_step": 1129, "train_info/time_within_train_step": 2.3576724529266357, "step": 1129} {"train_info/time_between_train_steps": 0.003483295440673828, "step": 1129} {"info/global_step": 1130, "train_info/time_within_train_step": 2.356473445892334, "step": 1130} {"train_info/time_between_train_steps": 0.003427743911743164, "step": 1130} {"info/global_step": 1131, "train_info/time_within_train_step": 2.357388496398926, "step": 1131} {"train_info/time_between_train_steps": 0.0034449100494384766, "step": 1131} {"info/global_step": 1132, "train_info/time_within_train_step": 2.356349468231201, "step": 1132} {"train_info/time_between_train_steps": 0.003483295440673828, "step": 1132} {"info/global_step": 1133, "train_info/time_within_train_step": 2.3575541973114014, "step": 1133} {"train_info/time_between_train_steps": 0.003473520278930664, "step": 1133} {"info/global_step": 1134, "train_info/time_within_train_step": 2.356217861175537, "step": 1134} {"train_info/time_between_train_steps": 0.003470182418823242, "step": 1134} {"info/global_step": 1135, "train_info/time_within_train_step": 2.3577160835266113, "step": 1135} {"train_info/time_between_train_steps": 0.0034155845642089844, "step": 1135} {"info/global_step": 1136, "train_info/time_within_train_step": 2.3568124771118164, "step": 1136} {"train_info/time_between_train_steps": 0.0034821033477783203, "step": 1136} {"info/global_step": 1137, "train_info/time_within_train_step": 2.3570101261138916, "step": 1137} {"train_info/time_between_train_steps": 0.003489255905151367, "step": 1137} {"info/global_step": 1138, "train_info/time_within_train_step": 2.3577070236206055, "step": 1138} {"train_info/time_between_train_steps": 0.0034399032592773438, "step": 1138} {"info/global_step": 1139, "train_info/time_within_train_step": 2.357867956161499, "step": 1139} {"train_info/time_between_train_steps": 0.003493785858154297, "step": 1139} {"info/global_step": 1140, "train_info/time_within_train_step": 2.3577985763549805, "step": 1140} {"train_info/time_between_train_steps": 0.0034568309783935547, "step": 1140} {"info/global_step": 1141, "train_info/time_within_train_step": 2.358753204345703, "step": 1141} {"train_info/time_between_train_steps": 0.0034906864166259766, "step": 1141} {"info/global_step": 1142, "train_info/time_within_train_step": 2.3575990200042725, "step": 1142} {"train_info/time_between_train_steps": 0.0035066604614257812, "step": 1142} {"info/global_step": 1143, "train_info/time_within_train_step": 2.35603404045105, "step": 1143} {"train_info/time_between_train_steps": 0.0035028457641601562, "step": 1143} {"info/global_step": 1144, "train_info/time_within_train_step": 2.3564934730529785, "step": 1144} {"train_info/time_between_train_steps": 0.0034012794494628906, "step": 1144} {"info/global_step": 1145, "train_info/time_within_train_step": 2.3570244312286377, "step": 1145} {"train_info/time_between_train_steps": 0.0034334659576416016, "step": 1145} {"info/global_step": 1146, "train_info/time_within_train_step": 2.652796983718872, "step": 1146} {"train_info/time_between_train_steps": 0.003297567367553711, "step": 1146} {"info/global_step": 1147, "train_info/time_within_train_step": 2.35620379447937, "step": 1147} {"train_info/time_between_train_steps": 0.0032100677490234375, "step": 1147} {"info/global_step": 1148, "train_info/time_within_train_step": 2.357069730758667, "step": 1148} {"train_info/time_between_train_steps": 0.003214597702026367, "step": 1148} {"info/global_step": 1149, "train_info/time_within_train_step": 2.356201171875, "step": 1149} {"train_info/time_between_train_steps": 0.003228902816772461, "step": 1149} {"info/global_step": 1150, "train_info/time_within_train_step": 2.356069326400757, "step": 1150} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 8708.0, "train_info/memory_max_reserved": 8708.0, "_timestamp": 1746255169, "_runtime": 2988}, "step": 1150} {"logs": {"train/loss": 4.236, "train/learning_rate": 0.0004111111111111111, "train/epoch": 1.1, "_timestamp": 1746255169, "_runtime": 2988}, "step": 1150} {"train_info/time_between_train_steps": 0.024983644485473633, "step": 1150} {"info/global_step": 1151, "train_info/time_within_train_step": 2.3564460277557373, "step": 1151} {"train_info/time_between_train_steps": 0.0032737255096435547, "step": 1151} {"info/global_step": 1152, "train_info/time_within_train_step": 2.355881452560425, "step": 1152} {"train_info/time_between_train_steps": 0.00323486328125, "step": 1152} {"info/global_step": 1153, "train_info/time_within_train_step": 2.355884075164795, "step": 1153} {"train_info/time_between_train_steps": 0.003274679183959961, "step": 1153} {"info/global_step": 1154, "train_info/time_within_train_step": 2.355809450149536, "step": 1154} {"train_info/time_between_train_steps": 0.003262042999267578, "step": 1154} {"info/global_step": 1155, "train_info/time_within_train_step": 2.3559083938598633, "step": 1155} {"train_info/time_between_train_steps": 0.003213644027709961, "step": 1155} {"info/global_step": 1156, "train_info/time_within_train_step": 2.356415033340454, "step": 1156} {"train_info/time_between_train_steps": 0.003247499465942383, "step": 1156} {"info/global_step": 1157, "train_info/time_within_train_step": 2.3563764095306396, "step": 1157} {"train_info/time_between_train_steps": 0.003281831741333008, "step": 1157} {"info/global_step": 1158, "train_info/time_within_train_step": 2.3564512729644775, "step": 1158} {"train_info/time_between_train_steps": 0.0032804012298583984, "step": 1158} {"info/global_step": 1159, "train_info/time_within_train_step": 2.3567373752593994, "step": 1159} {"train_info/time_between_train_steps": 0.0032563209533691406, "step": 1159} {"info/global_step": 1160, "train_info/time_within_train_step": 2.356635332107544, "step": 1160} {"train_info/time_between_train_steps": 0.0032172203063964844, "step": 1160} {"info/global_step": 1161, "train_info/time_within_train_step": 2.3560752868652344, "step": 1161} {"train_info/time_between_train_steps": 0.0032913684844970703, "step": 1161} {"info/global_step": 1162, "train_info/time_within_train_step": 2.3559730052948, "step": 1162} {"train_info/time_between_train_steps": 0.003252744674682617, "step": 1162} {"info/global_step": 1163, "train_info/time_within_train_step": 2.356104850769043, "step": 1163} {"train_info/time_between_train_steps": 0.003272533416748047, "step": 1163} {"info/global_step": 1164, "train_info/time_within_train_step": 2.3553380966186523, "step": 1164} {"train_info/time_between_train_steps": 0.003226041793823242, "step": 1164} {"info/global_step": 1165, "train_info/time_within_train_step": 2.354872226715088, "step": 1165} {"train_info/time_between_train_steps": 0.0032231807708740234, "step": 1165} {"info/global_step": 1166, "train_info/time_within_train_step": 2.3555266857147217, "step": 1166} {"train_info/time_between_train_steps": 0.0033774375915527344, "step": 1166} {"info/global_step": 1167, "train_info/time_within_train_step": 2.3565280437469482, "step": 1167} {"train_info/time_between_train_steps": 0.003188610076904297, "step": 1167} {"info/global_step": 1168, "train_info/time_within_train_step": 2.356390953063965, "step": 1168} {"train_info/time_between_train_steps": 0.0031905174255371094, "step": 1168} {"info/global_step": 1169, "train_info/time_within_train_step": 2.3554792404174805, "step": 1169} {"train_info/time_between_train_steps": 0.0032503604888916016, "step": 1169} {"info/global_step": 1170, "train_info/time_within_train_step": 2.3566861152648926, "step": 1170} {"train_info/time_between_train_steps": 0.003227710723876953, "step": 1170} {"info/global_step": 1171, "train_info/time_within_train_step": 2.355903148651123, "step": 1171} {"train_info/time_between_train_steps": 0.003267049789428711, "step": 1171} {"info/global_step": 1172, "train_info/time_within_train_step": 2.5819923877716064, "step": 1172} {"train_info/time_between_train_steps": 0.003186941146850586, "step": 1172} {"info/global_step": 1173, "train_info/time_within_train_step": 2.4883835315704346, "step": 1173} {"train_info/time_between_train_steps": 0.003231525421142578, "step": 1173} {"info/global_step": 1174, "train_info/time_within_train_step": 2.3552029132843018, "step": 1174} {"train_info/time_between_train_steps": 0.003169536590576172, "step": 1174} {"info/global_step": 1175, "train_info/time_within_train_step": 2.3559155464172363, "step": 1175} {"train_info/time_between_train_steps": 0.003215789794921875, "step": 1175} {"info/global_step": 1176, "train_info/time_within_train_step": 2.3560078144073486, "step": 1176} {"train_info/time_between_train_steps": 0.003196239471435547, "step": 1176} {"info/global_step": 1177, "train_info/time_within_train_step": 2.356006622314453, "step": 1177} {"train_info/time_between_train_steps": 0.003215312957763672, "step": 1177} {"info/global_step": 1178, "train_info/time_within_train_step": 2.3561019897460938, "step": 1178} {"train_info/time_between_train_steps": 0.0032045841217041016, "step": 1178} {"info/global_step": 1179, "train_info/time_within_train_step": 2.3549532890319824, "step": 1179} {"train_info/time_between_train_steps": 0.003191709518432617, "step": 1179} {"info/global_step": 1180, "train_info/time_within_train_step": 2.35632586479187, "step": 1180} {"train_info/time_between_train_steps": 0.003176450729370117, "step": 1180} {"info/global_step": 1181, "train_info/time_within_train_step": 2.3547070026397705, "step": 1181} {"train_info/time_between_train_steps": 0.003283262252807617, "step": 1181} {"info/global_step": 1182, "train_info/time_within_train_step": 2.3778014183044434, "step": 1182} {"train_info/time_between_train_steps": 0.003232240676879883, "step": 1182} {"info/global_step": 1183, "train_info/time_within_train_step": 2.355771780014038, "step": 1183} {"train_info/time_between_train_steps": 0.003244638442993164, "step": 1183} {"info/global_step": 1184, "train_info/time_within_train_step": 2.35636043548584, "step": 1184} {"train_info/time_between_train_steps": 0.0031816959381103516, "step": 1184} {"info/global_step": 1185, "train_info/time_within_train_step": 2.3556628227233887, "step": 1185} {"train_info/time_between_train_steps": 0.003190279006958008, "step": 1185} {"info/global_step": 1186, "train_info/time_within_train_step": 2.3580336570739746, "step": 1186} {"train_info/time_between_train_steps": 0.0032362937927246094, "step": 1186} {"info/global_step": 1187, "train_info/time_within_train_step": 2.3566219806671143, "step": 1187} {"train_info/time_between_train_steps": 0.0031890869140625, "step": 1187} {"info/global_step": 1188, "train_info/time_within_train_step": 2.3932700157165527, "step": 1188} {"train_info/time_between_train_steps": 0.0032181739807128906, "step": 1188} {"info/global_step": 1189, "train_info/time_within_train_step": 2.355428457260132, "step": 1189} {"train_info/time_between_train_steps": 0.00318145751953125, "step": 1189} {"info/global_step": 1190, "train_info/time_within_train_step": 2.3555221557617188, "step": 1190} {"train_info/time_between_train_steps": 0.003226041793823242, "step": 1190} {"info/global_step": 1191, "train_info/time_within_train_step": 2.3553149700164795, "step": 1191} {"train_info/time_between_train_steps": 0.003185272216796875, "step": 1191} {"info/global_step": 1192, "train_info/time_within_train_step": 2.355973720550537, "step": 1192} {"train_info/time_between_train_steps": 0.0031921863555908203, "step": 1192} {"info/global_step": 1193, "train_info/time_within_train_step": 2.35630464553833, "step": 1193} {"train_info/time_between_train_steps": 0.003210306167602539, "step": 1193} {"info/global_step": 1194, "train_info/time_within_train_step": 2.355816602706909, "step": 1194} {"train_info/time_between_train_steps": 0.003264904022216797, "step": 1194} {"info/global_step": 1195, "train_info/time_within_train_step": 2.3570377826690674, "step": 1195} {"train_info/time_between_train_steps": 0.003232240676879883, "step": 1195} {"info/global_step": 1196, "train_info/time_within_train_step": 2.5847525596618652, "step": 1196} {"train_info/time_between_train_steps": 0.003204822540283203, "step": 1196} {"info/global_step": 1197, "train_info/time_within_train_step": 2.356346845626831, "step": 1197} {"train_info/time_between_train_steps": 0.0031778812408447266, "step": 1197} {"info/global_step": 1198, "train_info/time_within_train_step": 2.354914426803589, "step": 1198} {"train_info/time_between_train_steps": 0.003173351287841797, "step": 1198} {"info/global_step": 1199, "train_info/time_within_train_step": 2.356400489807129, "step": 1199} {"train_info/time_between_train_steps": 0.0031938552856445312, "step": 1199} {"info/global_step": 1200, "train_info/time_within_train_step": 2.3558125495910645, "step": 1200} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 8708.0, "train_info/memory_max_reserved": 8708.0, "_timestamp": 1746255288, "_runtime": 3107}, "step": 1200} {"logs": {"train/loss": 4.2112, "train/learning_rate": 0.00039999999999999996, "train/epoch": 1.11, "_timestamp": 1746255288, "_runtime": 3107}, "step": 1200} {"train_info/time_between_train_steps": 14.607748746871948, "step": 1200} {"info/global_step": 1201, "train_info/time_within_train_step": 2.1993064880371094, "step": 1201} {"train_info/time_between_train_steps": 0.0032410621643066406, "step": 1201} {"info/global_step": 1202, "train_info/time_within_train_step": 2.1816701889038086, "step": 1202} {"train_info/time_between_train_steps": 0.0031883716583251953, "step": 1202} {"info/global_step": 1203, "train_info/time_within_train_step": 2.2693798542022705, "step": 1203} {"train_info/time_between_train_steps": 0.003259420394897461, "step": 1203} {"info/global_step": 1204, "train_info/time_within_train_step": 2.3504879474639893, "step": 1204} {"train_info/time_between_train_steps": 0.003176450729370117, "step": 1204} {"info/global_step": 1205, "train_info/time_within_train_step": 2.352844476699829, "step": 1205} {"train_info/time_between_train_steps": 0.0032465457916259766, "step": 1205} {"info/global_step": 1206, "train_info/time_within_train_step": 2.356152057647705, "step": 1206} {"train_info/time_between_train_steps": 0.003222227096557617, "step": 1206} {"info/global_step": 1207, "train_info/time_within_train_step": 2.356085777282715, "step": 1207} {"train_info/time_between_train_steps": 0.003275156021118164, "step": 1207} {"info/global_step": 1208, "train_info/time_within_train_step": 2.357344627380371, "step": 1208} {"train_info/time_between_train_steps": 0.003204822540283203, "step": 1208} {"info/global_step": 1209, "train_info/time_within_train_step": 2.3565802574157715, "step": 1209} {"train_info/time_between_train_steps": 0.0032160282135009766, "step": 1209} {"info/global_step": 1210, "train_info/time_within_train_step": 2.3577537536621094, "step": 1210} {"train_info/time_between_train_steps": 0.003192901611328125, "step": 1210} {"info/global_step": 1211, "train_info/time_within_train_step": 2.3579423427581787, "step": 1211} {"train_info/time_between_train_steps": 0.003191709518432617, "step": 1211} {"info/global_step": 1212, "train_info/time_within_train_step": 2.356963872909546, "step": 1212} {"train_info/time_between_train_steps": 0.003185272216796875, "step": 1212} {"info/global_step": 1213, "train_info/time_within_train_step": 2.357842206954956, "step": 1213} {"train_info/time_between_train_steps": 0.0032706260681152344, "step": 1213} {"info/global_step": 1214, "train_info/time_within_train_step": 2.356463670730591, "step": 1214} {"train_info/time_between_train_steps": 0.003208637237548828, "step": 1214} {"info/global_step": 1215, "train_info/time_within_train_step": 2.35676908493042, "step": 1215} {"train_info/time_between_train_steps": 0.003180265426635742, "step": 1215} {"info/global_step": 1216, "train_info/time_within_train_step": 2.3575286865234375, "step": 1216} {"train_info/time_between_train_steps": 0.003231048583984375, "step": 1216} {"info/global_step": 1217, "train_info/time_within_train_step": 2.3571672439575195, "step": 1217} {"train_info/time_between_train_steps": 0.0031709671020507812, "step": 1217} {"info/global_step": 1218, "train_info/time_within_train_step": 2.3570897579193115, "step": 1218} {"train_info/time_between_train_steps": 0.0031690597534179688, "step": 1218} {"info/global_step": 1219, "train_info/time_within_train_step": 2.588001012802124, "step": 1219} {"train_info/time_between_train_steps": 0.0032312870025634766, "step": 1219} {"info/global_step": 1220, "train_info/time_within_train_step": 2.3581290245056152, "step": 1220} {"train_info/time_between_train_steps": 0.003202199935913086, "step": 1220} {"info/global_step": 1221, "train_info/time_within_train_step": 2.3575093746185303, "step": 1221} {"train_info/time_between_train_steps": 0.003233194351196289, "step": 1221} {"info/global_step": 1222, "train_info/time_within_train_step": 2.357496976852417, "step": 1222} {"train_info/time_between_train_steps": 0.003176450729370117, "step": 1222} {"info/global_step": 1223, "train_info/time_within_train_step": 2.3576905727386475, "step": 1223} {"train_info/time_between_train_steps": 0.0031709671020507812, "step": 1223} {"info/global_step": 1224, "train_info/time_within_train_step": 2.3567728996276855, "step": 1224} {"train_info/time_between_train_steps": 0.003194570541381836, "step": 1224} {"info/global_step": 1225, "train_info/time_within_train_step": 2.3575544357299805, "step": 1225} {"train_info/time_between_train_steps": 0.003210783004760742, "step": 1225} {"info/global_step": 1226, "train_info/time_within_train_step": 2.3570058345794678, "step": 1226} {"train_info/time_between_train_steps": 0.0032405853271484375, "step": 1226} {"info/global_step": 1227, "train_info/time_within_train_step": 2.3577749729156494, "step": 1227} {"train_info/time_between_train_steps": 0.003168344497680664, "step": 1227} {"info/global_step": 1228, "train_info/time_within_train_step": 2.357950448989868, "step": 1228} {"train_info/time_between_train_steps": 0.0031871795654296875, "step": 1228} {"info/global_step": 1229, "train_info/time_within_train_step": 2.3580079078674316, "step": 1229} {"train_info/time_between_train_steps": 0.003176450729370117, "step": 1229} {"info/global_step": 1230, "train_info/time_within_train_step": 2.3579769134521484, "step": 1230} {"train_info/time_between_train_steps": 0.0031785964965820312, "step": 1230} {"info/global_step": 1231, "train_info/time_within_train_step": 2.3584673404693604, "step": 1231} {"train_info/time_between_train_steps": 0.003204345703125, "step": 1231} {"info/global_step": 1232, "train_info/time_within_train_step": 2.3567657470703125, "step": 1232} {"train_info/time_between_train_steps": 0.003205537796020508, "step": 1232} {"info/global_step": 1233, "train_info/time_within_train_step": 2.357248067855835, "step": 1233} {"train_info/time_between_train_steps": 0.0032279491424560547, "step": 1233} {"info/global_step": 1234, "train_info/time_within_train_step": 2.356975555419922, "step": 1234} {"train_info/time_between_train_steps": 0.0032129287719726562, "step": 1234} {"info/global_step": 1235, "train_info/time_within_train_step": 2.356456995010376, "step": 1235} {"train_info/time_between_train_steps": 0.1266324520111084, "step": 1235} {"info/global_step": 1236, "train_info/time_within_train_step": 2.3756816387176514, "step": 1236} {"train_info/time_between_train_steps": 0.0032138824462890625, "step": 1236} {"info/global_step": 1237, "train_info/time_within_train_step": 2.357746124267578, "step": 1237} {"train_info/time_between_train_steps": 0.003242015838623047, "step": 1237} {"info/global_step": 1238, "train_info/time_within_train_step": 2.3575243949890137, "step": 1238} {"train_info/time_between_train_steps": 0.0032291412353515625, "step": 1238} {"info/global_step": 1239, "train_info/time_within_train_step": 2.3583309650421143, "step": 1239} {"train_info/time_between_train_steps": 0.003206968307495117, "step": 1239} {"info/global_step": 1240, "train_info/time_within_train_step": 2.3569555282592773, "step": 1240} {"train_info/time_between_train_steps": 0.003200531005859375, "step": 1240} {"info/global_step": 1241, "train_info/time_within_train_step": 2.358206033706665, "step": 1241} {"train_info/time_between_train_steps": 0.0031769275665283203, "step": 1241} {"info/global_step": 1242, "train_info/time_within_train_step": 2.357820510864258, "step": 1242} {"train_info/time_between_train_steps": 0.003175497055053711, "step": 1242} {"info/global_step": 1243, "train_info/time_within_train_step": 2.357891321182251, "step": 1243} {"train_info/time_between_train_steps": 0.0032079219818115234, "step": 1243} {"info/global_step": 1244, "train_info/time_within_train_step": 2.5862677097320557, "step": 1244} {"train_info/time_between_train_steps": 0.0032427310943603516, "step": 1244} {"info/global_step": 1245, "train_info/time_within_train_step": 2.356863021850586, "step": 1245} {"train_info/time_between_train_steps": 0.003200531005859375, "step": 1245} {"info/global_step": 1246, "train_info/time_within_train_step": 2.356666326522827, "step": 1246} {"train_info/time_between_train_steps": 0.003184080123901367, "step": 1246} {"info/global_step": 1247, "train_info/time_within_train_step": 2.389495372772217, "step": 1247} {"train_info/time_between_train_steps": 0.0032851696014404297, "step": 1247} {"info/global_step": 1248, "train_info/time_within_train_step": 2.356893539428711, "step": 1248} {"train_info/time_between_train_steps": 0.0031728744506835938, "step": 1248} {"info/global_step": 1249, "train_info/time_within_train_step": 2.3573989868164062, "step": 1249} {"train_info/time_between_train_steps": 0.0032095909118652344, "step": 1249} {"info/global_step": 1250, "train_info/time_within_train_step": 2.901048183441162, "step": 1250} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 8708.0, "train_info/memory_max_reserved": 8708.0, "_timestamp": 1746255423, "_runtime": 3242}, "step": 1250} {"logs": {"train/loss": 4.1767, "train/learning_rate": 0.00038888888888888887, "train/epoch": 1.13, "_timestamp": 1746255423, "_runtime": 3242}, "step": 1250} {"train_info/time_between_train_steps": 0.02340078353881836, "step": 1250} {"info/global_step": 1251, "train_info/time_within_train_step": 2.3582067489624023, "step": 1251} {"train_info/time_between_train_steps": 0.003190279006958008, "step": 1251} {"info/global_step": 1252, "train_info/time_within_train_step": 2.357545852661133, "step": 1252} {"train_info/time_between_train_steps": 0.0031974315643310547, "step": 1252} {"info/global_step": 1253, "train_info/time_within_train_step": 2.366173267364502, "step": 1253} {"train_info/time_between_train_steps": 0.003189563751220703, "step": 1253} {"info/global_step": 1254, "train_info/time_within_train_step": 2.358368158340454, "step": 1254} {"train_info/time_between_train_steps": 0.0032269954681396484, "step": 1254} {"info/global_step": 1255, "train_info/time_within_train_step": 2.3570556640625, "step": 1255} {"train_info/time_between_train_steps": 0.0032606124877929688, "step": 1255} {"info/global_step": 1256, "train_info/time_within_train_step": 2.35691499710083, "step": 1256} {"train_info/time_between_train_steps": 0.0032401084899902344, "step": 1256} {"info/global_step": 1257, "train_info/time_within_train_step": 2.3576908111572266, "step": 1257} {"train_info/time_between_train_steps": 0.003197908401489258, "step": 1257} {"info/global_step": 1258, "train_info/time_within_train_step": 2.3570375442504883, "step": 1258} {"train_info/time_between_train_steps": 0.0032033920288085938, "step": 1258} {"info/global_step": 1259, "train_info/time_within_train_step": 2.3579673767089844, "step": 1259} {"train_info/time_between_train_steps": 0.003184080123901367, "step": 1259} {"info/global_step": 1260, "train_info/time_within_train_step": 2.357125759124756, "step": 1260} {"train_info/time_between_train_steps": 0.0032491683959960938, "step": 1260} {"info/global_step": 1261, "train_info/time_within_train_step": 2.357067108154297, "step": 1261} {"train_info/time_between_train_steps": 0.0031883716583251953, "step": 1261} {"info/global_step": 1262, "train_info/time_within_train_step": 2.3568837642669678, "step": 1262} {"train_info/time_between_train_steps": 0.003248929977416992, "step": 1262} {"info/global_step": 1263, "train_info/time_within_train_step": 2.3578994274139404, "step": 1263} {"train_info/time_between_train_steps": 0.003225088119506836, "step": 1263} {"info/global_step": 1264, "train_info/time_within_train_step": 2.356531858444214, "step": 1264} {"train_info/time_between_train_steps": 0.003218412399291992, "step": 1264} {"info/global_step": 1265, "train_info/time_within_train_step": 2.357593059539795, "step": 1265} {"train_info/time_between_train_steps": 0.0032265186309814453, "step": 1265} {"info/global_step": 1266, "train_info/time_within_train_step": 2.3573203086853027, "step": 1266} {"train_info/time_between_train_steps": 0.003209352493286133, "step": 1266} {"info/global_step": 1267, "train_info/time_within_train_step": 2.357131004333496, "step": 1267} {"train_info/time_between_train_steps": 0.0031991004943847656, "step": 1267} {"info/global_step": 1268, "train_info/time_within_train_step": 2.3573997020721436, "step": 1268} {"train_info/time_between_train_steps": 0.003210783004760742, "step": 1268} {"info/global_step": 1269, "train_info/time_within_train_step": 2.5581557750701904, "step": 1269} {"train_info/time_between_train_steps": 0.0032491683959960938, "step": 1269} {"info/global_step": 1270, "train_info/time_within_train_step": 2.356950283050537, "step": 1270} {"train_info/time_between_train_steps": 0.003166675567626953, "step": 1270} {"info/global_step": 1271, "train_info/time_within_train_step": 2.357541561126709, "step": 1271} {"train_info/time_between_train_steps": 0.0031952857971191406, "step": 1271} {"info/global_step": 1272, "train_info/time_within_train_step": 2.357208013534546, "step": 1272} {"train_info/time_between_train_steps": 0.0032579898834228516, "step": 1272} {"info/global_step": 1273, "train_info/time_within_train_step": 2.3565104007720947, "step": 1273} {"train_info/time_between_train_steps": 0.0032622814178466797, "step": 1273} {"info/global_step": 1274, "train_info/time_within_train_step": 2.357996702194214, "step": 1274} {"train_info/time_between_train_steps": 0.0031952857971191406, "step": 1274} {"info/global_step": 1275, "train_info/time_within_train_step": 2.357009172439575, "step": 1275} {"train_info/time_between_train_steps": 0.0031952857971191406, "step": 1275} {"info/global_step": 1276, "train_info/time_within_train_step": 2.356574296951294, "step": 1276} {"train_info/time_between_train_steps": 0.003194570541381836, "step": 1276} {"info/global_step": 1277, "train_info/time_within_train_step": 2.357229471206665, "step": 1277} {"train_info/time_between_train_steps": 0.004254579544067383, "step": 1277} {"info/global_step": 1278, "train_info/time_within_train_step": 2.3583102226257324, "step": 1278} {"train_info/time_between_train_steps": 0.003202199935913086, "step": 1278} {"info/global_step": 1279, "train_info/time_within_train_step": 2.356633424758911, "step": 1279} {"train_info/time_between_train_steps": 0.0032482147216796875, "step": 1279} {"info/global_step": 1280, "train_info/time_within_train_step": 2.357893466949463, "step": 1280} {"train_info/time_between_train_steps": 0.0032186508178710938, "step": 1280} {"info/global_step": 1281, "train_info/time_within_train_step": 2.35788893699646, "step": 1281} {"train_info/time_between_train_steps": 0.0031867027282714844, "step": 1281} {"info/global_step": 1282, "train_info/time_within_train_step": 2.3564815521240234, "step": 1282} {"train_info/time_between_train_steps": 0.0031871795654296875, "step": 1282} {"info/global_step": 1283, "train_info/time_within_train_step": 2.357516050338745, "step": 1283} {"train_info/time_between_train_steps": 0.003220081329345703, "step": 1283} {"info/global_step": 1284, "train_info/time_within_train_step": 2.35848069190979, "step": 1284} {"train_info/time_between_train_steps": 0.0031616687774658203, "step": 1284} {"info/global_step": 1285, "train_info/time_within_train_step": 2.3567190170288086, "step": 1285} {"train_info/time_between_train_steps": 0.003224611282348633, "step": 1285} {"info/global_step": 1286, "train_info/time_within_train_step": 2.3577847480773926, "step": 1286} {"train_info/time_between_train_steps": 0.003215312957763672, "step": 1286} {"info/global_step": 1287, "train_info/time_within_train_step": 2.3567891120910645, "step": 1287} {"train_info/time_between_train_steps": 0.0031931400299072266, "step": 1287} {"info/global_step": 1288, "train_info/time_within_train_step": 2.3565099239349365, "step": 1288} {"train_info/time_between_train_steps": 0.003244161605834961, "step": 1288} {"info/global_step": 1289, "train_info/time_within_train_step": 2.357097864151001, "step": 1289} {"train_info/time_between_train_steps": 0.003191232681274414, "step": 1289} {"info/global_step": 1290, "train_info/time_within_train_step": 2.3571078777313232, "step": 1290} {"train_info/time_between_train_steps": 0.0032448768615722656, "step": 1290} {"info/global_step": 1291, "train_info/time_within_train_step": 2.357429265975952, "step": 1291} {"train_info/time_between_train_steps": 0.003220796585083008, "step": 1291} {"info/global_step": 1292, "train_info/time_within_train_step": 2.357236623764038, "step": 1292} {"train_info/time_between_train_steps": 0.003220796585083008, "step": 1292} {"info/global_step": 1293, "train_info/time_within_train_step": 2.5929136276245117, "step": 1293} {"train_info/time_between_train_steps": 0.0032196044921875, "step": 1293} {"info/global_step": 1294, "train_info/time_within_train_step": 2.3561179637908936, "step": 1294} {"train_info/time_between_train_steps": 0.0031850337982177734, "step": 1294} {"info/global_step": 1295, "train_info/time_within_train_step": 2.3566439151763916, "step": 1295} {"train_info/time_between_train_steps": 0.0031909942626953125, "step": 1295} {"info/global_step": 1296, "train_info/time_within_train_step": 2.3557512760162354, "step": 1296} {"train_info/time_between_train_steps": 0.0031974315643310547, "step": 1296} {"info/global_step": 1297, "train_info/time_within_train_step": 2.390357255935669, "step": 1297} {"train_info/time_between_train_steps": 0.0032129287719726562, "step": 1297} {"info/global_step": 1298, "train_info/time_within_train_step": 2.5008692741394043, "step": 1298} {"train_info/time_between_train_steps": 0.003239154815673828, "step": 1298} {"info/global_step": 1299, "train_info/time_within_train_step": 2.357386350631714, "step": 1299} {"train_info/time_between_train_steps": 0.0032160282135009766, "step": 1299} {"info/global_step": 1300, "train_info/time_within_train_step": 2.3578264713287354, "step": 1300} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 8708.0, "train_info/memory_max_reserved": 8708.0, "_timestamp": 1746255542, "_runtime": 3361}, "step": 1300} {"logs": {"train/loss": 4.1512, "train/learning_rate": 0.00037777777777777777, "train/epoch": 1.15, "_timestamp": 1746255542, "_runtime": 3361}, "step": 1300} {"train_info/time_between_train_steps": 29.720782995224, "step": 1300} {"info/global_step": 1301, "train_info/time_within_train_step": 2.20351243019104, "step": 1301} {"train_info/time_between_train_steps": 0.0032584667205810547, "step": 1301} {"info/global_step": 1302, "train_info/time_within_train_step": 2.183199644088745, "step": 1302} {"train_info/time_between_train_steps": 0.0032176971435546875, "step": 1302} {"info/global_step": 1303, "train_info/time_within_train_step": 2.183229446411133, "step": 1303} {"train_info/time_between_train_steps": 0.003218412399291992, "step": 1303} {"info/global_step": 1304, "train_info/time_within_train_step": 2.24948787689209, "step": 1304} {"train_info/time_between_train_steps": 0.0031995773315429688, "step": 1304} {"info/global_step": 1305, "train_info/time_within_train_step": 2.3494491577148438, "step": 1305} {"train_info/time_between_train_steps": 0.0032129287719726562, "step": 1305} {"info/global_step": 1306, "train_info/time_within_train_step": 2.353461503982544, "step": 1306} {"train_info/time_between_train_steps": 0.0034868717193603516, "step": 1306} {"info/global_step": 1307, "train_info/time_within_train_step": 2.353644847869873, "step": 1307} {"train_info/time_between_train_steps": 0.003437519073486328, "step": 1307} {"info/global_step": 1308, "train_info/time_within_train_step": 2.3556909561157227, "step": 1308} {"train_info/time_between_train_steps": 0.003223419189453125, "step": 1308} {"info/global_step": 1309, "train_info/time_within_train_step": 2.3552534580230713, "step": 1309} {"train_info/time_between_train_steps": 0.003272533416748047, "step": 1309} {"info/global_step": 1310, "train_info/time_within_train_step": 2.3883609771728516, "step": 1310} {"train_info/time_between_train_steps": 0.0031991004943847656, "step": 1310} {"info/global_step": 1311, "train_info/time_within_train_step": 2.355908155441284, "step": 1311} {"train_info/time_between_train_steps": 0.0031921863555908203, "step": 1311} {"info/global_step": 1312, "train_info/time_within_train_step": 2.3576691150665283, "step": 1312} {"train_info/time_between_train_steps": 0.0032041072845458984, "step": 1312} {"info/global_step": 1313, "train_info/time_within_train_step": 2.358053207397461, "step": 1313} {"train_info/time_between_train_steps": 0.0031838417053222656, "step": 1313} {"info/global_step": 1314, "train_info/time_within_train_step": 2.356393575668335, "step": 1314} {"train_info/time_between_train_steps": 0.003233671188354492, "step": 1314} {"info/global_step": 1315, "train_info/time_within_train_step": 2.358332395553589, "step": 1315} {"train_info/time_between_train_steps": 0.0032422542572021484, "step": 1315} {"info/global_step": 1316, "train_info/time_within_train_step": 2.356572151184082, "step": 1316} {"train_info/time_between_train_steps": 0.003288745880126953, "step": 1316} {"info/global_step": 1317, "train_info/time_within_train_step": 2.3564140796661377, "step": 1317} {"train_info/time_between_train_steps": 0.0031890869140625, "step": 1317} {"info/global_step": 1318, "train_info/time_within_train_step": 2.59375262260437, "step": 1318} {"train_info/time_between_train_steps": 0.003196239471435547, "step": 1318} {"info/global_step": 1319, "train_info/time_within_train_step": 2.356278419494629, "step": 1319} {"train_info/time_between_train_steps": 0.003172159194946289, "step": 1319} {"info/global_step": 1320, "train_info/time_within_train_step": 2.3553764820098877, "step": 1320} {"train_info/time_between_train_steps": 0.003254413604736328, "step": 1320} {"info/global_step": 1321, "train_info/time_within_train_step": 2.3564810752868652, "step": 1321} {"train_info/time_between_train_steps": 0.0032792091369628906, "step": 1321} {"info/global_step": 1322, "train_info/time_within_train_step": 2.35697603225708, "step": 1322} {"train_info/time_between_train_steps": 0.0032396316528320312, "step": 1322} {"info/global_step": 1323, "train_info/time_within_train_step": 2.355563163757324, "step": 1323} {"train_info/time_between_train_steps": 0.0032014846801757812, "step": 1323} {"info/global_step": 1324, "train_info/time_within_train_step": 2.3564155101776123, "step": 1324} {"train_info/time_between_train_steps": 0.00318145751953125, "step": 1324} {"info/global_step": 1325, "train_info/time_within_train_step": 2.3562171459198, "step": 1325} {"train_info/time_between_train_steps": 0.003180980682373047, "step": 1325} {"info/global_step": 1326, "train_info/time_within_train_step": 2.3572583198547363, "step": 1326} {"train_info/time_between_train_steps": 0.0033576488494873047, "step": 1326} {"info/global_step": 1327, "train_info/time_within_train_step": 2.3570544719696045, "step": 1327} {"train_info/time_between_train_steps": 0.0032308101654052734, "step": 1327} {"info/global_step": 1328, "train_info/time_within_train_step": 2.3560144901275635, "step": 1328} {"train_info/time_between_train_steps": 0.0032231807708740234, "step": 1328} {"info/global_step": 1329, "train_info/time_within_train_step": 2.3560380935668945, "step": 1329} {"train_info/time_between_train_steps": 0.0032050609588623047, "step": 1329} {"info/global_step": 1330, "train_info/time_within_train_step": 2.356646776199341, "step": 1330} {"train_info/time_between_train_steps": 0.003184795379638672, "step": 1330} {"info/global_step": 1331, "train_info/time_within_train_step": 2.3569090366363525, "step": 1331} {"train_info/time_between_train_steps": 0.003233671188354492, "step": 1331} {"info/global_step": 1332, "train_info/time_within_train_step": 2.356177806854248, "step": 1332} {"train_info/time_between_train_steps": 0.0031697750091552734, "step": 1332} {"info/global_step": 1333, "train_info/time_within_train_step": 2.3553130626678467, "step": 1333} {"train_info/time_between_train_steps": 0.003278493881225586, "step": 1333} {"info/global_step": 1334, "train_info/time_within_train_step": 2.3552024364471436, "step": 1334} {"train_info/time_between_train_steps": 0.0032401084899902344, "step": 1334} {"info/global_step": 1335, "train_info/time_within_train_step": 2.3555219173431396, "step": 1335} {"train_info/time_between_train_steps": 0.003209829330444336, "step": 1335} {"info/global_step": 1336, "train_info/time_within_train_step": 2.3562779426574707, "step": 1336} {"train_info/time_between_train_steps": 0.003187417984008789, "step": 1336} {"info/global_step": 1337, "train_info/time_within_train_step": 2.3563971519470215, "step": 1337} {"train_info/time_between_train_steps": 0.0031762123107910156, "step": 1337} {"info/global_step": 1338, "train_info/time_within_train_step": 2.354851245880127, "step": 1338} {"train_info/time_between_train_steps": 0.0032029151916503906, "step": 1338} {"info/global_step": 1339, "train_info/time_within_train_step": 2.355581283569336, "step": 1339} {"train_info/time_between_train_steps": 0.00322723388671875, "step": 1339} {"info/global_step": 1340, "train_info/time_within_train_step": 2.356437921524048, "step": 1340} {"train_info/time_between_train_steps": 0.0032570362091064453, "step": 1340} {"info/global_step": 1341, "train_info/time_within_train_step": 2.355506658554077, "step": 1341} {"train_info/time_between_train_steps": 0.0032165050506591797, "step": 1341} {"info/global_step": 1342, "train_info/time_within_train_step": 2.5977814197540283, "step": 1342} {"train_info/time_between_train_steps": 0.003254413604736328, "step": 1342} {"info/global_step": 1343, "train_info/time_within_train_step": 2.3553388118743896, "step": 1343} {"train_info/time_between_train_steps": 0.003175973892211914, "step": 1343} {"info/global_step": 1344, "train_info/time_within_train_step": 2.3555827140808105, "step": 1344} {"train_info/time_between_train_steps": 0.003175020217895508, "step": 1344} {"info/global_step": 1345, "train_info/time_within_train_step": 2.355529308319092, "step": 1345} {"train_info/time_between_train_steps": 0.00323486328125, "step": 1345} {"info/global_step": 1346, "train_info/time_within_train_step": 2.3556203842163086, "step": 1346} {"train_info/time_between_train_steps": 0.003180265426635742, "step": 1346} {"info/global_step": 1347, "train_info/time_within_train_step": 2.3554303646087646, "step": 1347} {"train_info/time_between_train_steps": 0.0031898021697998047, "step": 1347} {"info/global_step": 1348, "train_info/time_within_train_step": 2.3562517166137695, "step": 1348} {"train_info/time_between_train_steps": 0.0032303333282470703, "step": 1348} {"info/global_step": 1349, "train_info/time_within_train_step": 2.3562769889831543, "step": 1349} {"train_info/time_between_train_steps": 0.003190279006958008, "step": 1349} {"info/global_step": 1350, "train_info/time_within_train_step": 2.3556838035583496, "step": 1350} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 8708.0, "train_info/memory_max_reserved": 8708.0, "_timestamp": 1746255691, "_runtime": 3510}, "step": 1350} {"logs": {"train/loss": 4.1308, "train/learning_rate": 0.00036666666666666667, "train/epoch": 1.16, "_timestamp": 1746255691, "_runtime": 3510}, "step": 1350} {"train_info/time_between_train_steps": 0.030225276947021484, "step": 1350} {"info/global_step": 1351, "train_info/time_within_train_step": 2.3569564819335938, "step": 1351} {"train_info/time_between_train_steps": 0.0032117366790771484, "step": 1351} {"info/global_step": 1352, "train_info/time_within_train_step": 2.3561620712280273, "step": 1352} {"train_info/time_between_train_steps": 0.0032660961151123047, "step": 1352} {"info/global_step": 1353, "train_info/time_within_train_step": 2.355630874633789, "step": 1353} {"train_info/time_between_train_steps": 0.003192901611328125, "step": 1353} {"info/global_step": 1354, "train_info/time_within_train_step": 2.3561129570007324, "step": 1354} {"train_info/time_between_train_steps": 0.0032117366790771484, "step": 1354} {"info/global_step": 1355, "train_info/time_within_train_step": 2.355421543121338, "step": 1355} {"train_info/time_between_train_steps": 0.003173828125, "step": 1355} {"info/global_step": 1356, "train_info/time_within_train_step": 2.355541467666626, "step": 1356} {"train_info/time_between_train_steps": 0.003176450729370117, "step": 1356} {"info/global_step": 1357, "train_info/time_within_train_step": 2.355351686477661, "step": 1357} {"train_info/time_between_train_steps": 0.003177642822265625, "step": 1357} {"info/global_step": 1358, "train_info/time_within_train_step": 2.3561160564422607, "step": 1358} {"train_info/time_between_train_steps": 0.0032508373260498047, "step": 1358} {"info/global_step": 1359, "train_info/time_within_train_step": 2.3561534881591797, "step": 1359} {"train_info/time_between_train_steps": 0.003247499465942383, "step": 1359} {"info/global_step": 1360, "train_info/time_within_train_step": 2.3552563190460205, "step": 1360} {"train_info/time_between_train_steps": 0.10472464561462402, "step": 1360} {"info/global_step": 1361, "train_info/time_within_train_step": 2.356403350830078, "step": 1361} {"train_info/time_between_train_steps": 0.0032367706298828125, "step": 1361} {"info/global_step": 1362, "train_info/time_within_train_step": 2.356509208679199, "step": 1362} {"train_info/time_between_train_steps": 0.0032045841217041016, "step": 1362} {"info/global_step": 1363, "train_info/time_within_train_step": 2.3556971549987793, "step": 1363} {"train_info/time_between_train_steps": 0.0031883716583251953, "step": 1363} {"info/global_step": 1364, "train_info/time_within_train_step": 2.355984926223755, "step": 1364} {"train_info/time_between_train_steps": 0.0032477378845214844, "step": 1364} {"info/global_step": 1365, "train_info/time_within_train_step": 2.356027364730835, "step": 1365} {"train_info/time_between_train_steps": 0.0032701492309570312, "step": 1365} {"info/global_step": 1366, "train_info/time_within_train_step": 2.3549795150756836, "step": 1366} {"train_info/time_between_train_steps": 0.003231048583984375, "step": 1366} {"info/global_step": 1367, "train_info/time_within_train_step": 2.354663133621216, "step": 1367} {"train_info/time_between_train_steps": 0.003247499465942383, "step": 1367} {"info/global_step": 1368, "train_info/time_within_train_step": 2.6136112213134766, "step": 1368} {"train_info/time_between_train_steps": 0.003192424774169922, "step": 1368} {"info/global_step": 1369, "train_info/time_within_train_step": 2.355759859085083, "step": 1369} {"train_info/time_between_train_steps": 0.0031783580780029297, "step": 1369} {"info/global_step": 1370, "train_info/time_within_train_step": 2.355677843093872, "step": 1370} {"train_info/time_between_train_steps": 0.003211498260498047, "step": 1370} {"info/global_step": 1371, "train_info/time_within_train_step": 2.3556249141693115, "step": 1371} {"train_info/time_between_train_steps": 0.0032536983489990234, "step": 1371} {"info/global_step": 1372, "train_info/time_within_train_step": 2.355095624923706, "step": 1372} {"train_info/time_between_train_steps": 0.003187417984008789, "step": 1372} {"info/global_step": 1373, "train_info/time_within_train_step": 2.355689287185669, "step": 1373} {"train_info/time_between_train_steps": 0.003179788589477539, "step": 1373} {"info/global_step": 1374, "train_info/time_within_train_step": 2.3573522567749023, "step": 1374} {"train_info/time_between_train_steps": 0.0031719207763671875, "step": 1374} {"info/global_step": 1375, "train_info/time_within_train_step": 2.3551557064056396, "step": 1375} {"train_info/time_between_train_steps": 0.0031986236572265625, "step": 1375} {"info/global_step": 1376, "train_info/time_within_train_step": 2.354918956756592, "step": 1376} {"train_info/time_between_train_steps": 0.0031867027282714844, "step": 1376} {"info/global_step": 1377, "train_info/time_within_train_step": 2.3557350635528564, "step": 1377} {"train_info/time_between_train_steps": 0.0034058094024658203, "step": 1377} {"info/global_step": 1378, "train_info/time_within_train_step": 2.355464458465576, "step": 1378} {"train_info/time_between_train_steps": 0.0031549930572509766, "step": 1378} {"info/global_step": 1379, "train_info/time_within_train_step": 2.355178117752075, "step": 1379} {"train_info/time_between_train_steps": 0.003143310546875, "step": 1379} {"info/global_step": 1380, "train_info/time_within_train_step": 2.355724573135376, "step": 1380} {"train_info/time_between_train_steps": 0.0031244754791259766, "step": 1380} {"info/global_step": 1381, "train_info/time_within_train_step": 2.3549983501434326, "step": 1381} {"train_info/time_between_train_steps": 0.003140687942504883, "step": 1381} {"info/global_step": 1382, "train_info/time_within_train_step": 2.3556742668151855, "step": 1382} {"train_info/time_between_train_steps": 0.0032324790954589844, "step": 1382} {"info/global_step": 1383, "train_info/time_within_train_step": 2.355358839035034, "step": 1383} {"train_info/time_between_train_steps": 0.003186941146850586, "step": 1383} {"info/global_step": 1384, "train_info/time_within_train_step": 2.355898141860962, "step": 1384} {"train_info/time_between_train_steps": 0.003232240676879883, "step": 1384} {"info/global_step": 1385, "train_info/time_within_train_step": 2.3546948432922363, "step": 1385} {"train_info/time_between_train_steps": 0.0031692981719970703, "step": 1385} {"info/global_step": 1386, "train_info/time_within_train_step": 2.3554017543792725, "step": 1386} {"train_info/time_between_train_steps": 0.003212451934814453, "step": 1386} {"info/global_step": 1387, "train_info/time_within_train_step": 2.3552963733673096, "step": 1387} {"train_info/time_between_train_steps": 0.003171682357788086, "step": 1387} {"info/global_step": 1388, "train_info/time_within_train_step": 2.3560822010040283, "step": 1388} {"train_info/time_between_train_steps": 0.003182649612426758, "step": 1388} {"info/global_step": 1389, "train_info/time_within_train_step": 2.356208086013794, "step": 1389} {"train_info/time_between_train_steps": 0.0032477378845214844, "step": 1389} {"info/global_step": 1390, "train_info/time_within_train_step": 2.3556628227233887, "step": 1390} {"train_info/time_between_train_steps": 0.003243684768676758, "step": 1390} {"info/global_step": 1391, "train_info/time_within_train_step": 2.356292247772217, "step": 1391} {"train_info/time_between_train_steps": 0.0031630992889404297, "step": 1391} {"info/global_step": 1392, "train_info/time_within_train_step": 2.5583317279815674, "step": 1392} {"train_info/time_between_train_steps": 0.0032548904418945312, "step": 1392} {"info/global_step": 1393, "train_info/time_within_train_step": 2.355771064758301, "step": 1393} {"train_info/time_between_train_steps": 0.0031425952911376953, "step": 1393} {"info/global_step": 1394, "train_info/time_within_train_step": 2.3548777103424072, "step": 1394} {"train_info/time_between_train_steps": 0.0031630992889404297, "step": 1394} {"info/global_step": 1395, "train_info/time_within_train_step": 2.355088710784912, "step": 1395} {"train_info/time_between_train_steps": 0.0032014846801757812, "step": 1395} {"info/global_step": 1396, "train_info/time_within_train_step": 2.3550734519958496, "step": 1396} {"train_info/time_between_train_steps": 0.0031926631927490234, "step": 1396} {"info/global_step": 1397, "train_info/time_within_train_step": 2.35553240776062, "step": 1397} {"train_info/time_between_train_steps": 0.0031692981719970703, "step": 1397} {"info/global_step": 1398, "train_info/time_within_train_step": 2.355602264404297, "step": 1398} {"train_info/time_between_train_steps": 0.0031599998474121094, "step": 1398} {"info/global_step": 1399, "train_info/time_within_train_step": 2.354827404022217, "step": 1399} {"train_info/time_between_train_steps": 0.0031991004943847656, "step": 1399} {"info/global_step": 1400, "train_info/time_within_train_step": 2.356067419052124, "step": 1400} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 8708.0, "train_info/memory_max_reserved": 8708.0, "_timestamp": 1746255810, "_runtime": 3629}, "step": 1400} {"logs": {"train/loss": 4.1085, "train/learning_rate": 0.0003555555555555555, "train/epoch": 1.18, "_timestamp": 1746255810, "_runtime": 3629}, "step": 1400} {"train_info/time_between_train_steps": 21.038169145584106, "step": 1400} {"info/global_step": 1401, "train_info/time_within_train_step": 2.2004165649414062, "step": 1401} {"train_info/time_between_train_steps": 0.0032134056091308594, "step": 1401} {"info/global_step": 1402, "train_info/time_within_train_step": 2.183009386062622, "step": 1402} {"train_info/time_between_train_steps": 0.0031833648681640625, "step": 1402} {"info/global_step": 1403, "train_info/time_within_train_step": 2.1867053508758545, "step": 1403} {"train_info/time_between_train_steps": 0.003186941146850586, "step": 1403} {"info/global_step": 1404, "train_info/time_within_train_step": 2.317948818206787, "step": 1404} {"train_info/time_between_train_steps": 0.003191232681274414, "step": 1404} {"info/global_step": 1405, "train_info/time_within_train_step": 2.3523008823394775, "step": 1405} {"train_info/time_between_train_steps": 0.0031948089599609375, "step": 1405} {"info/global_step": 1406, "train_info/time_within_train_step": 2.356062650680542, "step": 1406} {"train_info/time_between_train_steps": 0.0031528472900390625, "step": 1406} {"info/global_step": 1407, "train_info/time_within_train_step": 2.355576992034912, "step": 1407} {"train_info/time_between_train_steps": 0.0037453174591064453, "step": 1407} {"info/global_step": 1408, "train_info/time_within_train_step": 2.3770673274993896, "step": 1408} {"train_info/time_between_train_steps": 0.0029230117797851562, "step": 1408} {"info/global_step": 1409, "train_info/time_within_train_step": 2.3552935123443604, "step": 1409} {"train_info/time_between_train_steps": 0.0029621124267578125, "step": 1409} {"info/global_step": 1410, "train_info/time_within_train_step": 2.3568732738494873, "step": 1410} {"train_info/time_between_train_steps": 0.00310516357421875, "step": 1410} {"info/global_step": 1411, "train_info/time_within_train_step": 2.3560800552368164, "step": 1411} {"train_info/time_between_train_steps": 0.0030236244201660156, "step": 1411} {"info/global_step": 1412, "train_info/time_within_train_step": 2.356820583343506, "step": 1412} {"train_info/time_between_train_steps": 0.0031273365020751953, "step": 1412} {"info/global_step": 1413, "train_info/time_within_train_step": 2.357741117477417, "step": 1413} {"train_info/time_between_train_steps": 0.0030350685119628906, "step": 1413} {"info/global_step": 1414, "train_info/time_within_train_step": 2.3579914569854736, "step": 1414} {"train_info/time_between_train_steps": 0.0031485557556152344, "step": 1414} {"info/global_step": 1415, "train_info/time_within_train_step": 2.356592893600464, "step": 1415} {"train_info/time_between_train_steps": 0.0031099319458007812, "step": 1415} {"info/global_step": 1416, "train_info/time_within_train_step": 2.3573789596557617, "step": 1416} {"train_info/time_between_train_steps": 0.0031609535217285156, "step": 1416} {"info/global_step": 1417, "train_info/time_within_train_step": 2.652841567993164, "step": 1417} {"train_info/time_between_train_steps": 0.0029408931732177734, "step": 1417} {"info/global_step": 1418, "train_info/time_within_train_step": 2.3567731380462646, "step": 1418} {"train_info/time_between_train_steps": 0.0029134750366210938, "step": 1418} {"info/global_step": 1419, "train_info/time_within_train_step": 2.3567452430725098, "step": 1419} {"train_info/time_between_train_steps": 0.0028994083404541016, "step": 1419} {"info/global_step": 1420, "train_info/time_within_train_step": 2.394418716430664, "step": 1420} {"train_info/time_between_train_steps": 0.0029256343841552734, "step": 1420} {"info/global_step": 1421, "train_info/time_within_train_step": 2.3566501140594482, "step": 1421} {"train_info/time_between_train_steps": 0.0029451847076416016, "step": 1421} {"info/global_step": 1422, "train_info/time_within_train_step": 2.357144594192505, "step": 1422} {"train_info/time_between_train_steps": 0.002860546112060547, "step": 1422} {"info/global_step": 1423, "train_info/time_within_train_step": 2.356147289276123, "step": 1423} {"train_info/time_between_train_steps": 0.0028870105743408203, "step": 1423} {"info/global_step": 1424, "train_info/time_within_train_step": 2.355306625366211, "step": 1424} {"train_info/time_between_train_steps": 0.002887725830078125, "step": 1424} {"info/global_step": 1425, "train_info/time_within_train_step": 2.3559491634368896, "step": 1425} {"train_info/time_between_train_steps": 0.002880096435546875, "step": 1425} {"info/global_step": 1426, "train_info/time_within_train_step": 2.356844902038574, "step": 1426} {"train_info/time_between_train_steps": 0.003000020980834961, "step": 1426} {"info/global_step": 1427, "train_info/time_within_train_step": 2.3564608097076416, "step": 1427} {"train_info/time_between_train_steps": 0.002913951873779297, "step": 1427} {"info/global_step": 1428, "train_info/time_within_train_step": 2.355794906616211, "step": 1428} {"train_info/time_between_train_steps": 0.0029366016387939453, "step": 1428} {"info/global_step": 1429, "train_info/time_within_train_step": 2.3571977615356445, "step": 1429} {"train_info/time_between_train_steps": 0.002957582473754883, "step": 1429} {"info/global_step": 1430, "train_info/time_within_train_step": 2.3556628227233887, "step": 1430} {"train_info/time_between_train_steps": 0.002933979034423828, "step": 1430} {"info/global_step": 1431, "train_info/time_within_train_step": 2.3565869331359863, "step": 1431} {"train_info/time_between_train_steps": 0.0029129981994628906, "step": 1431} {"info/global_step": 1432, "train_info/time_within_train_step": 2.3566110134124756, "step": 1432} {"train_info/time_between_train_steps": 0.002925395965576172, "step": 1432} {"info/global_step": 1433, "train_info/time_within_train_step": 2.357511520385742, "step": 1433} {"train_info/time_between_train_steps": 0.0029807090759277344, "step": 1433} {"info/global_step": 1434, "train_info/time_within_train_step": 2.3613462448120117, "step": 1434} {"train_info/time_between_train_steps": 0.0029473304748535156, "step": 1434} {"info/global_step": 1435, "train_info/time_within_train_step": 2.3793702125549316, "step": 1435} {"train_info/time_between_train_steps": 0.002966165542602539, "step": 1435} {"info/global_step": 1436, "train_info/time_within_train_step": 2.3569390773773193, "step": 1436} {"train_info/time_between_train_steps": 0.0029306411743164062, "step": 1436} {"info/global_step": 1437, "train_info/time_within_train_step": 2.356032609939575, "step": 1437} {"train_info/time_between_train_steps": 0.002953767776489258, "step": 1437} {"info/global_step": 1438, "train_info/time_within_train_step": 2.3568310737609863, "step": 1438} {"train_info/time_between_train_steps": 0.002913951873779297, "step": 1438} {"info/global_step": 1439, "train_info/time_within_train_step": 2.35650372505188, "step": 1439} {"train_info/time_between_train_steps": 0.002958059310913086, "step": 1439} {"info/global_step": 1440, "train_info/time_within_train_step": 2.356482744216919, "step": 1440} {"train_info/time_between_train_steps": 0.0029518604278564453, "step": 1440} {"info/global_step": 1441, "train_info/time_within_train_step": 2.35688853263855, "step": 1441} {"train_info/time_between_train_steps": 0.0030214786529541016, "step": 1441} {"info/global_step": 1442, "train_info/time_within_train_step": 2.356975555419922, "step": 1442} {"train_info/time_between_train_steps": 0.002933025360107422, "step": 1442} {"info/global_step": 1443, "train_info/time_within_train_step": 2.548635244369507, "step": 1443} {"train_info/time_between_train_steps": 0.003039121627807617, "step": 1443} {"info/global_step": 1444, "train_info/time_within_train_step": 2.356403112411499, "step": 1444} {"train_info/time_between_train_steps": 0.002969980239868164, "step": 1444} {"info/global_step": 1445, "train_info/time_within_train_step": 2.3563215732574463, "step": 1445} {"train_info/time_between_train_steps": 0.003387451171875, "step": 1445} {"info/global_step": 1446, "train_info/time_within_train_step": 2.3563411235809326, "step": 1446} {"train_info/time_between_train_steps": 0.003081083297729492, "step": 1446} {"info/global_step": 1447, "train_info/time_within_train_step": 2.356971263885498, "step": 1447} {"train_info/time_between_train_steps": 0.003080606460571289, "step": 1447} {"info/global_step": 1448, "train_info/time_within_train_step": 2.3570735454559326, "step": 1448} {"train_info/time_between_train_steps": 0.0030670166015625, "step": 1448} {"info/global_step": 1449, "train_info/time_within_train_step": 2.3566508293151855, "step": 1449} {"train_info/time_between_train_steps": 0.003088235855102539, "step": 1449} {"info/global_step": 1450, "train_info/time_within_train_step": 2.356853485107422, "step": 1450} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 8708.0, "train_info/memory_max_reserved": 8708.0, "_timestamp": 1746255951, "_runtime": 3770}, "step": 1450} {"logs": {"train/loss": 4.0803, "train/learning_rate": 0.0003444444444444444, "train/epoch": 1.2, "_timestamp": 1746255951, "_runtime": 3770}, "step": 1450} {"train_info/time_between_train_steps": 0.024764299392700195, "step": 1450} {"info/global_step": 1451, "train_info/time_within_train_step": 2.3564035892486572, "step": 1451} {"train_info/time_between_train_steps": 0.0030679702758789062, "step": 1451} {"info/global_step": 1452, "train_info/time_within_train_step": 2.355954885482788, "step": 1452} {"train_info/time_between_train_steps": 0.003062009811401367, "step": 1452} {"info/global_step": 1453, "train_info/time_within_train_step": 2.3567652702331543, "step": 1453} {"train_info/time_between_train_steps": 0.0030286312103271484, "step": 1453} {"info/global_step": 1454, "train_info/time_within_train_step": 2.356326103210449, "step": 1454} {"train_info/time_between_train_steps": 0.003108501434326172, "step": 1454} {"info/global_step": 1455, "train_info/time_within_train_step": 2.3567872047424316, "step": 1455} {"train_info/time_between_train_steps": 0.003108501434326172, "step": 1455} {"info/global_step": 1456, "train_info/time_within_train_step": 2.3567521572113037, "step": 1456} {"train_info/time_between_train_steps": 0.0030803680419921875, "step": 1456} {"info/global_step": 1457, "train_info/time_within_train_step": 2.3570644855499268, "step": 1457} {"train_info/time_between_train_steps": 0.003040313720703125, "step": 1457} {"info/global_step": 1458, "train_info/time_within_train_step": 2.3566746711730957, "step": 1458} {"train_info/time_between_train_steps": 0.003121614456176758, "step": 1458} {"info/global_step": 1459, "train_info/time_within_train_step": 2.358430862426758, "step": 1459} {"train_info/time_between_train_steps": 0.00310516357421875, "step": 1459} {"info/global_step": 1460, "train_info/time_within_train_step": 2.356757164001465, "step": 1460} {"train_info/time_between_train_steps": 0.0030546188354492188, "step": 1460} {"info/global_step": 1461, "train_info/time_within_train_step": 2.3567140102386475, "step": 1461} {"train_info/time_between_train_steps": 0.003073453903198242, "step": 1461} {"info/global_step": 1462, "train_info/time_within_train_step": 2.3570053577423096, "step": 1462} {"train_info/time_between_train_steps": 0.003065824508666992, "step": 1462} {"info/global_step": 1463, "train_info/time_within_train_step": 2.3563952445983887, "step": 1463} {"train_info/time_between_train_steps": 0.0030477046966552734, "step": 1463} {"info/global_step": 1464, "train_info/time_within_train_step": 2.3556735515594482, "step": 1464} {"train_info/time_between_train_steps": 0.003091573715209961, "step": 1464} {"info/global_step": 1465, "train_info/time_within_train_step": 2.3571202754974365, "step": 1465} {"train_info/time_between_train_steps": 0.003088235855102539, "step": 1465} {"info/global_step": 1466, "train_info/time_within_train_step": 2.3575174808502197, "step": 1466} {"train_info/time_between_train_steps": 0.003056049346923828, "step": 1466} {"info/global_step": 1467, "train_info/time_within_train_step": 2.6124932765960693, "step": 1467} {"train_info/time_between_train_steps": 0.0029506683349609375, "step": 1467} {"info/global_step": 1468, "train_info/time_within_train_step": 2.355741262435913, "step": 1468} {"train_info/time_between_train_steps": 0.0029325485229492188, "step": 1468} {"info/global_step": 1469, "train_info/time_within_train_step": 2.3568356037139893, "step": 1469} {"train_info/time_between_train_steps": 0.00295257568359375, "step": 1469} {"info/global_step": 1470, "train_info/time_within_train_step": 2.357013702392578, "step": 1470} {"train_info/time_between_train_steps": 0.002995014190673828, "step": 1470} {"info/global_step": 1471, "train_info/time_within_train_step": 2.356637954711914, "step": 1471} {"train_info/time_between_train_steps": 0.002930164337158203, "step": 1471} {"info/global_step": 1472, "train_info/time_within_train_step": 2.3548264503479004, "step": 1472} {"train_info/time_between_train_steps": 0.002910137176513672, "step": 1472} {"info/global_step": 1473, "train_info/time_within_train_step": 2.356616735458374, "step": 1473} {"train_info/time_between_train_steps": 0.0028982162475585938, "step": 1473} {"info/global_step": 1474, "train_info/time_within_train_step": 2.3553194999694824, "step": 1474} {"train_info/time_between_train_steps": 0.0028960704803466797, "step": 1474} {"info/global_step": 1475, "train_info/time_within_train_step": 2.355513334274292, "step": 1475} {"train_info/time_between_train_steps": 0.0029134750366210938, "step": 1475} {"info/global_step": 1476, "train_info/time_within_train_step": 2.355982542037964, "step": 1476} {"train_info/time_between_train_steps": 0.0028972625732421875, "step": 1476} {"info/global_step": 1477, "train_info/time_within_train_step": 2.3555052280426025, "step": 1477} {"train_info/time_between_train_steps": 0.002966642379760742, "step": 1477} {"info/global_step": 1478, "train_info/time_within_train_step": 2.35575532913208, "step": 1478} {"train_info/time_between_train_steps": 0.0028896331787109375, "step": 1478} {"info/global_step": 1479, "train_info/time_within_train_step": 2.3564093112945557, "step": 1479} {"train_info/time_between_train_steps": 0.0029578208923339844, "step": 1479} {"info/global_step": 1480, "train_info/time_within_train_step": 2.3558943271636963, "step": 1480} {"train_info/time_between_train_steps": 0.0029463768005371094, "step": 1480} {"info/global_step": 1481, "train_info/time_within_train_step": 2.355433702468872, "step": 1481} {"train_info/time_between_train_steps": 0.002906322479248047, "step": 1481} {"info/global_step": 1482, "train_info/time_within_train_step": 2.3553617000579834, "step": 1482} {"train_info/time_between_train_steps": 0.0030045509338378906, "step": 1482} {"info/global_step": 1483, "train_info/time_within_train_step": 2.356257438659668, "step": 1483} {"train_info/time_between_train_steps": 0.0029256343841552734, "step": 1483} {"info/global_step": 1484, "train_info/time_within_train_step": 2.35646915435791, "step": 1484} {"train_info/time_between_train_steps": 0.0029196739196777344, "step": 1484} {"info/global_step": 1485, "train_info/time_within_train_step": 2.3550055027008057, "step": 1485} {"train_info/time_between_train_steps": 0.002889871597290039, "step": 1485} {"info/global_step": 1486, "train_info/time_within_train_step": 2.3562211990356445, "step": 1486} {"train_info/time_between_train_steps": 0.002946138381958008, "step": 1486} {"info/global_step": 1487, "train_info/time_within_train_step": 2.3565332889556885, "step": 1487} {"train_info/time_between_train_steps": 0.0028908252716064453, "step": 1487} {"info/global_step": 1488, "train_info/time_within_train_step": 2.356248140335083, "step": 1488} {"train_info/time_between_train_steps": 0.002949237823486328, "step": 1488} {"info/global_step": 1489, "train_info/time_within_train_step": 2.3568007946014404, "step": 1489} {"train_info/time_between_train_steps": 0.0029201507568359375, "step": 1489} {"info/global_step": 1490, "train_info/time_within_train_step": 2.3575260639190674, "step": 1490} {"train_info/time_between_train_steps": 0.002935647964477539, "step": 1490} {"info/global_step": 1491, "train_info/time_within_train_step": 2.355905055999756, "step": 1491} {"train_info/time_between_train_steps": 0.0029268264770507812, "step": 1491} {"info/global_step": 1492, "train_info/time_within_train_step": 2.4950106143951416, "step": 1492} {"train_info/time_between_train_steps": 0.0029172897338867188, "step": 1492} {"info/global_step": 1493, "train_info/time_within_train_step": 2.3550424575805664, "step": 1493} {"train_info/time_between_train_steps": 0.0029098987579345703, "step": 1493} {"info/global_step": 1494, "train_info/time_within_train_step": 2.3566701412200928, "step": 1494} {"train_info/time_between_train_steps": 0.0029518604278564453, "step": 1494} {"info/global_step": 1495, "train_info/time_within_train_step": 2.355532646179199, "step": 1495} {"train_info/time_between_train_steps": 0.0029382705688476562, "step": 1495} {"info/global_step": 1496, "train_info/time_within_train_step": 2.3563756942749023, "step": 1496} {"train_info/time_between_train_steps": 0.003049135208129883, "step": 1496} {"info/global_step": 1497, "train_info/time_within_train_step": 2.356527328491211, "step": 1497} {"train_info/time_between_train_steps": 0.0029404163360595703, "step": 1497} {"info/global_step": 1498, "train_info/time_within_train_step": 2.35707426071167, "step": 1498} {"train_info/time_between_train_steps": 0.0029091835021972656, "step": 1498} {"info/global_step": 1499, "train_info/time_within_train_step": 2.3566558361053467, "step": 1499} {"train_info/time_between_train_steps": 0.002900362014770508, "step": 1499} {"info/global_step": 1500, "train_info/time_within_train_step": 2.9141128063201904, "step": 1500} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 8708.0, "train_info/memory_max_reserved": 8708.0, "_timestamp": 1746256071, "_runtime": 3890}, "step": 1500} {"logs": {"train/loss": 4.0696, "train/learning_rate": 0.0003333333333333333, "train/epoch": 1.21, "_timestamp": 1746256071, "_runtime": 3890}, "step": 1500} {"train_info/time_between_train_steps": 15.88038682937622, "step": 1500} {"info/global_step": 1501, "train_info/time_within_train_step": 2.201638698577881, "step": 1501} {"train_info/time_between_train_steps": 0.0029039382934570312, "step": 1501} {"info/global_step": 1502, "train_info/time_within_train_step": 2.1825263500213623, "step": 1502} {"train_info/time_between_train_steps": 0.0029439926147460938, "step": 1502} {"info/global_step": 1503, "train_info/time_within_train_step": 2.243778705596924, "step": 1503} {"train_info/time_between_train_steps": 0.0029239654541015625, "step": 1503} {"info/global_step": 1504, "train_info/time_within_train_step": 2.3476462364196777, "step": 1504} {"train_info/time_between_train_steps": 0.002980947494506836, "step": 1504} {"info/global_step": 1505, "train_info/time_within_train_step": 2.3501009941101074, "step": 1505} {"train_info/time_between_train_steps": 0.00296783447265625, "step": 1505} {"info/global_step": 1506, "train_info/time_within_train_step": 2.353727340698242, "step": 1506} {"train_info/time_between_train_steps": 0.0028810501098632812, "step": 1506} {"info/global_step": 1507, "train_info/time_within_train_step": 2.3538644313812256, "step": 1507} {"train_info/time_between_train_steps": 0.0029299259185791016, "step": 1507} {"info/global_step": 1508, "train_info/time_within_train_step": 2.3543646335601807, "step": 1508} {"train_info/time_between_train_steps": 0.0028896331787109375, "step": 1508} {"info/global_step": 1509, "train_info/time_within_train_step": 2.355564832687378, "step": 1509} {"train_info/time_between_train_steps": 0.0029697418212890625, "step": 1509} {"info/global_step": 1510, "train_info/time_within_train_step": 2.355815887451172, "step": 1510} {"train_info/time_between_train_steps": 0.002925872802734375, "step": 1510} {"info/global_step": 1511, "train_info/time_within_train_step": 2.3558733463287354, "step": 1511} {"train_info/time_between_train_steps": 0.0029273033142089844, "step": 1511} {"info/global_step": 1512, "train_info/time_within_train_step": 2.3553125858306885, "step": 1512} {"train_info/time_between_train_steps": 0.0029189586639404297, "step": 1512} {"info/global_step": 1513, "train_info/time_within_train_step": 2.3563318252563477, "step": 1513} {"train_info/time_between_train_steps": 0.002884387969970703, "step": 1513} {"info/global_step": 1514, "train_info/time_within_train_step": 2.3554162979125977, "step": 1514} {"train_info/time_between_train_steps": 0.0029535293579101562, "step": 1514} {"info/global_step": 1515, "train_info/time_within_train_step": 2.3550686836242676, "step": 1515} {"train_info/time_between_train_steps": 0.002950906753540039, "step": 1515} {"info/global_step": 1516, "train_info/time_within_train_step": 2.3558757305145264, "step": 1516} {"train_info/time_between_train_steps": 0.0029473304748535156, "step": 1516} {"info/global_step": 1517, "train_info/time_within_train_step": 2.5082244873046875, "step": 1517} {"train_info/time_between_train_steps": 0.002946615219116211, "step": 1517} {"info/global_step": 1518, "train_info/time_within_train_step": 2.3549699783325195, "step": 1518} {"train_info/time_between_train_steps": 0.0029740333557128906, "step": 1518} {"info/global_step": 1519, "train_info/time_within_train_step": 2.35581111907959, "step": 1519} {"train_info/time_between_train_steps": 0.002918243408203125, "step": 1519} {"info/global_step": 1520, "train_info/time_within_train_step": 2.3547451496124268, "step": 1520} {"train_info/time_between_train_steps": 0.0029091835021972656, "step": 1520} {"info/global_step": 1521, "train_info/time_within_train_step": 2.3564860820770264, "step": 1521} {"train_info/time_between_train_steps": 0.002982616424560547, "step": 1521} {"info/global_step": 1522, "train_info/time_within_train_step": 2.3559160232543945, "step": 1522} {"train_info/time_between_train_steps": 0.0029196739196777344, "step": 1522} {"info/global_step": 1523, "train_info/time_within_train_step": 2.3556690216064453, "step": 1523} {"train_info/time_between_train_steps": 0.0029561519622802734, "step": 1523} {"info/global_step": 1524, "train_info/time_within_train_step": 2.3546512126922607, "step": 1524} {"train_info/time_between_train_steps": 0.0029480457305908203, "step": 1524} {"info/global_step": 1525, "train_info/time_within_train_step": 2.3553900718688965, "step": 1525} {"train_info/time_between_train_steps": 0.0028984546661376953, "step": 1525} {"info/global_step": 1526, "train_info/time_within_train_step": 2.3553946018218994, "step": 1526} {"train_info/time_between_train_steps": 0.002942800521850586, "step": 1526} {"info/global_step": 1527, "train_info/time_within_train_step": 2.355426788330078, "step": 1527} {"train_info/time_between_train_steps": 0.002927541732788086, "step": 1527} {"info/global_step": 1528, "train_info/time_within_train_step": 2.3568320274353027, "step": 1528} {"train_info/time_between_train_steps": 0.002929210662841797, "step": 1528} {"info/global_step": 1529, "train_info/time_within_train_step": 2.3553683757781982, "step": 1529} {"train_info/time_between_train_steps": 0.002943277359008789, "step": 1529} {"info/global_step": 1530, "train_info/time_within_train_step": 2.3549695014953613, "step": 1530} {"train_info/time_between_train_steps": 0.002922534942626953, "step": 1530} {"info/global_step": 1531, "train_info/time_within_train_step": 2.3564963340759277, "step": 1531} {"train_info/time_between_train_steps": 0.0028874874114990234, "step": 1531} {"info/global_step": 1532, "train_info/time_within_train_step": 2.3552887439727783, "step": 1532} {"train_info/time_between_train_steps": 0.002903461456298828, "step": 1532} {"info/global_step": 1533, "train_info/time_within_train_step": 2.3555819988250732, "step": 1533} {"train_info/time_between_train_steps": 0.0028939247131347656, "step": 1533} {"info/global_step": 1534, "train_info/time_within_train_step": 2.3551642894744873, "step": 1534} {"train_info/time_between_train_steps": 0.002916097640991211, "step": 1534} {"info/global_step": 1535, "train_info/time_within_train_step": 2.3559091091156006, "step": 1535} {"train_info/time_between_train_steps": 0.0029327869415283203, "step": 1535} {"info/global_step": 1536, "train_info/time_within_train_step": 2.356236457824707, "step": 1536} {"train_info/time_between_train_steps": 0.0029773712158203125, "step": 1536} {"info/global_step": 1537, "train_info/time_within_train_step": 2.354879856109619, "step": 1537} {"train_info/time_between_train_steps": 0.0029125213623046875, "step": 1537} {"info/global_step": 1538, "train_info/time_within_train_step": 2.3556764125823975, "step": 1538} {"train_info/time_between_train_steps": 0.00290679931640625, "step": 1538} {"info/global_step": 1539, "train_info/time_within_train_step": 2.3554513454437256, "step": 1539} {"train_info/time_between_train_steps": 0.0029006004333496094, "step": 1539} {"info/global_step": 1540, "train_info/time_within_train_step": 2.3560633659362793, "step": 1540} {"train_info/time_between_train_steps": 0.0029540061950683594, "step": 1540} {"info/global_step": 1541, "train_info/time_within_train_step": 2.4917163848876953, "step": 1541} {"train_info/time_between_train_steps": 0.0029320716857910156, "step": 1541} {"info/global_step": 1542, "train_info/time_within_train_step": 2.356158971786499, "step": 1542} {"train_info/time_between_train_steps": 0.0029234886169433594, "step": 1542} {"info/global_step": 1543, "train_info/time_within_train_step": 2.3552141189575195, "step": 1543} {"train_info/time_between_train_steps": 0.0028891563415527344, "step": 1543} {"info/global_step": 1544, "train_info/time_within_train_step": 2.354722023010254, "step": 1544} {"train_info/time_between_train_steps": 0.002875804901123047, "step": 1544} {"info/global_step": 1545, "train_info/time_within_train_step": 2.3539741039276123, "step": 1545} {"train_info/time_between_train_steps": 0.002925395965576172, "step": 1545} {"info/global_step": 1546, "train_info/time_within_train_step": 2.353961706161499, "step": 1546} {"train_info/time_between_train_steps": 0.002880573272705078, "step": 1546} {"info/global_step": 1547, "train_info/time_within_train_step": 2.3543858528137207, "step": 1547} {"train_info/time_between_train_steps": 0.0029637813568115234, "step": 1547} {"info/global_step": 1548, "train_info/time_within_train_step": 2.354529619216919, "step": 1548} {"train_info/time_between_train_steps": 0.0029456615447998047, "step": 1548} {"info/global_step": 1549, "train_info/time_within_train_step": 2.3547346591949463, "step": 1549} {"train_info/time_between_train_steps": 0.002897977828979492, "step": 1549} {"info/global_step": 1550, "train_info/time_within_train_step": 2.354710817337036, "step": 1550} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 8708.0, "train_info/memory_max_reserved": 8708.0, "_timestamp": 1746256205, "_runtime": 4024}, "step": 1550} {"logs": {"train/loss": 4.0473, "train/learning_rate": 0.0003222222222222222, "train/epoch": 1.23, "_timestamp": 1746256205, "_runtime": 4024}, "step": 1550} {"train_info/time_between_train_steps": 0.02375173568725586, "step": 1550} {"info/global_step": 1551, "train_info/time_within_train_step": 2.3544440269470215, "step": 1551} {"train_info/time_between_train_steps": 0.002913236618041992, "step": 1551} {"info/global_step": 1552, "train_info/time_within_train_step": 2.354565143585205, "step": 1552} {"train_info/time_between_train_steps": 0.0029048919677734375, "step": 1552} {"info/global_step": 1553, "train_info/time_within_train_step": 2.355464220046997, "step": 1553} {"train_info/time_between_train_steps": 0.002938508987426758, "step": 1553} {"info/global_step": 1554, "train_info/time_within_train_step": 2.3550987243652344, "step": 1554} {"train_info/time_between_train_steps": 0.002990245819091797, "step": 1554} {"info/global_step": 1555, "train_info/time_within_train_step": 2.35427188873291, "step": 1555} {"train_info/time_between_train_steps": 0.002907276153564453, "step": 1555} {"info/global_step": 1556, "train_info/time_within_train_step": 2.3552634716033936, "step": 1556} {"train_info/time_between_train_steps": 0.002887725830078125, "step": 1556} {"info/global_step": 1557, "train_info/time_within_train_step": 2.3543684482574463, "step": 1557} {"train_info/time_between_train_steps": 0.0029070377349853516, "step": 1557} {"info/global_step": 1558, "train_info/time_within_train_step": 2.355950117111206, "step": 1558} {"train_info/time_between_train_steps": 0.0028977394104003906, "step": 1558} {"info/global_step": 1559, "train_info/time_within_train_step": 2.355297565460205, "step": 1559} {"train_info/time_between_train_steps": 0.0029261112213134766, "step": 1559} {"info/global_step": 1560, "train_info/time_within_train_step": 2.353346586227417, "step": 1560} {"train_info/time_between_train_steps": 0.0029282569885253906, "step": 1560} {"info/global_step": 1561, "train_info/time_within_train_step": 2.355402708053589, "step": 1561} {"train_info/time_between_train_steps": 0.002954721450805664, "step": 1561} {"info/global_step": 1562, "train_info/time_within_train_step": 2.355567693710327, "step": 1562} {"train_info/time_between_train_steps": 0.0029137134552001953, "step": 1562} {"info/global_step": 1563, "train_info/time_within_train_step": 2.3540053367614746, "step": 1563} {"train_info/time_between_train_steps": 0.002907276153564453, "step": 1563} {"info/global_step": 1564, "train_info/time_within_train_step": 2.354421854019165, "step": 1564} {"train_info/time_between_train_steps": 0.002917051315307617, "step": 1564} {"info/global_step": 1565, "train_info/time_within_train_step": 2.4772825241088867, "step": 1565} {"train_info/time_between_train_steps": 0.002969026565551758, "step": 1565} {"info/global_step": 1566, "train_info/time_within_train_step": 2.3555452823638916, "step": 1566} {"train_info/time_between_train_steps": 0.0029714107513427734, "step": 1566} {"info/global_step": 1567, "train_info/time_within_train_step": 2.354762315750122, "step": 1567} {"train_info/time_between_train_steps": 0.0028922557830810547, "step": 1567} {"info/global_step": 1568, "train_info/time_within_train_step": 2.354912757873535, "step": 1568} {"train_info/time_between_train_steps": 0.002961874008178711, "step": 1568} {"info/global_step": 1569, "train_info/time_within_train_step": 2.353368043899536, "step": 1569} {"train_info/time_between_train_steps": 0.0029714107513427734, "step": 1569} {"info/global_step": 1570, "train_info/time_within_train_step": 2.354074716567993, "step": 1570} {"train_info/time_between_train_steps": 0.0029349327087402344, "step": 1570} {"info/global_step": 1571, "train_info/time_within_train_step": 2.3536593914031982, "step": 1571} {"train_info/time_between_train_steps": 0.0029518604278564453, "step": 1571} {"info/global_step": 1572, "train_info/time_within_train_step": 2.3543572425842285, "step": 1572} {"train_info/time_between_train_steps": 0.002933502197265625, "step": 1572} {"info/global_step": 1573, "train_info/time_within_train_step": 2.355180263519287, "step": 1573} {"train_info/time_between_train_steps": 0.0029697418212890625, "step": 1573} {"info/global_step": 1574, "train_info/time_within_train_step": 2.3544840812683105, "step": 1574} {"train_info/time_between_train_steps": 0.0029153823852539062, "step": 1574} {"info/global_step": 1575, "train_info/time_within_train_step": 2.353996753692627, "step": 1575} {"train_info/time_between_train_steps": 0.0029287338256835938, "step": 1575} {"info/global_step": 1576, "train_info/time_within_train_step": 2.354369878768921, "step": 1576} {"train_info/time_between_train_steps": 0.0029141902923583984, "step": 1576} {"info/global_step": 1577, "train_info/time_within_train_step": 2.353865146636963, "step": 1577} {"train_info/time_between_train_steps": 0.0029172897338867188, "step": 1577} {"info/global_step": 1578, "train_info/time_within_train_step": 2.3534257411956787, "step": 1578} {"train_info/time_between_train_steps": 0.002935647964477539, "step": 1578} {"info/global_step": 1579, "train_info/time_within_train_step": 2.3546557426452637, "step": 1579} {"train_info/time_between_train_steps": 0.0029897689819335938, "step": 1579} {"info/global_step": 1580, "train_info/time_within_train_step": 2.3538057804107666, "step": 1580} {"train_info/time_between_train_steps": 0.002886056900024414, "step": 1580} {"info/global_step": 1581, "train_info/time_within_train_step": 2.354538679122925, "step": 1581} {"train_info/time_between_train_steps": 0.0028831958770751953, "step": 1581} {"info/global_step": 1582, "train_info/time_within_train_step": 2.3535852432250977, "step": 1582} {"train_info/time_between_train_steps": 0.0029082298278808594, "step": 1582} {"info/global_step": 1583, "train_info/time_within_train_step": 2.3537964820861816, "step": 1583} {"train_info/time_between_train_steps": 0.00286865234375, "step": 1583} {"info/global_step": 1584, "train_info/time_within_train_step": 2.353726625442505, "step": 1584} {"train_info/time_between_train_steps": 0.0029020309448242188, "step": 1584} {"info/global_step": 1585, "train_info/time_within_train_step": 2.355034828186035, "step": 1585} {"train_info/time_between_train_steps": 0.002960681915283203, "step": 1585} {"info/global_step": 1586, "train_info/time_within_train_step": 2.354123592376709, "step": 1586} {"train_info/time_between_train_steps": 0.002988100051879883, "step": 1586} {"info/global_step": 1587, "train_info/time_within_train_step": 2.3550870418548584, "step": 1587} {"train_info/time_between_train_steps": 0.002892017364501953, "step": 1587} {"info/global_step": 1588, "train_info/time_within_train_step": 2.354464530944824, "step": 1588} {"train_info/time_between_train_steps": 0.0028901100158691406, "step": 1588} {"info/global_step": 1589, "train_info/time_within_train_step": 2.4627585411071777, "step": 1589} {"train_info/time_between_train_steps": 0.0029077529907226562, "step": 1589} {"info/global_step": 1590, "train_info/time_within_train_step": 2.3532209396362305, "step": 1590} {"train_info/time_between_train_steps": 0.0029065608978271484, "step": 1590} {"info/global_step": 1591, "train_info/time_within_train_step": 2.353531837463379, "step": 1591} {"train_info/time_between_train_steps": 0.0029404163360595703, "step": 1591} {"info/global_step": 1592, "train_info/time_within_train_step": 2.3549253940582275, "step": 1592} {"train_info/time_between_train_steps": 0.0029277801513671875, "step": 1592} {"info/global_step": 1593, "train_info/time_within_train_step": 2.353243350982666, "step": 1593} {"train_info/time_between_train_steps": 0.002910137176513672, "step": 1593} {"info/global_step": 1594, "train_info/time_within_train_step": 2.3543903827667236, "step": 1594} {"train_info/time_between_train_steps": 0.0029168128967285156, "step": 1594} {"info/global_step": 1595, "train_info/time_within_train_step": 2.354126214981079, "step": 1595} {"train_info/time_between_train_steps": 0.002899646759033203, "step": 1595} {"info/global_step": 1596, "train_info/time_within_train_step": 2.3543412685394287, "step": 1596} {"train_info/time_between_train_steps": 0.002888917922973633, "step": 1596} {"info/global_step": 1597, "train_info/time_within_train_step": 2.3532745838165283, "step": 1597} {"train_info/time_between_train_steps": 0.0029382705688476562, "step": 1597} {"info/global_step": 1598, "train_info/time_within_train_step": 2.3544952869415283, "step": 1598} {"train_info/time_between_train_steps": 0.0029332637786865234, "step": 1598} {"info/global_step": 1599, "train_info/time_within_train_step": 2.35469913482666, "step": 1599} {"train_info/time_between_train_steps": 0.0029158592224121094, "step": 1599} {"info/global_step": 1600, "train_info/time_within_train_step": 2.354247808456421, "step": 1600} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 8708.0, "train_info/memory_max_reserved": 8708.0, "_timestamp": 1746256324, "_runtime": 4143}, "step": 1600} {"logs": {"train/loss": 4.0176, "train/learning_rate": 0.00031111111111111107, "train/epoch": 1.25, "_timestamp": 1746256324, "_runtime": 4143}, "step": 1600} {"train_info/time_between_train_steps": 15.709091901779175, "step": 1600} {"info/global_step": 1601, "train_info/time_within_train_step": 2.201004981994629, "step": 1601} {"train_info/time_between_train_steps": 0.0029251575469970703, "step": 1601} {"info/global_step": 1602, "train_info/time_within_train_step": 2.1826884746551514, "step": 1602} {"train_info/time_between_train_steps": 0.0028946399688720703, "step": 1602} {"info/global_step": 1603, "train_info/time_within_train_step": 2.2661170959472656, "step": 1603} {"train_info/time_between_train_steps": 0.002889394760131836, "step": 1603} {"info/global_step": 1604, "train_info/time_within_train_step": 2.3476061820983887, "step": 1604} {"train_info/time_between_train_steps": 0.0029325485229492188, "step": 1604} {"info/global_step": 1605, "train_info/time_within_train_step": 2.351076126098633, "step": 1605} {"train_info/time_between_train_steps": 0.0029001235961914062, "step": 1605} {"info/global_step": 1606, "train_info/time_within_train_step": 2.353738307952881, "step": 1606} {"train_info/time_between_train_steps": 0.00289154052734375, "step": 1606} {"info/global_step": 1607, "train_info/time_within_train_step": 2.3533434867858887, "step": 1607} {"train_info/time_between_train_steps": 0.0029447078704833984, "step": 1607} {"info/global_step": 1608, "train_info/time_within_train_step": 2.3534626960754395, "step": 1608} {"train_info/time_between_train_steps": 0.0029227733612060547, "step": 1608} {"info/global_step": 1609, "train_info/time_within_train_step": 2.354327917098999, "step": 1609} {"train_info/time_between_train_steps": 0.0028791427612304688, "step": 1609} {"info/global_step": 1610, "train_info/time_within_train_step": 2.3544442653656006, "step": 1610} {"train_info/time_between_train_steps": 0.002942800521850586, "step": 1610} {"info/global_step": 1611, "train_info/time_within_train_step": 2.3543922901153564, "step": 1611} {"train_info/time_between_train_steps": 0.002978086471557617, "step": 1611} {"info/global_step": 1612, "train_info/time_within_train_step": 2.417203664779663, "step": 1612} {"train_info/time_between_train_steps": 0.0029611587524414062, "step": 1612} {"info/global_step": 1613, "train_info/time_within_train_step": 2.354645013809204, "step": 1613} {"train_info/time_between_train_steps": 0.002894163131713867, "step": 1613} {"info/global_step": 1614, "train_info/time_within_train_step": 2.3550338745117188, "step": 1614} {"train_info/time_between_train_steps": 0.0029115676879882812, "step": 1614} {"info/global_step": 1615, "train_info/time_within_train_step": 2.3551950454711914, "step": 1615} {"train_info/time_between_train_steps": 0.0029630661010742188, "step": 1615} {"info/global_step": 1616, "train_info/time_within_train_step": 2.3544890880584717, "step": 1616} {"train_info/time_between_train_steps": 0.002902507781982422, "step": 1616} {"info/global_step": 1617, "train_info/time_within_train_step": 2.355369806289673, "step": 1617} {"train_info/time_between_train_steps": 0.0028977394104003906, "step": 1617} {"info/global_step": 1618, "train_info/time_within_train_step": 2.3552134037017822, "step": 1618} {"train_info/time_between_train_steps": 0.0028977394104003906, "step": 1618} {"info/global_step": 1619, "train_info/time_within_train_step": 2.3548123836517334, "step": 1619} {"train_info/time_between_train_steps": 0.0028934478759765625, "step": 1619} {"info/global_step": 1620, "train_info/time_within_train_step": 2.3557348251342773, "step": 1620} {"train_info/time_between_train_steps": 0.0029757022857666016, "step": 1620} {"info/global_step": 1621, "train_info/time_within_train_step": 2.354193687438965, "step": 1621} {"train_info/time_between_train_steps": 0.002908945083618164, "step": 1621} {"info/global_step": 1622, "train_info/time_within_train_step": 2.354973554611206, "step": 1622} {"train_info/time_between_train_steps": 0.0028998851776123047, "step": 1622} {"info/global_step": 1623, "train_info/time_within_train_step": 2.3594913482666016, "step": 1623} {"train_info/time_between_train_steps": 0.0029015541076660156, "step": 1623} {"info/global_step": 1624, "train_info/time_within_train_step": 2.355482339859009, "step": 1624} {"train_info/time_between_train_steps": 0.0029659271240234375, "step": 1624} {"info/global_step": 1625, "train_info/time_within_train_step": 2.3543033599853516, "step": 1625} {"train_info/time_between_train_steps": 0.002949953079223633, "step": 1625} {"info/global_step": 1626, "train_info/time_within_train_step": 2.354555606842041, "step": 1626} {"train_info/time_between_train_steps": 0.002935171127319336, "step": 1626} {"info/global_step": 1627, "train_info/time_within_train_step": 2.3555283546447754, "step": 1627} {"train_info/time_between_train_steps": 0.0029659271240234375, "step": 1627} {"info/global_step": 1628, "train_info/time_within_train_step": 2.3549137115478516, "step": 1628} {"train_info/time_between_train_steps": 0.0029218196868896484, "step": 1628} {"info/global_step": 1629, "train_info/time_within_train_step": 2.354278087615967, "step": 1629} {"train_info/time_between_train_steps": 0.002905607223510742, "step": 1629} {"info/global_step": 1630, "train_info/time_within_train_step": 2.3558645248413086, "step": 1630} {"train_info/time_between_train_steps": 0.0029370784759521484, "step": 1630} {"info/global_step": 1631, "train_info/time_within_train_step": 2.3554651737213135, "step": 1631} {"train_info/time_between_train_steps": 0.002942323684692383, "step": 1631} {"info/global_step": 1632, "train_info/time_within_train_step": 2.355222463607788, "step": 1632} {"train_info/time_between_train_steps": 0.0029108524322509766, "step": 1632} {"info/global_step": 1633, "train_info/time_within_train_step": 2.354149580001831, "step": 1633} {"train_info/time_between_train_steps": 0.0029587745666503906, "step": 1633} {"info/global_step": 1634, "train_info/time_within_train_step": 2.353565216064453, "step": 1634} {"train_info/time_between_train_steps": 0.002925395965576172, "step": 1634} {"info/global_step": 1635, "train_info/time_within_train_step": 2.354578971862793, "step": 1635} {"train_info/time_between_train_steps": 0.0029630661010742188, "step": 1635} {"info/global_step": 1636, "train_info/time_within_train_step": 2.4356603622436523, "step": 1636} {"train_info/time_between_train_steps": 0.0029244422912597656, "step": 1636} {"info/global_step": 1637, "train_info/time_within_train_step": 2.3542773723602295, "step": 1637} {"train_info/time_between_train_steps": 0.0029175281524658203, "step": 1637} {"info/global_step": 1638, "train_info/time_within_train_step": 2.354349136352539, "step": 1638} {"train_info/time_between_train_steps": 0.002938508987426758, "step": 1638} {"info/global_step": 1639, "train_info/time_within_train_step": 2.355095624923706, "step": 1639} {"train_info/time_between_train_steps": 0.0029532909393310547, "step": 1639} {"info/global_step": 1640, "train_info/time_within_train_step": 2.354642868041992, "step": 1640} {"train_info/time_between_train_steps": 0.002897024154663086, "step": 1640} {"info/global_step": 1641, "train_info/time_within_train_step": 2.3548545837402344, "step": 1641} {"train_info/time_between_train_steps": 0.002894878387451172, "step": 1641} {"info/global_step": 1642, "train_info/time_within_train_step": 2.3538155555725098, "step": 1642} {"train_info/time_between_train_steps": 0.002886056900024414, "step": 1642} {"info/global_step": 1643, "train_info/time_within_train_step": 2.3534958362579346, "step": 1643} {"train_info/time_between_train_steps": 0.0029473304748535156, "step": 1643} {"info/global_step": 1644, "train_info/time_within_train_step": 2.353301525115967, "step": 1644} {"train_info/time_between_train_steps": 0.0029261112213134766, "step": 1644} {"info/global_step": 1645, "train_info/time_within_train_step": 2.353827476501465, "step": 1645} {"train_info/time_between_train_steps": 0.002892732620239258, "step": 1645} {"info/global_step": 1646, "train_info/time_within_train_step": 2.35422682762146, "step": 1646} {"train_info/time_between_train_steps": 0.0028934478759765625, "step": 1646} {"info/global_step": 1647, "train_info/time_within_train_step": 2.3546864986419678, "step": 1647} {"train_info/time_between_train_steps": 0.002932310104370117, "step": 1647} {"info/global_step": 1648, "train_info/time_within_train_step": 2.3537368774414062, "step": 1648} {"train_info/time_between_train_steps": 0.0029230117797851562, "step": 1648} {"info/global_step": 1649, "train_info/time_within_train_step": 2.3539187908172607, "step": 1649} {"train_info/time_between_train_steps": 0.002887725830078125, "step": 1649} {"info/global_step": 1650, "train_info/time_within_train_step": 2.354811429977417, "step": 1650} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 8708.0, "train_info/memory_max_reserved": 8708.0, "_timestamp": 1746256459, "_runtime": 4278}, "step": 1650} {"logs": {"train/loss": 4.0049, "train/learning_rate": 0.0003, "train/epoch": 1.26, "_timestamp": 1746256459, "_runtime": 4278}, "step": 1650} {"train_info/time_between_train_steps": 0.024446725845336914, "step": 1650} {"info/global_step": 1651, "train_info/time_within_train_step": 2.3552122116088867, "step": 1651} {"train_info/time_between_train_steps": 0.002898693084716797, "step": 1651} {"info/global_step": 1652, "train_info/time_within_train_step": 2.3546977043151855, "step": 1652} {"train_info/time_between_train_steps": 0.0029506683349609375, "step": 1652} {"info/global_step": 1653, "train_info/time_within_train_step": 2.3543286323547363, "step": 1653} {"train_info/time_between_train_steps": 0.003477334976196289, "step": 1653} {"info/global_step": 1654, "train_info/time_within_train_step": 2.3548247814178467, "step": 1654} {"train_info/time_between_train_steps": 0.0029120445251464844, "step": 1654} {"info/global_step": 1655, "train_info/time_within_train_step": 2.354279041290283, "step": 1655} {"train_info/time_between_train_steps": 0.0029158592224121094, "step": 1655} {"info/global_step": 1656, "train_info/time_within_train_step": 2.3540608882904053, "step": 1656} {"train_info/time_between_train_steps": 0.002899169921875, "step": 1656} {"info/global_step": 1657, "train_info/time_within_train_step": 2.3545711040496826, "step": 1657} {"train_info/time_between_train_steps": 0.002899646759033203, "step": 1657} {"info/global_step": 1658, "train_info/time_within_train_step": 2.3556582927703857, "step": 1658} {"train_info/time_between_train_steps": 0.00292205810546875, "step": 1658} {"info/global_step": 1659, "train_info/time_within_train_step": 2.419567108154297, "step": 1659} {"train_info/time_between_train_steps": 0.0029268264770507812, "step": 1659} {"info/global_step": 1660, "train_info/time_within_train_step": 2.3544368743896484, "step": 1660} {"train_info/time_between_train_steps": 0.0029451847076416016, "step": 1660} {"info/global_step": 1661, "train_info/time_within_train_step": 2.3545777797698975, "step": 1661} {"train_info/time_between_train_steps": 0.0029137134552001953, "step": 1661} {"info/global_step": 1662, "train_info/time_within_train_step": 2.352750778198242, "step": 1662} {"train_info/time_between_train_steps": 0.002910614013671875, "step": 1662} {"info/global_step": 1663, "train_info/time_within_train_step": 2.3542730808258057, "step": 1663} {"train_info/time_between_train_steps": 0.002897977828979492, "step": 1663} {"info/global_step": 1664, "train_info/time_within_train_step": 2.3539323806762695, "step": 1664} {"train_info/time_between_train_steps": 0.0028922557830810547, "step": 1664} {"info/global_step": 1665, "train_info/time_within_train_step": 2.3531858921051025, "step": 1665} {"train_info/time_between_train_steps": 0.0029535293579101562, "step": 1665} {"info/global_step": 1666, "train_info/time_within_train_step": 2.3536176681518555, "step": 1666} {"train_info/time_between_train_steps": 0.0029129981994628906, "step": 1666} {"info/global_step": 1667, "train_info/time_within_train_step": 2.3533315658569336, "step": 1667} {"train_info/time_between_train_steps": 0.0029494762420654297, "step": 1667} {"info/global_step": 1668, "train_info/time_within_train_step": 2.353938579559326, "step": 1668} {"train_info/time_between_train_steps": 0.0028786659240722656, "step": 1668} {"info/global_step": 1669, "train_info/time_within_train_step": 2.355318546295166, "step": 1669} {"train_info/time_between_train_steps": 0.0028982162475585938, "step": 1669} {"info/global_step": 1670, "train_info/time_within_train_step": 2.355081558227539, "step": 1670} {"train_info/time_between_train_steps": 0.002901315689086914, "step": 1670} {"info/global_step": 1671, "train_info/time_within_train_step": 2.3547213077545166, "step": 1671} {"train_info/time_between_train_steps": 0.0029404163360595703, "step": 1671} {"info/global_step": 1672, "train_info/time_within_train_step": 2.353670597076416, "step": 1672} {"train_info/time_between_train_steps": 0.0029289722442626953, "step": 1672} {"info/global_step": 1673, "train_info/time_within_train_step": 2.354886293411255, "step": 1673} {"train_info/time_between_train_steps": 0.0029659271240234375, "step": 1673} {"info/global_step": 1674, "train_info/time_within_train_step": 2.3545897006988525, "step": 1674} {"train_info/time_between_train_steps": 0.0028989315032958984, "step": 1674} {"info/global_step": 1675, "train_info/time_within_train_step": 2.355224847793579, "step": 1675} {"train_info/time_between_train_steps": 0.002929210662841797, "step": 1675} {"info/global_step": 1676, "train_info/time_within_train_step": 2.3539838790893555, "step": 1676} {"train_info/time_between_train_steps": 0.002964019775390625, "step": 1676} {"info/global_step": 1677, "train_info/time_within_train_step": 2.3549892902374268, "step": 1677} {"train_info/time_between_train_steps": 0.002927541732788086, "step": 1677} {"info/global_step": 1678, "train_info/time_within_train_step": 2.355363368988037, "step": 1678} {"train_info/time_between_train_steps": 0.0029714107513427734, "step": 1678} {"info/global_step": 1679, "train_info/time_within_train_step": 2.3546462059020996, "step": 1679} {"train_info/time_between_train_steps": 0.002907991409301758, "step": 1679} {"info/global_step": 1680, "train_info/time_within_train_step": 2.3544349670410156, "step": 1680} {"train_info/time_between_train_steps": 0.0029120445251464844, "step": 1680} {"info/global_step": 1681, "train_info/time_within_train_step": 2.404726028442383, "step": 1681} {"train_info/time_between_train_steps": 0.003479480743408203, "step": 1681} {"info/global_step": 1682, "train_info/time_within_train_step": 2.3534603118896484, "step": 1682} {"train_info/time_between_train_steps": 0.0028908252716064453, "step": 1682} {"info/global_step": 1683, "train_info/time_within_train_step": 2.3544576168060303, "step": 1683} {"train_info/time_between_train_steps": 0.0029578208923339844, "step": 1683} {"info/global_step": 1684, "train_info/time_within_train_step": 2.354001045227051, "step": 1684} {"train_info/time_between_train_steps": 0.0030138492584228516, "step": 1684} {"info/global_step": 1685, "train_info/time_within_train_step": 2.3544862270355225, "step": 1685} {"train_info/time_between_train_steps": 0.002970457077026367, "step": 1685} {"info/global_step": 1686, "train_info/time_within_train_step": 2.353800058364868, "step": 1686} {"train_info/time_between_train_steps": 0.0029261112213134766, "step": 1686} {"info/global_step": 1687, "train_info/time_within_train_step": 2.3536813259124756, "step": 1687} {"train_info/time_between_train_steps": 0.0029494762420654297, "step": 1687} {"info/global_step": 1688, "train_info/time_within_train_step": 2.3550851345062256, "step": 1688} {"train_info/time_between_train_steps": 0.0030126571655273438, "step": 1688} {"info/global_step": 1689, "train_info/time_within_train_step": 2.3533551692962646, "step": 1689} {"train_info/time_between_train_steps": 0.0029633045196533203, "step": 1689} {"info/global_step": 1690, "train_info/time_within_train_step": 2.3552958965301514, "step": 1690} {"train_info/time_between_train_steps": 0.003008127212524414, "step": 1690} {"info/global_step": 1691, "train_info/time_within_train_step": 2.3537724018096924, "step": 1691} {"train_info/time_between_train_steps": 0.0029854774475097656, "step": 1691} {"info/global_step": 1692, "train_info/time_within_train_step": 2.3544106483459473, "step": 1692} {"train_info/time_between_train_steps": 0.002979278564453125, "step": 1692} {"info/global_step": 1693, "train_info/time_within_train_step": 2.3541934490203857, "step": 1693} {"train_info/time_between_train_steps": 0.002895355224609375, "step": 1693} {"info/global_step": 1694, "train_info/time_within_train_step": 2.353532552719116, "step": 1694} {"train_info/time_between_train_steps": 0.002961397171020508, "step": 1694} {"info/global_step": 1695, "train_info/time_within_train_step": 2.354107141494751, "step": 1695} {"train_info/time_between_train_steps": 0.002927541732788086, "step": 1695} {"info/global_step": 1696, "train_info/time_within_train_step": 2.3539953231811523, "step": 1696} {"train_info/time_between_train_steps": 0.0030639171600341797, "step": 1696} {"info/global_step": 1697, "train_info/time_within_train_step": 2.3541622161865234, "step": 1697} {"train_info/time_between_train_steps": 0.003142833709716797, "step": 1697} {"info/global_step": 1698, "train_info/time_within_train_step": 2.356112480163574, "step": 1698} {"train_info/time_between_train_steps": 0.0031957626342773438, "step": 1698} {"info/global_step": 1699, "train_info/time_within_train_step": 2.355463743209839, "step": 1699} {"train_info/time_between_train_steps": 0.0031652450561523438, "step": 1699} {"info/global_step": 1700, "train_info/time_within_train_step": 2.3555338382720947, "step": 1700} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 8708.0, "train_info/memory_max_reserved": 8708.0, "_timestamp": 1746256578, "_runtime": 4397}, "step": 1700} {"logs": {"train/loss": 3.9955, "train/learning_rate": 0.0002888888888888888, "train/epoch": 1.28, "_timestamp": 1746256578, "_runtime": 4397}, "step": 1700} {"train_info/time_between_train_steps": 13.234841585159302, "step": 1700} {"info/global_step": 1701, "train_info/time_within_train_step": 2.1931710243225098, "step": 1701} {"train_info/time_between_train_steps": 0.0030870437622070312, "step": 1701} {"info/global_step": 1702, "train_info/time_within_train_step": 2.1856179237365723, "step": 1702} {"train_info/time_between_train_steps": 0.003166675567626953, "step": 1702} {"info/global_step": 1703, "train_info/time_within_train_step": 2.3471453189849854, "step": 1703} {"train_info/time_between_train_steps": 0.003143310546875, "step": 1703} {"info/global_step": 1704, "train_info/time_within_train_step": 2.350095510482788, "step": 1704} {"train_info/time_between_train_steps": 0.003316164016723633, "step": 1704} {"info/global_step": 1705, "train_info/time_within_train_step": 2.3543903827667236, "step": 1705} {"train_info/time_between_train_steps": 0.0031554698944091797, "step": 1705} {"info/global_step": 1706, "train_info/time_within_train_step": 2.3564834594726562, "step": 1706} {"train_info/time_between_train_steps": 0.003116130828857422, "step": 1706} {"info/global_step": 1707, "train_info/time_within_train_step": 2.355912685394287, "step": 1707} {"train_info/time_between_train_steps": 0.003386974334716797, "step": 1707} {"info/global_step": 1708, "train_info/time_within_train_step": 2.357046604156494, "step": 1708} {"train_info/time_between_train_steps": 0.0033097267150878906, "step": 1708} {"info/global_step": 1709, "train_info/time_within_train_step": 2.3564887046813965, "step": 1709} {"train_info/time_between_train_steps": 0.003233671188354492, "step": 1709} {"info/global_step": 1710, "train_info/time_within_train_step": 2.355815887451172, "step": 1710} {"train_info/time_between_train_steps": 0.0032477378845214844, "step": 1710} {"info/global_step": 1711, "train_info/time_within_train_step": 2.3570542335510254, "step": 1711} {"train_info/time_between_train_steps": 0.003245115280151367, "step": 1711} {"info/global_step": 1712, "train_info/time_within_train_step": 2.390822410583496, "step": 1712} {"train_info/time_between_train_steps": 0.0034546852111816406, "step": 1712} {"info/global_step": 1713, "train_info/time_within_train_step": 2.3577091693878174, "step": 1713} {"train_info/time_between_train_steps": 0.003644704818725586, "step": 1713} {"info/global_step": 1714, "train_info/time_within_train_step": 2.3583321571350098, "step": 1714} {"train_info/time_between_train_steps": 0.0036344528198242188, "step": 1714} {"info/global_step": 1715, "train_info/time_within_train_step": 2.357381820678711, "step": 1715} {"train_info/time_between_train_steps": 0.003376007080078125, "step": 1715} {"info/global_step": 1716, "train_info/time_within_train_step": 2.3583974838256836, "step": 1716} {"train_info/time_between_train_steps": 0.0034368038177490234, "step": 1716} {"info/global_step": 1717, "train_info/time_within_train_step": 2.359210252761841, "step": 1717} {"train_info/time_between_train_steps": 0.003800630569458008, "step": 1717} {"info/global_step": 1718, "train_info/time_within_train_step": 2.358673334121704, "step": 1718} {"train_info/time_between_train_steps": 0.0035452842712402344, "step": 1718} {"info/global_step": 1719, "train_info/time_within_train_step": 2.359548330307007, "step": 1719} {"train_info/time_between_train_steps": 0.0038907527923583984, "step": 1719} {"info/global_step": 1720, "train_info/time_within_train_step": 2.3598146438598633, "step": 1720} {"train_info/time_between_train_steps": 0.0038881301879882812, "step": 1720} {"train_info/time_between_train_steps": 2.712829828262329, "step": 1720} {"info/global_step": 1721, "train_info/time_within_train_step": 2.373026132583618, "step": 1721} {"train_info/time_between_train_steps": 0.003134489059448242, "step": 1721} {"info/global_step": 1722, "train_info/time_within_train_step": 2.3569953441619873, "step": 1722} {"train_info/time_between_train_steps": 0.0031223297119140625, "step": 1722} {"info/global_step": 1723, "train_info/time_within_train_step": 2.356720447540283, "step": 1723} {"train_info/time_between_train_steps": 0.003116130828857422, "step": 1723} {"info/global_step": 1724, "train_info/time_within_train_step": 2.3572285175323486, "step": 1724} {"train_info/time_between_train_steps": 0.003179311752319336, "step": 1724} {"info/global_step": 1725, "train_info/time_within_train_step": 2.357151985168457, "step": 1725} {"train_info/time_between_train_steps": 0.0031461715698242188, "step": 1725} {"info/global_step": 1726, "train_info/time_within_train_step": 2.3572871685028076, "step": 1726} {"train_info/time_between_train_steps": 0.0031518936157226562, "step": 1726} {"info/global_step": 1727, "train_info/time_within_train_step": 2.357980728149414, "step": 1727} {"train_info/time_between_train_steps": 0.0031270980834960938, "step": 1727} {"info/global_step": 1728, "train_info/time_within_train_step": 2.3580029010772705, "step": 1728} {"train_info/time_between_train_steps": 0.0031762123107910156, "step": 1728} {"info/global_step": 1729, "train_info/time_within_train_step": 2.357883930206299, "step": 1729} {"train_info/time_between_train_steps": 0.0031244754791259766, "step": 1729} {"info/global_step": 1730, "train_info/time_within_train_step": 2.3578972816467285, "step": 1730} {"train_info/time_between_train_steps": 0.0031278133392333984, "step": 1730} {"info/global_step": 1731, "train_info/time_within_train_step": 2.3580591678619385, "step": 1731} {"train_info/time_between_train_steps": 0.0031585693359375, "step": 1731} {"info/global_step": 1732, "train_info/time_within_train_step": 2.5168755054473877, "step": 1732} {"train_info/time_between_train_steps": 0.0031900405883789062, "step": 1732} {"info/global_step": 1733, "train_info/time_within_train_step": 2.3586840629577637, "step": 1733} {"train_info/time_between_train_steps": 0.0031414031982421875, "step": 1733} {"info/global_step": 1734, "train_info/time_within_train_step": 2.357700824737549, "step": 1734} {"train_info/time_between_train_steps": 0.0031197071075439453, "step": 1734} {"info/global_step": 1735, "train_info/time_within_train_step": 2.3586208820343018, "step": 1735} {"train_info/time_between_train_steps": 0.003129243850708008, "step": 1735} {"info/global_step": 1736, "train_info/time_within_train_step": 2.3895349502563477, "step": 1736} {"train_info/time_between_train_steps": 0.0032379627227783203, "step": 1736} {"info/global_step": 1737, "train_info/time_within_train_step": 2.3572514057159424, "step": 1737} {"train_info/time_between_train_steps": 0.003191709518432617, "step": 1737} {"info/global_step": 1738, "train_info/time_within_train_step": 2.3582677841186523, "step": 1738} {"train_info/time_between_train_steps": 0.0031533241271972656, "step": 1738} {"info/global_step": 1739, "train_info/time_within_train_step": 2.3573226928710938, "step": 1739} {"train_info/time_between_train_steps": 0.0031621456146240234, "step": 1739} {"info/global_step": 1740, "train_info/time_within_train_step": 2.3584439754486084, "step": 1740} {"train_info/time_between_train_steps": 0.003117799758911133, "step": 1740} {"info/global_step": 1741, "train_info/time_within_train_step": 2.357455015182495, "step": 1741} {"train_info/time_between_train_steps": 0.0031299591064453125, "step": 1741} {"info/global_step": 1742, "train_info/time_within_train_step": 2.3580973148345947, "step": 1742} {"train_info/time_between_train_steps": 0.0031168460845947266, "step": 1742} {"info/global_step": 1743, "train_info/time_within_train_step": 2.3570594787597656, "step": 1743} {"train_info/time_between_train_steps": 0.0031604766845703125, "step": 1743} {"info/global_step": 1744, "train_info/time_within_train_step": 2.357969284057617, "step": 1744} {"train_info/time_between_train_steps": 0.0031468868255615234, "step": 1744} {"info/global_step": 1745, "train_info/time_within_train_step": 2.3574585914611816, "step": 1745} {"train_info/time_between_train_steps": 0.0031173229217529297, "step": 1745} {"info/global_step": 1746, "train_info/time_within_train_step": 2.3562369346618652, "step": 1746} {"train_info/time_between_train_steps": 0.0031371116638183594, "step": 1746} {"info/global_step": 1747, "train_info/time_within_train_step": 2.3564648628234863, "step": 1747} {"train_info/time_between_train_steps": 0.003127574920654297, "step": 1747} {"info/global_step": 1748, "train_info/time_within_train_step": 2.356844186782837, "step": 1748} {"train_info/time_between_train_steps": 0.003116607666015625, "step": 1748} {"info/global_step": 1749, "train_info/time_within_train_step": 2.919372797012329, "step": 1749} {"train_info/time_between_train_steps": 0.0031747817993164062, "step": 1749} {"info/global_step": 1750, "train_info/time_within_train_step": 2.357084035873413, "step": 1750} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 8708.0, "train_info/memory_max_reserved": 8708.0, "_timestamp": 1746256713, "_runtime": 4532}, "step": 1750} {"logs": {"train/loss": 4.0151, "train/learning_rate": 0.0002777777777777778, "train/epoch": 2.01, "_timestamp": 1746256713, "_runtime": 4532}, "step": 1750} {"train_info/time_between_train_steps": 0.02432417869567871, "step": 1750} {"info/global_step": 1751, "train_info/time_within_train_step": 2.3578622341156006, "step": 1751} {"train_info/time_between_train_steps": 0.0031108856201171875, "step": 1751} {"info/global_step": 1752, "train_info/time_within_train_step": 2.358444929122925, "step": 1752} {"train_info/time_between_train_steps": 0.0030908584594726562, "step": 1752} {"info/global_step": 1753, "train_info/time_within_train_step": 2.3576395511627197, "step": 1753} {"train_info/time_between_train_steps": 0.0030939579010009766, "step": 1753} {"info/global_step": 1754, "train_info/time_within_train_step": 2.3578097820281982, "step": 1754} {"train_info/time_between_train_steps": 0.003159046173095703, "step": 1754} {"info/global_step": 1755, "train_info/time_within_train_step": 2.3574280738830566, "step": 1755} {"train_info/time_between_train_steps": 0.003206014633178711, "step": 1755} {"info/global_step": 1756, "train_info/time_within_train_step": 2.3568270206451416, "step": 1756} {"train_info/time_between_train_steps": 0.003131389617919922, "step": 1756} {"info/global_step": 1757, "train_info/time_within_train_step": 2.3567686080932617, "step": 1757} {"train_info/time_between_train_steps": 0.003117799758911133, "step": 1757} {"info/global_step": 1758, "train_info/time_within_train_step": 2.5493338108062744, "step": 1758} {"train_info/time_between_train_steps": 0.003134012222290039, "step": 1758} {"info/global_step": 1759, "train_info/time_within_train_step": 2.3565752506256104, "step": 1759} {"train_info/time_between_train_steps": 0.003655672073364258, "step": 1759} {"info/global_step": 1760, "train_info/time_within_train_step": 2.3570666313171387, "step": 1760} {"train_info/time_between_train_steps": 0.003213644027709961, "step": 1760} {"info/global_step": 1761, "train_info/time_within_train_step": 2.356375217437744, "step": 1761} {"train_info/time_between_train_steps": 0.003142833709716797, "step": 1761} {"info/global_step": 1762, "train_info/time_within_train_step": 2.3575236797332764, "step": 1762} {"train_info/time_between_train_steps": 0.0031347274780273438, "step": 1762} {"info/global_step": 1763, "train_info/time_within_train_step": 2.357963800430298, "step": 1763} {"train_info/time_between_train_steps": 0.0031118392944335938, "step": 1763} {"info/global_step": 1764, "train_info/time_within_train_step": 2.3565683364868164, "step": 1764} {"train_info/time_between_train_steps": 0.003350973129272461, "step": 1764} {"info/global_step": 1765, "train_info/time_within_train_step": 2.3577616214752197, "step": 1765} {"train_info/time_between_train_steps": 0.003165006637573242, "step": 1765} {"info/global_step": 1766, "train_info/time_within_train_step": 2.3564047813415527, "step": 1766} {"train_info/time_between_train_steps": 0.003180980682373047, "step": 1766} {"info/global_step": 1767, "train_info/time_within_train_step": 2.3571765422821045, "step": 1767} {"train_info/time_between_train_steps": 0.0031387805938720703, "step": 1767} {"info/global_step": 1768, "train_info/time_within_train_step": 2.3574306964874268, "step": 1768} {"train_info/time_between_train_steps": 0.0031790733337402344, "step": 1768} {"info/global_step": 1769, "train_info/time_within_train_step": 2.356858253479004, "step": 1769} {"train_info/time_between_train_steps": 0.0031316280364990234, "step": 1769} {"info/global_step": 1770, "train_info/time_within_train_step": 2.356724739074707, "step": 1770} {"train_info/time_between_train_steps": 0.003123760223388672, "step": 1770} {"info/global_step": 1771, "train_info/time_within_train_step": 2.3573901653289795, "step": 1771} {"train_info/time_between_train_steps": 0.003162860870361328, "step": 1771} {"info/global_step": 1772, "train_info/time_within_train_step": 2.3575947284698486, "step": 1772} {"train_info/time_between_train_steps": 0.0031638145446777344, "step": 1772} {"info/global_step": 1773, "train_info/time_within_train_step": 2.3562583923339844, "step": 1773} {"train_info/time_between_train_steps": 0.0031723976135253906, "step": 1773} {"info/global_step": 1774, "train_info/time_within_train_step": 2.3578670024871826, "step": 1774} {"train_info/time_between_train_steps": 0.0031347274780273438, "step": 1774} {"info/global_step": 1775, "train_info/time_within_train_step": 2.358454942703247, "step": 1775} {"train_info/time_between_train_steps": 0.0031189918518066406, "step": 1775} {"info/global_step": 1776, "train_info/time_within_train_step": 2.3569722175598145, "step": 1776} {"train_info/time_between_train_steps": 0.0031218528747558594, "step": 1776} {"info/global_step": 1777, "train_info/time_within_train_step": 2.3571436405181885, "step": 1777} {"train_info/time_between_train_steps": 0.003100872039794922, "step": 1777} {"info/global_step": 1778, "train_info/time_within_train_step": 2.357261896133423, "step": 1778} {"train_info/time_between_train_steps": 0.0031235218048095703, "step": 1778} {"info/global_step": 1779, "train_info/time_within_train_step": 2.3943285942077637, "step": 1779} {"train_info/time_between_train_steps": 0.003166675567626953, "step": 1779} {"info/global_step": 1780, "train_info/time_within_train_step": 2.355829954147339, "step": 1780} {"train_info/time_between_train_steps": 0.0031414031982421875, "step": 1780} {"info/global_step": 1781, "train_info/time_within_train_step": 2.3566150665283203, "step": 1781} {"train_info/time_between_train_steps": 0.003151416778564453, "step": 1781} {"info/global_step": 1782, "train_info/time_within_train_step": 2.5499942302703857, "step": 1782} {"train_info/time_between_train_steps": 0.003213644027709961, "step": 1782} {"info/global_step": 1783, "train_info/time_within_train_step": 2.474436044692993, "step": 1783} {"train_info/time_between_train_steps": 0.003213644027709961, "step": 1783} {"info/global_step": 1784, "train_info/time_within_train_step": 2.356459140777588, "step": 1784} {"train_info/time_between_train_steps": 0.0034055709838867188, "step": 1784} {"info/global_step": 1785, "train_info/time_within_train_step": 2.3565874099731445, "step": 1785} {"train_info/time_between_train_steps": 0.00315093994140625, "step": 1785} {"info/global_step": 1786, "train_info/time_within_train_step": 2.3896870613098145, "step": 1786} {"train_info/time_between_train_steps": 0.003159761428833008, "step": 1786} {"info/global_step": 1787, "train_info/time_within_train_step": 2.3569223880767822, "step": 1787} {"train_info/time_between_train_steps": 0.0031456947326660156, "step": 1787} {"info/global_step": 1788, "train_info/time_within_train_step": 2.356729507446289, "step": 1788} {"train_info/time_between_train_steps": 0.003153562545776367, "step": 1788} {"info/global_step": 1789, "train_info/time_within_train_step": 2.3560922145843506, "step": 1789} {"train_info/time_between_train_steps": 0.003179788589477539, "step": 1789} {"info/global_step": 1790, "train_info/time_within_train_step": 2.3565714359283447, "step": 1790} {"train_info/time_between_train_steps": 0.003168344497680664, "step": 1790} {"info/global_step": 1791, "train_info/time_within_train_step": 2.357261896133423, "step": 1791} {"train_info/time_between_train_steps": 0.0032224655151367188, "step": 1791} {"info/global_step": 1792, "train_info/time_within_train_step": 2.357435941696167, "step": 1792} {"train_info/time_between_train_steps": 0.0031409263610839844, "step": 1792} {"info/global_step": 1793, "train_info/time_within_train_step": 2.357945442199707, "step": 1793} {"train_info/time_between_train_steps": 0.003181934356689453, "step": 1793} {"info/global_step": 1794, "train_info/time_within_train_step": 2.3580081462860107, "step": 1794} {"train_info/time_between_train_steps": 0.0031404495239257812, "step": 1794} {"info/global_step": 1795, "train_info/time_within_train_step": 2.356656074523926, "step": 1795} {"train_info/time_between_train_steps": 0.0031251907348632812, "step": 1795} {"info/global_step": 1796, "train_info/time_within_train_step": 2.380032777786255, "step": 1796} {"train_info/time_between_train_steps": 0.0031850337982177734, "step": 1796} {"info/global_step": 1797, "train_info/time_within_train_step": 2.3557968139648438, "step": 1797} {"train_info/time_between_train_steps": 0.0031747817993164062, "step": 1797} {"info/global_step": 1798, "train_info/time_within_train_step": 2.356173515319824, "step": 1798} {"train_info/time_between_train_steps": 0.003157377243041992, "step": 1798} {"info/global_step": 1799, "train_info/time_within_train_step": 2.3573384284973145, "step": 1799} {"train_info/time_between_train_steps": 0.0031499862670898438, "step": 1799} {"info/global_step": 1800, "train_info/time_within_train_step": 2.3572604656219482, "step": 1800} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 8708.0, "train_info/memory_max_reserved": 8708.0, "_timestamp": 1746256833, "_runtime": 4652}, "step": 1800} {"logs": {"train/loss": 3.9645, "train/learning_rate": 0.0002666666666666666, "train/epoch": 2.03, "_timestamp": 1746256833, "_runtime": 4652}, "step": 1800} {"train_info/time_between_train_steps": 20.022494077682495, "step": 1800} {"info/global_step": 1801, "train_info/time_within_train_step": 2.200087070465088, "step": 1801} {"train_info/time_between_train_steps": 0.0031595230102539062, "step": 1801} {"info/global_step": 1802, "train_info/time_within_train_step": 2.180041790008545, "step": 1802} {"train_info/time_between_train_steps": 0.003131866455078125, "step": 1802} {"info/global_step": 1803, "train_info/time_within_train_step": 2.2264552116394043, "step": 1803} {"train_info/time_between_train_steps": 0.0031156539916992188, "step": 1803} {"info/global_step": 1804, "train_info/time_within_train_step": 2.338958263397217, "step": 1804} {"train_info/time_between_train_steps": 0.0031249523162841797, "step": 1804} {"info/global_step": 1805, "train_info/time_within_train_step": 2.5257818698883057, "step": 1805} {"train_info/time_between_train_steps": 0.0031707286834716797, "step": 1805} {"info/global_step": 1806, "train_info/time_within_train_step": 2.3554136753082275, "step": 1806} {"train_info/time_between_train_steps": 0.003164529800415039, "step": 1806} {"info/global_step": 1807, "train_info/time_within_train_step": 2.357161521911621, "step": 1807} {"train_info/time_between_train_steps": 0.003144979476928711, "step": 1807} {"info/global_step": 1808, "train_info/time_within_train_step": 2.3562750816345215, "step": 1808} {"train_info/time_between_train_steps": 0.0031578540802001953, "step": 1808} {"info/global_step": 1809, "train_info/time_within_train_step": 2.357367992401123, "step": 1809} {"train_info/time_between_train_steps": 0.003116130828857422, "step": 1809} {"info/global_step": 1810, "train_info/time_within_train_step": 2.3627359867095947, "step": 1810} {"train_info/time_between_train_steps": 0.006551027297973633, "step": 1810} {"info/global_step": 1811, "train_info/time_within_train_step": 2.3573291301727295, "step": 1811} {"train_info/time_between_train_steps": 0.00312042236328125, "step": 1811} {"info/global_step": 1812, "train_info/time_within_train_step": 2.3569142818450928, "step": 1812} {"train_info/time_between_train_steps": 0.003169536590576172, "step": 1812} {"info/global_step": 1813, "train_info/time_within_train_step": 2.3818721771240234, "step": 1813} {"train_info/time_between_train_steps": 0.0031228065490722656, "step": 1813} {"info/global_step": 1814, "train_info/time_within_train_step": 2.3581507205963135, "step": 1814} {"train_info/time_between_train_steps": 0.0031175613403320312, "step": 1814} {"info/global_step": 1815, "train_info/time_within_train_step": 2.357929229736328, "step": 1815} {"train_info/time_between_train_steps": 0.0031070709228515625, "step": 1815} {"info/global_step": 1816, "train_info/time_within_train_step": 2.3594021797180176, "step": 1816} {"train_info/time_between_train_steps": 0.003120899200439453, "step": 1816} {"info/global_step": 1817, "train_info/time_within_train_step": 2.3570210933685303, "step": 1817} {"train_info/time_between_train_steps": 0.003155231475830078, "step": 1817} {"info/global_step": 1818, "train_info/time_within_train_step": 2.35648775100708, "step": 1818} {"train_info/time_between_train_steps": 0.0031366348266601562, "step": 1818} {"info/global_step": 1819, "train_info/time_within_train_step": 2.357724666595459, "step": 1819} {"train_info/time_between_train_steps": 0.0031502246856689453, "step": 1819} {"info/global_step": 1820, "train_info/time_within_train_step": 2.356726884841919, "step": 1820} {"train_info/time_between_train_steps": 0.003177642822265625, "step": 1820} {"info/global_step": 1821, "train_info/time_within_train_step": 2.357442855834961, "step": 1821} {"train_info/time_between_train_steps": 0.0031003952026367188, "step": 1821} {"info/global_step": 1822, "train_info/time_within_train_step": 2.357652425765991, "step": 1822} {"train_info/time_between_train_steps": 0.0032007694244384766, "step": 1822} {"info/global_step": 1823, "train_info/time_within_train_step": 2.357323408126831, "step": 1823} {"train_info/time_between_train_steps": 0.003094911575317383, "step": 1823} {"info/global_step": 1824, "train_info/time_within_train_step": 2.3576393127441406, "step": 1824} {"train_info/time_between_train_steps": 0.0030820369720458984, "step": 1824} {"info/global_step": 1825, "train_info/time_within_train_step": 2.3569552898406982, "step": 1825} {"train_info/time_between_train_steps": 0.003129243850708008, "step": 1825} {"info/global_step": 1826, "train_info/time_within_train_step": 2.357625961303711, "step": 1826} {"train_info/time_between_train_steps": 0.003236055374145508, "step": 1826} {"info/global_step": 1827, "train_info/time_within_train_step": 2.3576178550720215, "step": 1827} {"train_info/time_between_train_steps": 0.0031533241271972656, "step": 1827} {"info/global_step": 1828, "train_info/time_within_train_step": 2.356273651123047, "step": 1828} {"train_info/time_between_train_steps": 0.0031032562255859375, "step": 1828} {"info/global_step": 1829, "train_info/time_within_train_step": 2.357233762741089, "step": 1829} {"train_info/time_between_train_steps": 0.0031614303588867188, "step": 1829} {"info/global_step": 1830, "train_info/time_within_train_step": 2.5640292167663574, "step": 1830} {"train_info/time_between_train_steps": 0.003186941146850586, "step": 1830} {"info/global_step": 1831, "train_info/time_within_train_step": 2.357346773147583, "step": 1831} {"train_info/time_between_train_steps": 0.0031850337982177734, "step": 1831} {"info/global_step": 1832, "train_info/time_within_train_step": 2.357496500015259, "step": 1832} {"train_info/time_between_train_steps": 0.0031731128692626953, "step": 1832} {"info/global_step": 1833, "train_info/time_within_train_step": 2.3576269149780273, "step": 1833} {"train_info/time_between_train_steps": 0.003172159194946289, "step": 1833} {"info/global_step": 1834, "train_info/time_within_train_step": 2.356403350830078, "step": 1834} {"train_info/time_between_train_steps": 0.003165721893310547, "step": 1834} {"info/global_step": 1835, "train_info/time_within_train_step": 2.3570778369903564, "step": 1835} {"train_info/time_between_train_steps": 0.0031461715698242188, "step": 1835} {"info/global_step": 1836, "train_info/time_within_train_step": 2.35792875289917, "step": 1836} {"train_info/time_between_train_steps": 0.003145933151245117, "step": 1836} {"info/global_step": 1837, "train_info/time_within_train_step": 2.3567798137664795, "step": 1837} {"train_info/time_between_train_steps": 0.0031201839447021484, "step": 1837} {"info/global_step": 1838, "train_info/time_within_train_step": 2.3569564819335938, "step": 1838} {"train_info/time_between_train_steps": 0.003122091293334961, "step": 1838} {"info/global_step": 1839, "train_info/time_within_train_step": 2.3570990562438965, "step": 1839} {"train_info/time_between_train_steps": 0.003190279006958008, "step": 1839} {"info/global_step": 1840, "train_info/time_within_train_step": 2.3564822673797607, "step": 1840} {"train_info/time_between_train_steps": 0.003191709518432617, "step": 1840} {"info/global_step": 1841, "train_info/time_within_train_step": 2.3581364154815674, "step": 1841} {"train_info/time_between_train_steps": 0.0031757354736328125, "step": 1841} {"info/global_step": 1842, "train_info/time_within_train_step": 2.3568575382232666, "step": 1842} {"train_info/time_between_train_steps": 0.0031189918518066406, "step": 1842} {"info/global_step": 1843, "train_info/time_within_train_step": 2.3580899238586426, "step": 1843} {"train_info/time_between_train_steps": 0.0031599998474121094, "step": 1843} {"info/global_step": 1844, "train_info/time_within_train_step": 2.3572328090667725, "step": 1844} {"train_info/time_between_train_steps": 0.0031936168670654297, "step": 1844} {"info/global_step": 1845, "train_info/time_within_train_step": 2.356982946395874, "step": 1845} {"train_info/time_between_train_steps": 0.12166213989257812, "step": 1845} {"info/global_step": 1846, "train_info/time_within_train_step": 2.3728816509246826, "step": 1846} {"train_info/time_between_train_steps": 0.003167390823364258, "step": 1846} {"info/global_step": 1847, "train_info/time_within_train_step": 2.3564980030059814, "step": 1847} {"train_info/time_between_train_steps": 0.003223419189453125, "step": 1847} {"info/global_step": 1848, "train_info/time_within_train_step": 2.356282949447632, "step": 1848} {"train_info/time_between_train_steps": 0.0031342506408691406, "step": 1848} {"info/global_step": 1849, "train_info/time_within_train_step": 2.357264518737793, "step": 1849} {"train_info/time_between_train_steps": 0.0031790733337402344, "step": 1849} {"info/global_step": 1850, "train_info/time_within_train_step": 2.357252836227417, "step": 1850} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 8708.0, "train_info/memory_max_reserved": 8708.0, "_timestamp": 1746256972, "_runtime": 4791}, "step": 1850} {"logs": {"train/loss": 3.944, "train/learning_rate": 0.00025555555555555553, "train/epoch": 2.04, "_timestamp": 1746256972, "_runtime": 4791}, "step": 1850} {"train_info/time_between_train_steps": 0.025182247161865234, "step": 1850} {"info/global_step": 1851, "train_info/time_within_train_step": 2.3575825691223145, "step": 1851} {"train_info/time_between_train_steps": 0.0031507015228271484, "step": 1851} {"info/global_step": 1852, "train_info/time_within_train_step": 2.3577404022216797, "step": 1852} {"train_info/time_between_train_steps": 0.0031855106353759766, "step": 1852} {"info/global_step": 1853, "train_info/time_within_train_step": 2.3572020530700684, "step": 1853} {"train_info/time_between_train_steps": 0.003170013427734375, "step": 1853} {"info/global_step": 1854, "train_info/time_within_train_step": 2.3569347858428955, "step": 1854} {"train_info/time_between_train_steps": 0.003197193145751953, "step": 1854} {"info/global_step": 1855, "train_info/time_within_train_step": 2.5506112575531006, "step": 1855} {"train_info/time_between_train_steps": 0.0032036304473876953, "step": 1855} {"info/global_step": 1856, "train_info/time_within_train_step": 2.3569111824035645, "step": 1856} {"train_info/time_between_train_steps": 0.0031757354736328125, "step": 1856} {"info/global_step": 1857, "train_info/time_within_train_step": 2.356651544570923, "step": 1857} {"train_info/time_between_train_steps": 0.003152132034301758, "step": 1857} {"info/global_step": 1858, "train_info/time_within_train_step": 2.3569371700286865, "step": 1858} {"train_info/time_between_train_steps": 0.0032041072845458984, "step": 1858} {"info/global_step": 1859, "train_info/time_within_train_step": 2.356200695037842, "step": 1859} {"train_info/time_between_train_steps": 0.003186464309692383, "step": 1859} {"info/global_step": 1860, "train_info/time_within_train_step": 2.3570897579193115, "step": 1860} {"train_info/time_between_train_steps": 0.003141164779663086, "step": 1860} {"info/global_step": 1861, "train_info/time_within_train_step": 2.3582122325897217, "step": 1861} {"train_info/time_between_train_steps": 0.0031654834747314453, "step": 1861} {"info/global_step": 1862, "train_info/time_within_train_step": 2.357943534851074, "step": 1862} {"train_info/time_between_train_steps": 0.003160238265991211, "step": 1862} {"info/global_step": 1863, "train_info/time_within_train_step": 2.3569226264953613, "step": 1863} {"train_info/time_between_train_steps": 0.003154277801513672, "step": 1863} {"info/global_step": 1864, "train_info/time_within_train_step": 2.3564789295196533, "step": 1864} {"train_info/time_between_train_steps": 0.003175497055053711, "step": 1864} {"info/global_step": 1865, "train_info/time_within_train_step": 2.3581905364990234, "step": 1865} {"train_info/time_between_train_steps": 0.003149747848510742, "step": 1865} {"info/global_step": 1866, "train_info/time_within_train_step": 2.355684280395508, "step": 1866} {"train_info/time_between_train_steps": 0.003139972686767578, "step": 1866} {"info/global_step": 1867, "train_info/time_within_train_step": 2.357028007507324, "step": 1867} {"train_info/time_between_train_steps": 0.0031549930572509766, "step": 1867} {"info/global_step": 1868, "train_info/time_within_train_step": 2.3568408489227295, "step": 1868} {"train_info/time_between_train_steps": 0.0032067298889160156, "step": 1868} {"info/global_step": 1869, "train_info/time_within_train_step": 2.357525110244751, "step": 1869} {"train_info/time_between_train_steps": 0.0035190582275390625, "step": 1869} {"info/global_step": 1870, "train_info/time_within_train_step": 2.3564133644104004, "step": 1870} {"train_info/time_between_train_steps": 0.003177165985107422, "step": 1870} {"info/global_step": 1871, "train_info/time_within_train_step": 2.35748028755188, "step": 1871} {"train_info/time_between_train_steps": 0.0032072067260742188, "step": 1871} {"info/global_step": 1872, "train_info/time_within_train_step": 2.3580665588378906, "step": 1872} {"train_info/time_between_train_steps": 0.0031528472900390625, "step": 1872} {"info/global_step": 1873, "train_info/time_within_train_step": 2.356750726699829, "step": 1873} {"train_info/time_between_train_steps": 0.006469249725341797, "step": 1873} {"info/global_step": 1874, "train_info/time_within_train_step": 2.355959892272949, "step": 1874} {"train_info/time_between_train_steps": 0.006518840789794922, "step": 1874} {"info/global_step": 1875, "train_info/time_within_train_step": 2.3572750091552734, "step": 1875} {"train_info/time_between_train_steps": 0.006564617156982422, "step": 1875} {"info/global_step": 1876, "train_info/time_within_train_step": 2.3562090396881104, "step": 1876} {"train_info/time_between_train_steps": 0.0065135955810546875, "step": 1876} {"info/global_step": 1877, "train_info/time_within_train_step": 2.3560378551483154, "step": 1877} {"train_info/time_between_train_steps": 0.0031218528747558594, "step": 1877} {"info/global_step": 1878, "train_info/time_within_train_step": 2.3570969104766846, "step": 1878} {"train_info/time_between_train_steps": 0.006448268890380859, "step": 1878} {"info/global_step": 1879, "train_info/time_within_train_step": 2.565049171447754, "step": 1879} {"train_info/time_between_train_steps": 0.006467342376708984, "step": 1879} {"info/global_step": 1880, "train_info/time_within_train_step": 2.356837034225464, "step": 1880} {"train_info/time_between_train_steps": 0.006480693817138672, "step": 1880} {"info/global_step": 1881, "train_info/time_within_train_step": 2.3564541339874268, "step": 1881} {"train_info/time_between_train_steps": 0.006472110748291016, "step": 1881} {"info/global_step": 1882, "train_info/time_within_train_step": 2.3566019535064697, "step": 1882} {"train_info/time_between_train_steps": 0.006481647491455078, "step": 1882} {"info/global_step": 1883, "train_info/time_within_train_step": 2.356778860092163, "step": 1883} {"train_info/time_between_train_steps": 0.006443500518798828, "step": 1883} {"info/global_step": 1884, "train_info/time_within_train_step": 2.3560924530029297, "step": 1884} {"train_info/time_between_train_steps": 0.006498575210571289, "step": 1884} {"info/global_step": 1885, "train_info/time_within_train_step": 2.3613224029541016, "step": 1885} {"train_info/time_between_train_steps": 0.006470203399658203, "step": 1885} {"info/global_step": 1886, "train_info/time_within_train_step": 2.3568882942199707, "step": 1886} {"train_info/time_between_train_steps": 0.006529092788696289, "step": 1886} {"info/global_step": 1887, "train_info/time_within_train_step": 2.3575148582458496, "step": 1887} {"train_info/time_between_train_steps": 0.0064580440521240234, "step": 1887} {"info/global_step": 1888, "train_info/time_within_train_step": 2.357929229736328, "step": 1888} {"train_info/time_between_train_steps": 0.006540060043334961, "step": 1888} {"info/global_step": 1889, "train_info/time_within_train_step": 2.3567607402801514, "step": 1889} {"train_info/time_between_train_steps": 0.0031647682189941406, "step": 1889} {"info/global_step": 1890, "train_info/time_within_train_step": 2.3572912216186523, "step": 1890} {"train_info/time_between_train_steps": 0.0031909942626953125, "step": 1890} {"info/global_step": 1891, "train_info/time_within_train_step": 2.3573994636535645, "step": 1891} {"train_info/time_between_train_steps": 0.006461143493652344, "step": 1891} {"info/global_step": 1892, "train_info/time_within_train_step": 2.3608694076538086, "step": 1892} {"train_info/time_between_train_steps": 0.0065081119537353516, "step": 1892} {"info/global_step": 1893, "train_info/time_within_train_step": 2.3576083183288574, "step": 1893} {"train_info/time_between_train_steps": 0.003181934356689453, "step": 1893} {"info/global_step": 1894, "train_info/time_within_train_step": 2.3562746047973633, "step": 1894} {"train_info/time_between_train_steps": 0.0031566619873046875, "step": 1894} {"info/global_step": 1895, "train_info/time_within_train_step": 2.3570163249969482, "step": 1895} {"train_info/time_between_train_steps": 0.00319671630859375, "step": 1895} {"info/global_step": 1896, "train_info/time_within_train_step": 2.356874704360962, "step": 1896} {"train_info/time_between_train_steps": 0.003147125244140625, "step": 1896} {"info/global_step": 1897, "train_info/time_within_train_step": 2.3568437099456787, "step": 1897} {"train_info/time_between_train_steps": 0.0031518936157226562, "step": 1897} {"info/global_step": 1898, "train_info/time_within_train_step": 2.3578712940216064, "step": 1898} {"train_info/time_between_train_steps": 0.0031685829162597656, "step": 1898} {"info/global_step": 1899, "train_info/time_within_train_step": 2.358004570007324, "step": 1899} {"train_info/time_between_train_steps": 0.0032372474670410156, "step": 1899} {"info/global_step": 1900, "train_info/time_within_train_step": 2.357524871826172, "step": 1900} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 8708.0, "train_info/memory_max_reserved": 8708.0, "_timestamp": 1746257091, "_runtime": 4910}, "step": 1900} {"logs": {"train/loss": 3.935, "train/learning_rate": 0.00024444444444444443, "train/epoch": 2.06, "_timestamp": 1746257091, "_runtime": 4910}, "step": 1900} {"train_info/time_between_train_steps": 15.1534423828125, "step": 1900} {"info/global_step": 1901, "train_info/time_within_train_step": 2.194054365158081, "step": 1901} {"train_info/time_between_train_steps": 0.003119230270385742, "step": 1901} {"info/global_step": 1902, "train_info/time_within_train_step": 2.1837966442108154, "step": 1902} {"train_info/time_between_train_steps": 0.0031502246856689453, "step": 1902} {"info/global_step": 1903, "train_info/time_within_train_step": 2.2725353240966797, "step": 1903} {"train_info/time_between_train_steps": 0.0031554698944091797, "step": 1903} {"info/global_step": 1904, "train_info/time_within_train_step": 2.568065881729126, "step": 1904} {"train_info/time_between_train_steps": 0.0031752586364746094, "step": 1904} {"info/global_step": 1905, "train_info/time_within_train_step": 2.3523571491241455, "step": 1905} {"train_info/time_between_train_steps": 0.0031452178955078125, "step": 1905} {"info/global_step": 1906, "train_info/time_within_train_step": 2.3556225299835205, "step": 1906} {"train_info/time_between_train_steps": 0.0031554698944091797, "step": 1906} {"info/global_step": 1907, "train_info/time_within_train_step": 2.355820417404175, "step": 1907} {"train_info/time_between_train_steps": 0.003125905990600586, "step": 1907} {"info/global_step": 1908, "train_info/time_within_train_step": 2.4755351543426514, "step": 1908} {"train_info/time_between_train_steps": 0.003153562545776367, "step": 1908} {"info/global_step": 1909, "train_info/time_within_train_step": 2.35642409324646, "step": 1909} {"train_info/time_between_train_steps": 0.003192901611328125, "step": 1909} {"info/global_step": 1910, "train_info/time_within_train_step": 2.356358528137207, "step": 1910} {"train_info/time_between_train_steps": 0.0032873153686523438, "step": 1910} {"info/global_step": 1911, "train_info/time_within_train_step": 2.356520175933838, "step": 1911} {"train_info/time_between_train_steps": 0.003149747848510742, "step": 1911} {"info/global_step": 1912, "train_info/time_within_train_step": 2.3565664291381836, "step": 1912} {"train_info/time_between_train_steps": 0.003166675567626953, "step": 1912} {"info/global_step": 1913, "train_info/time_within_train_step": 2.357295274734497, "step": 1913} {"train_info/time_between_train_steps": 0.003152608871459961, "step": 1913} {"info/global_step": 1914, "train_info/time_within_train_step": 2.3560125827789307, "step": 1914} {"train_info/time_between_train_steps": 0.003155231475830078, "step": 1914} {"info/global_step": 1915, "train_info/time_within_train_step": 2.3567841053009033, "step": 1915} {"train_info/time_between_train_steps": 0.0031824111938476562, "step": 1915} {"info/global_step": 1916, "train_info/time_within_train_step": 2.357407808303833, "step": 1916} {"train_info/time_between_train_steps": 0.0031936168670654297, "step": 1916} {"info/global_step": 1917, "train_info/time_within_train_step": 2.356564998626709, "step": 1917} {"train_info/time_between_train_steps": 0.0031828880310058594, "step": 1917} {"info/global_step": 1918, "train_info/time_within_train_step": 2.357255458831787, "step": 1918} {"train_info/time_between_train_steps": 0.0031671524047851562, "step": 1918} {"info/global_step": 1919, "train_info/time_within_train_step": 2.3557326793670654, "step": 1919} {"train_info/time_between_train_steps": 0.0032117366790771484, "step": 1919} {"info/global_step": 1920, "train_info/time_within_train_step": 2.356733560562134, "step": 1920} {"train_info/time_between_train_steps": 0.0031862258911132812, "step": 1920} {"info/global_step": 1921, "train_info/time_within_train_step": 2.357205390930176, "step": 1921} {"train_info/time_between_train_steps": 0.0031821727752685547, "step": 1921} {"info/global_step": 1922, "train_info/time_within_train_step": 2.357358455657959, "step": 1922} {"train_info/time_between_train_steps": 0.0032498836517333984, "step": 1922} {"info/global_step": 1923, "train_info/time_within_train_step": 2.357832193374634, "step": 1923} {"train_info/time_between_train_steps": 0.0031783580780029297, "step": 1923} {"info/global_step": 1924, "train_info/time_within_train_step": 2.3573431968688965, "step": 1924} {"train_info/time_between_train_steps": 0.003276824951171875, "step": 1924} {"info/global_step": 1925, "train_info/time_within_train_step": 2.357938051223755, "step": 1925} {"train_info/time_between_train_steps": 0.003167390823364258, "step": 1925} {"info/global_step": 1926, "train_info/time_within_train_step": 2.357349395751953, "step": 1926} {"train_info/time_between_train_steps": 0.003149271011352539, "step": 1926} {"info/global_step": 1927, "train_info/time_within_train_step": 2.356889009475708, "step": 1927} {"train_info/time_between_train_steps": 0.0031599998474121094, "step": 1927} {"info/global_step": 1928, "train_info/time_within_train_step": 2.576465606689453, "step": 1928} {"train_info/time_between_train_steps": 0.003201723098754883, "step": 1928} {"info/global_step": 1929, "train_info/time_within_train_step": 2.356914758682251, "step": 1929} {"train_info/time_between_train_steps": 0.003209829330444336, "step": 1929} {"info/global_step": 1930, "train_info/time_within_train_step": 2.357600212097168, "step": 1930} {"train_info/time_between_train_steps": 0.0031812191009521484, "step": 1930} {"info/global_step": 1931, "train_info/time_within_train_step": 2.3567728996276855, "step": 1931} {"train_info/time_between_train_steps": 0.003156900405883789, "step": 1931} {"info/global_step": 1932, "train_info/time_within_train_step": 2.357452869415283, "step": 1932} {"train_info/time_between_train_steps": 0.0032110214233398438, "step": 1932} {"info/global_step": 1933, "train_info/time_within_train_step": 2.3574774265289307, "step": 1933} {"train_info/time_between_train_steps": 0.003144502639770508, "step": 1933} {"info/global_step": 1934, "train_info/time_within_train_step": 2.3560478687286377, "step": 1934} {"train_info/time_between_train_steps": 0.00333404541015625, "step": 1934} {"info/global_step": 1935, "train_info/time_within_train_step": 2.356508255004883, "step": 1935} {"train_info/time_between_train_steps": 0.0031766891479492188, "step": 1935} {"info/global_step": 1936, "train_info/time_within_train_step": 2.3575122356414795, "step": 1936} {"train_info/time_between_train_steps": 0.0031554698944091797, "step": 1936} {"info/global_step": 1937, "train_info/time_within_train_step": 2.3572521209716797, "step": 1937} {"train_info/time_between_train_steps": 0.0031952857971191406, "step": 1937} {"info/global_step": 1938, "train_info/time_within_train_step": 2.35601544380188, "step": 1938} {"train_info/time_between_train_steps": 0.0031616687774658203, "step": 1938} {"info/global_step": 1939, "train_info/time_within_train_step": 2.3570380210876465, "step": 1939} {"train_info/time_between_train_steps": 0.00315093994140625, "step": 1939} {"info/global_step": 1940, "train_info/time_within_train_step": 2.3571839332580566, "step": 1940} {"train_info/time_between_train_steps": 0.003159046173095703, "step": 1940} {"info/global_step": 1941, "train_info/time_within_train_step": 2.356982946395874, "step": 1941} {"train_info/time_between_train_steps": 0.003186941146850586, "step": 1941} {"info/global_step": 1942, "train_info/time_within_train_step": 2.3567378520965576, "step": 1942} {"train_info/time_between_train_steps": 0.0032286643981933594, "step": 1942} {"info/global_step": 1943, "train_info/time_within_train_step": 2.3562958240509033, "step": 1943} {"train_info/time_between_train_steps": 0.003175020217895508, "step": 1943} {"info/global_step": 1944, "train_info/time_within_train_step": 2.356501579284668, "step": 1944} {"train_info/time_between_train_steps": 0.003161191940307617, "step": 1944} {"info/global_step": 1945, "train_info/time_within_train_step": 2.3571126461029053, "step": 1945} {"train_info/time_between_train_steps": 0.003156423568725586, "step": 1945} {"info/global_step": 1946, "train_info/time_within_train_step": 2.355769634246826, "step": 1946} {"train_info/time_between_train_steps": 0.0031588077545166016, "step": 1946} {"info/global_step": 1947, "train_info/time_within_train_step": 2.355933427810669, "step": 1947} {"train_info/time_between_train_steps": 0.003181934356689453, "step": 1947} {"info/global_step": 1948, "train_info/time_within_train_step": 2.355905294418335, "step": 1948} {"train_info/time_between_train_steps": 0.0031735897064208984, "step": 1948} {"info/global_step": 1949, "train_info/time_within_train_step": 2.356959581375122, "step": 1949} {"train_info/time_between_train_steps": 0.003210306167602539, "step": 1949} {"info/global_step": 1950, "train_info/time_within_train_step": 2.3565101623535156, "step": 1950} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 8708.0, "train_info/memory_max_reserved": 8708.0, "_timestamp": 1746257226, "_runtime": 5045}, "step": 1950} {"logs": {"train/loss": 3.9153, "train/learning_rate": 0.0002333333333333333, "train/epoch": 2.08, "_timestamp": 1746257226, "_runtime": 5045}, "step": 1950} {"train_info/time_between_train_steps": 0.024884700775146484, "step": 1950} {"info/global_step": 1951, "train_info/time_within_train_step": 2.3570098876953125, "step": 1951} {"train_info/time_between_train_steps": 0.003216981887817383, "step": 1951} {"info/global_step": 1952, "train_info/time_within_train_step": 2.356139659881592, "step": 1952} {"train_info/time_between_train_steps": 0.0031371116638183594, "step": 1952} {"info/global_step": 1953, "train_info/time_within_train_step": 2.577955722808838, "step": 1953} {"train_info/time_between_train_steps": 0.0032210350036621094, "step": 1953} {"info/global_step": 1954, "train_info/time_within_train_step": 2.3563642501831055, "step": 1954} {"train_info/time_between_train_steps": 0.0031769275665283203, "step": 1954} {"info/global_step": 1955, "train_info/time_within_train_step": 2.3614330291748047, "step": 1955} {"train_info/time_between_train_steps": 0.0031464099884033203, "step": 1955} {"info/global_step": 1956, "train_info/time_within_train_step": 2.356137752532959, "step": 1956} {"train_info/time_between_train_steps": 0.0031456947326660156, "step": 1956} {"info/global_step": 1957, "train_info/time_within_train_step": 2.356983184814453, "step": 1957} {"train_info/time_between_train_steps": 0.003175973892211914, "step": 1957} {"info/global_step": 1958, "train_info/time_within_train_step": 2.378868579864502, "step": 1958} {"train_info/time_between_train_steps": 0.0031583309173583984, "step": 1958} {"info/global_step": 1959, "train_info/time_within_train_step": 2.35534930229187, "step": 1959} {"train_info/time_between_train_steps": 0.0031592845916748047, "step": 1959} {"info/global_step": 1960, "train_info/time_within_train_step": 2.3567371368408203, "step": 1960} {"train_info/time_between_train_steps": 0.0031690597534179688, "step": 1960} {"info/global_step": 1961, "train_info/time_within_train_step": 2.3541481494903564, "step": 1961} {"train_info/time_between_train_steps": 0.0031561851501464844, "step": 1961} {"info/global_step": 1962, "train_info/time_within_train_step": 2.355865478515625, "step": 1962} {"train_info/time_between_train_steps": 0.00316619873046875, "step": 1962} {"info/global_step": 1963, "train_info/time_within_train_step": 2.354761838912964, "step": 1963} {"train_info/time_between_train_steps": 0.0031557083129882812, "step": 1963} {"info/global_step": 1964, "train_info/time_within_train_step": 2.3555238246917725, "step": 1964} {"train_info/time_between_train_steps": 0.0031461715698242188, "step": 1964} {"info/global_step": 1965, "train_info/time_within_train_step": 2.355508804321289, "step": 1965} {"train_info/time_between_train_steps": 0.003240346908569336, "step": 1965} {"info/global_step": 1966, "train_info/time_within_train_step": 2.3555941581726074, "step": 1966} {"train_info/time_between_train_steps": 0.003204345703125, "step": 1966} {"info/global_step": 1967, "train_info/time_within_train_step": 2.3560872077941895, "step": 1967} {"train_info/time_between_train_steps": 0.003133535385131836, "step": 1967} {"info/global_step": 1968, "train_info/time_within_train_step": 2.3555679321289062, "step": 1968} {"train_info/time_between_train_steps": 0.0031328201293945312, "step": 1968} {"info/global_step": 1969, "train_info/time_within_train_step": 2.355182409286499, "step": 1969} {"train_info/time_between_train_steps": 0.003169536590576172, "step": 1969} {"info/global_step": 1970, "train_info/time_within_train_step": 2.3556442260742188, "step": 1970} {"train_info/time_between_train_steps": 0.12258291244506836, "step": 1970} {"info/global_step": 1971, "train_info/time_within_train_step": 2.356527805328369, "step": 1971} {"train_info/time_between_train_steps": 0.003217458724975586, "step": 1971} {"info/global_step": 1972, "train_info/time_within_train_step": 2.3560128211975098, "step": 1972} {"train_info/time_between_train_steps": 0.0032074451446533203, "step": 1972} {"info/global_step": 1973, "train_info/time_within_train_step": 2.3557980060577393, "step": 1973} {"train_info/time_between_train_steps": 0.00321197509765625, "step": 1973} {"info/global_step": 1974, "train_info/time_within_train_step": 2.3562731742858887, "step": 1974} {"train_info/time_between_train_steps": 0.003195047378540039, "step": 1974} {"info/global_step": 1975, "train_info/time_within_train_step": 2.3559069633483887, "step": 1975} {"train_info/time_between_train_steps": 0.003154754638671875, "step": 1975} {"info/global_step": 1976, "train_info/time_within_train_step": 2.355651617050171, "step": 1976} {"train_info/time_between_train_steps": 0.003143310546875, "step": 1976} {"info/global_step": 1977, "train_info/time_within_train_step": 2.579291343688965, "step": 1977} {"train_info/time_between_train_steps": 0.0031905174255371094, "step": 1977} {"info/global_step": 1978, "train_info/time_within_train_step": 2.3548810482025146, "step": 1978} {"train_info/time_between_train_steps": 0.0031769275665283203, "step": 1978} {"info/global_step": 1979, "train_info/time_within_train_step": 2.3558218479156494, "step": 1979} {"train_info/time_between_train_steps": 0.0031676292419433594, "step": 1979} {"info/global_step": 1980, "train_info/time_within_train_step": 2.354689836502075, "step": 1980} {"train_info/time_between_train_steps": 0.0031447410583496094, "step": 1980} {"info/global_step": 1981, "train_info/time_within_train_step": 2.355283260345459, "step": 1981} {"train_info/time_between_train_steps": 0.003147602081298828, "step": 1981} {"info/global_step": 1982, "train_info/time_within_train_step": 2.354405164718628, "step": 1982} {"train_info/time_between_train_steps": 0.0032358169555664062, "step": 1982} {"info/global_step": 1983, "train_info/time_within_train_step": 2.3561694622039795, "step": 1983} {"train_info/time_between_train_steps": 0.003170490264892578, "step": 1983} {"info/global_step": 1984, "train_info/time_within_train_step": 2.3557071685791016, "step": 1984} {"train_info/time_between_train_steps": 0.0032405853271484375, "step": 1984} {"info/global_step": 1985, "train_info/time_within_train_step": 2.3570716381073, "step": 1985} {"train_info/time_between_train_steps": 0.003152132034301758, "step": 1985} {"info/global_step": 1986, "train_info/time_within_train_step": 2.3568365573883057, "step": 1986} {"train_info/time_between_train_steps": 0.003154754638671875, "step": 1986} {"info/global_step": 1987, "train_info/time_within_train_step": 2.356099843978882, "step": 1987} {"train_info/time_between_train_steps": 0.0031511783599853516, "step": 1987} {"info/global_step": 1988, "train_info/time_within_train_step": 2.3554561138153076, "step": 1988} {"train_info/time_between_train_steps": 0.003203868865966797, "step": 1988} {"info/global_step": 1989, "train_info/time_within_train_step": 2.355929136276245, "step": 1989} {"train_info/time_between_train_steps": 0.0031499862670898438, "step": 1989} {"info/global_step": 1990, "train_info/time_within_train_step": 2.3555495738983154, "step": 1990} {"train_info/time_between_train_steps": 0.003195047378540039, "step": 1990} {"info/global_step": 1991, "train_info/time_within_train_step": 2.3558945655822754, "step": 1991} {"train_info/time_between_train_steps": 0.003192901611328125, "step": 1991} {"info/global_step": 1992, "train_info/time_within_train_step": 2.355679988861084, "step": 1992} {"train_info/time_between_train_steps": 0.003296375274658203, "step": 1992} {"info/global_step": 1993, "train_info/time_within_train_step": 2.356067419052124, "step": 1993} {"train_info/time_between_train_steps": 0.003141164779663086, "step": 1993} {"info/global_step": 1994, "train_info/time_within_train_step": 2.3558108806610107, "step": 1994} {"train_info/time_between_train_steps": 0.003167867660522461, "step": 1994} {"info/global_step": 1995, "train_info/time_within_train_step": 2.3557071685791016, "step": 1995} {"train_info/time_between_train_steps": 0.003173351287841797, "step": 1995} {"info/global_step": 1996, "train_info/time_within_train_step": 2.3561971187591553, "step": 1996} {"train_info/time_between_train_steps": 0.0032219886779785156, "step": 1996} {"info/global_step": 1997, "train_info/time_within_train_step": 2.3934056758880615, "step": 1997} {"train_info/time_between_train_steps": 0.003219127655029297, "step": 1997} {"info/global_step": 1998, "train_info/time_within_train_step": 2.355977773666382, "step": 1998} {"train_info/time_between_train_steps": 0.0031719207763671875, "step": 1998} {"info/global_step": 1999, "train_info/time_within_train_step": 2.923224449157715, "step": 1999} {"train_info/time_between_train_steps": 0.0031960010528564453, "step": 1999} {"info/global_step": 2000, "train_info/time_within_train_step": 2.3554203510284424, "step": 2000} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 8708.0, "train_info/memory_max_reserved": 8708.0, "_timestamp": 1746257346, "_runtime": 5165}, "step": 2000} {"logs": {"train/loss": 3.9011, "train/learning_rate": 0.00022222222222222218, "train/epoch": 2.09, "_timestamp": 1746257346, "_runtime": 5165}, "step": 2000} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 8708.0, "train_info/memory_max_reserved": 8708.0, "_timestamp": 1746257350, "_runtime": 5169}, "step": 2000} {"logs": {"eval/loss": 4.376309871673584, "eval/runtime": 4.365, "eval/samples_per_second": 45.819, "eval/steps_per_second": 1.145, "train/epoch": 2.09, "_timestamp": 1746257350, "_runtime": 5169}, "step": 2000} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 8708.0, "train_info/memory_max_reserved": 8708.0, "_timestamp": 1746257350, "_runtime": 5169}, "step": 2000} {"logs": {"eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_loss": 4.376309871673584, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_ppl": 79.5439637276111, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_runtime": 4.365, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_samples_per_second": 45.819, "train/epoch": 2.09, "_timestamp": 1746257350, "_runtime": 5169}, "step": 2000} {"train_info/time_between_train_steps": 18.033282041549683, "step": 2000} {"info/global_step": 2001, "train_info/time_within_train_step": 2.194451093673706, "step": 2001} {"train_info/time_between_train_steps": 0.0037124156951904297, "step": 2001} {"info/global_step": 2002, "train_info/time_within_train_step": 2.181727647781372, "step": 2002} {"train_info/time_between_train_steps": 0.0032091140747070312, "step": 2002} {"info/global_step": 2003, "train_info/time_within_train_step": 2.2967755794525146, "step": 2003} {"train_info/time_between_train_steps": 0.0031833648681640625, "step": 2003} {"info/global_step": 2004, "train_info/time_within_train_step": 2.348630666732788, "step": 2004} {"train_info/time_between_train_steps": 0.003192424774169922, "step": 2004} {"info/global_step": 2005, "train_info/time_within_train_step": 2.3523812294006348, "step": 2005} {"train_info/time_between_train_steps": 0.0031595230102539062, "step": 2005} {"info/global_step": 2006, "train_info/time_within_train_step": 2.3537275791168213, "step": 2006} {"train_info/time_between_train_steps": 0.003144502639770508, "step": 2006} {"info/global_step": 2007, "train_info/time_within_train_step": 2.3540618419647217, "step": 2007} {"train_info/time_between_train_steps": 0.003165721893310547, "step": 2007} {"info/global_step": 2008, "train_info/time_within_train_step": 2.355365753173828, "step": 2008} {"train_info/time_between_train_steps": 0.003183126449584961, "step": 2008} {"info/global_step": 2009, "train_info/time_within_train_step": 2.3546698093414307, "step": 2009} {"train_info/time_between_train_steps": 0.003153562545776367, "step": 2009} {"info/global_step": 2010, "train_info/time_within_train_step": 2.355076313018799, "step": 2010} {"train_info/time_between_train_steps": 0.0031883716583251953, "step": 2010} {"info/global_step": 2011, "train_info/time_within_train_step": 2.354560613632202, "step": 2011} {"train_info/time_between_train_steps": 0.003228902816772461, "step": 2011} {"info/global_step": 2012, "train_info/time_within_train_step": 2.354607582092285, "step": 2012} {"train_info/time_between_train_steps": 0.003179311752319336, "step": 2012} {"info/global_step": 2013, "train_info/time_within_train_step": 2.3543858528137207, "step": 2013} {"train_info/time_between_train_steps": 0.0031518936157226562, "step": 2013} {"info/global_step": 2014, "train_info/time_within_train_step": 2.355067014694214, "step": 2014} {"train_info/time_between_train_steps": 0.0031647682189941406, "step": 2014} {"info/global_step": 2015, "train_info/time_within_train_step": 2.354250431060791, "step": 2015} {"train_info/time_between_train_steps": 0.0032067298889160156, "step": 2015} {"info/global_step": 2016, "train_info/time_within_train_step": 2.355786085128784, "step": 2016} {"train_info/time_between_train_steps": 0.003236055374145508, "step": 2016} {"info/global_step": 2017, "train_info/time_within_train_step": 2.3556578159332275, "step": 2017} {"train_info/time_between_train_steps": 0.0031735897064208984, "step": 2017} {"info/global_step": 2018, "train_info/time_within_train_step": 2.355929136276245, "step": 2018} {"train_info/time_between_train_steps": 0.0031538009643554688, "step": 2018} {"info/global_step": 2019, "train_info/time_within_train_step": 2.3569412231445312, "step": 2019} {"train_info/time_between_train_steps": 0.0031485557556152344, "step": 2019} {"info/global_step": 2020, "train_info/time_within_train_step": 2.3568670749664307, "step": 2020} {"train_info/time_between_train_steps": 0.003152608871459961, "step": 2020} {"info/global_step": 2021, "train_info/time_within_train_step": 2.3569467067718506, "step": 2021} {"train_info/time_between_train_steps": 0.0031616687774658203, "step": 2021} {"info/global_step": 2022, "train_info/time_within_train_step": 2.3571197986602783, "step": 2022} {"train_info/time_between_train_steps": 0.003147125244140625, "step": 2022} {"info/global_step": 2023, "train_info/time_within_train_step": 2.3561601638793945, "step": 2023} {"train_info/time_between_train_steps": 0.0031952857971191406, "step": 2023} {"info/global_step": 2024, "train_info/time_within_train_step": 2.3561198711395264, "step": 2024} {"train_info/time_between_train_steps": 0.0031485557556152344, "step": 2024} {"info/global_step": 2025, "train_info/time_within_train_step": 2.584789752960205, "step": 2025} {"train_info/time_between_train_steps": 0.0031576156616210938, "step": 2025} {"info/global_step": 2026, "train_info/time_within_train_step": 2.378674030303955, "step": 2026} {"train_info/time_between_train_steps": 0.003129720687866211, "step": 2026} {"info/global_step": 2027, "train_info/time_within_train_step": 2.355800151824951, "step": 2027} {"train_info/time_between_train_steps": 0.0031507015228271484, "step": 2027} {"info/global_step": 2028, "train_info/time_within_train_step": 2.355510711669922, "step": 2028} {"train_info/time_between_train_steps": 0.003158092498779297, "step": 2028} {"info/global_step": 2029, "train_info/time_within_train_step": 2.3565962314605713, "step": 2029} {"train_info/time_between_train_steps": 0.003175020217895508, "step": 2029} {"info/global_step": 2030, "train_info/time_within_train_step": 2.3559389114379883, "step": 2030} {"train_info/time_between_train_steps": 0.0063629150390625, "step": 2030} {"info/global_step": 2031, "train_info/time_within_train_step": 2.355012893676758, "step": 2031} {"train_info/time_between_train_steps": 0.0031440258026123047, "step": 2031} {"info/global_step": 2032, "train_info/time_within_train_step": 2.3555095195770264, "step": 2032} {"train_info/time_between_train_steps": 0.003179788589477539, "step": 2032} {"info/global_step": 2033, "train_info/time_within_train_step": 2.4953415393829346, "step": 2033} {"train_info/time_between_train_steps": 0.003170490264892578, "step": 2033} {"info/global_step": 2034, "train_info/time_within_train_step": 2.3559999465942383, "step": 2034} {"train_info/time_between_train_steps": 0.0032241344451904297, "step": 2034} {"info/global_step": 2035, "train_info/time_within_train_step": 2.3554069995880127, "step": 2035} {"train_info/time_between_train_steps": 0.0031890869140625, "step": 2035} {"info/global_step": 2036, "train_info/time_within_train_step": 2.356039047241211, "step": 2036} {"train_info/time_between_train_steps": 0.003216981887817383, "step": 2036} {"info/global_step": 2037, "train_info/time_within_train_step": 2.3567190170288086, "step": 2037} {"train_info/time_between_train_steps": 0.003173351287841797, "step": 2037} {"info/global_step": 2038, "train_info/time_within_train_step": 2.356269598007202, "step": 2038} {"train_info/time_between_train_steps": 0.0032002925872802734, "step": 2038} {"info/global_step": 2039, "train_info/time_within_train_step": 2.356482744216919, "step": 2039} {"train_info/time_between_train_steps": 0.0031409263610839844, "step": 2039} {"info/global_step": 2040, "train_info/time_within_train_step": 2.356161594390869, "step": 2040} {"train_info/time_between_train_steps": 0.003155231475830078, "step": 2040} {"info/global_step": 2041, "train_info/time_within_train_step": 2.356117010116577, "step": 2041} {"train_info/time_between_train_steps": 0.003234386444091797, "step": 2041} {"info/global_step": 2042, "train_info/time_within_train_step": 2.3557279109954834, "step": 2042} {"train_info/time_between_train_steps": 0.0032079219818115234, "step": 2042} {"info/global_step": 2043, "train_info/time_within_train_step": 2.355510711669922, "step": 2043} {"train_info/time_between_train_steps": 0.003210783004760742, "step": 2043} {"info/global_step": 2044, "train_info/time_within_train_step": 2.3899495601654053, "step": 2044} {"train_info/time_between_train_steps": 0.0032529830932617188, "step": 2044} {"info/global_step": 2045, "train_info/time_within_train_step": 2.3547072410583496, "step": 2045} {"train_info/time_between_train_steps": 0.0031585693359375, "step": 2045} {"info/global_step": 2046, "train_info/time_within_train_step": 2.3551485538482666, "step": 2046} {"train_info/time_between_train_steps": 0.0031583309173583984, "step": 2046} {"info/global_step": 2047, "train_info/time_within_train_step": 2.35579514503479, "step": 2047} {"train_info/time_between_train_steps": 0.0031697750091552734, "step": 2047} {"info/global_step": 2048, "train_info/time_within_train_step": 2.3612325191497803, "step": 2048} {"train_info/time_between_train_steps": 0.003210783004760742, "step": 2048} {"info/global_step": 2049, "train_info/time_within_train_step": 2.5883381366729736, "step": 2049} {"train_info/time_between_train_steps": 0.003190279006958008, "step": 2049} {"info/global_step": 2050, "train_info/time_within_train_step": 2.3564705848693848, "step": 2050} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 8708.0, "train_info/memory_max_reserved": 8708.0, "_timestamp": 1746257483, "_runtime": 5302}, "step": 2050} {"logs": {"train/loss": 3.8929, "train/learning_rate": 0.0002111111111111111, "train/epoch": 2.11, "_timestamp": 1746257483, "_runtime": 5302}, "step": 2050} {"train_info/time_between_train_steps": 0.024339675903320312, "step": 2050} {"info/global_step": 2051, "train_info/time_within_train_step": 2.354539632797241, "step": 2051} {"train_info/time_between_train_steps": 0.003192901611328125, "step": 2051} {"info/global_step": 2052, "train_info/time_within_train_step": 2.3549413681030273, "step": 2052} {"train_info/time_between_train_steps": 0.003329038619995117, "step": 2052} {"info/global_step": 2053, "train_info/time_within_train_step": 2.354872465133667, "step": 2053} {"train_info/time_between_train_steps": 0.003220081329345703, "step": 2053} {"info/global_step": 2054, "train_info/time_within_train_step": 2.35506010055542, "step": 2054} {"train_info/time_between_train_steps": 0.003175497055053711, "step": 2054} {"info/global_step": 2055, "train_info/time_within_train_step": 2.356382369995117, "step": 2055} {"train_info/time_between_train_steps": 0.0032014846801757812, "step": 2055} {"info/global_step": 2056, "train_info/time_within_train_step": 2.357060432434082, "step": 2056} {"train_info/time_between_train_steps": 0.0031926631927490234, "step": 2056} {"info/global_step": 2057, "train_info/time_within_train_step": 2.356350898742676, "step": 2057} {"train_info/time_between_train_steps": 0.003200531005859375, "step": 2057} {"info/global_step": 2058, "train_info/time_within_train_step": 2.35646915435791, "step": 2058} {"train_info/time_between_train_steps": 0.0031824111938476562, "step": 2058} {"info/global_step": 2059, "train_info/time_within_train_step": 2.355865955352783, "step": 2059} {"train_info/time_between_train_steps": 0.0032434463500976562, "step": 2059} {"info/global_step": 2060, "train_info/time_within_train_step": 2.3561999797821045, "step": 2060} {"train_info/time_between_train_steps": 0.0034623146057128906, "step": 2060} {"info/global_step": 2061, "train_info/time_within_train_step": 2.3570568561553955, "step": 2061} {"train_info/time_between_train_steps": 0.0033979415893554688, "step": 2061} {"info/global_step": 2062, "train_info/time_within_train_step": 2.3555257320404053, "step": 2062} {"train_info/time_between_train_steps": 0.0033512115478515625, "step": 2062} {"info/global_step": 2063, "train_info/time_within_train_step": 2.3559370040893555, "step": 2063} {"train_info/time_between_train_steps": 0.003343820571899414, "step": 2063} {"info/global_step": 2064, "train_info/time_within_train_step": 2.3551838397979736, "step": 2064} {"train_info/time_between_train_steps": 0.003346681594848633, "step": 2064} {"info/global_step": 2065, "train_info/time_within_train_step": 2.3920865058898926, "step": 2065} {"train_info/time_between_train_steps": 0.0034227371215820312, "step": 2065} {"info/global_step": 2066, "train_info/time_within_train_step": 2.3554015159606934, "step": 2066} {"train_info/time_between_train_steps": 0.003396749496459961, "step": 2066} {"info/global_step": 2067, "train_info/time_within_train_step": 2.355299949645996, "step": 2067} {"train_info/time_between_train_steps": 0.003391265869140625, "step": 2067} {"info/global_step": 2068, "train_info/time_within_train_step": 2.3561489582061768, "step": 2068} {"train_info/time_between_train_steps": 0.003305673599243164, "step": 2068} {"info/global_step": 2069, "train_info/time_within_train_step": 2.3568508625030518, "step": 2069} {"train_info/time_between_train_steps": 0.003390789031982422, "step": 2069} {"info/global_step": 2070, "train_info/time_within_train_step": 2.3554091453552246, "step": 2070} {"train_info/time_between_train_steps": 0.003396749496459961, "step": 2070} {"info/global_step": 2071, "train_info/time_within_train_step": 2.3546030521392822, "step": 2071} {"train_info/time_between_train_steps": 0.0033690929412841797, "step": 2071} {"info/global_step": 2072, "train_info/time_within_train_step": 2.355613946914673, "step": 2072} {"train_info/time_between_train_steps": 0.003398418426513672, "step": 2072} {"info/global_step": 2073, "train_info/time_within_train_step": 2.357114553451538, "step": 2073} {"train_info/time_between_train_steps": 0.0034837722778320312, "step": 2073} {"info/global_step": 2074, "train_info/time_within_train_step": 2.654001474380493, "step": 2074} {"train_info/time_between_train_steps": 0.0031890869140625, "step": 2074} {"info/global_step": 2075, "train_info/time_within_train_step": 2.3553526401519775, "step": 2075} {"train_info/time_between_train_steps": 0.0031681060791015625, "step": 2075} {"info/global_step": 2076, "train_info/time_within_train_step": 2.3547909259796143, "step": 2076} {"train_info/time_between_train_steps": 0.003229856491088867, "step": 2076} {"info/global_step": 2077, "train_info/time_within_train_step": 2.354555130004883, "step": 2077} {"train_info/time_between_train_steps": 0.003217458724975586, "step": 2077} {"info/global_step": 2078, "train_info/time_within_train_step": 2.3554136753082275, "step": 2078} {"train_info/time_between_train_steps": 0.0032122135162353516, "step": 2078} {"info/global_step": 2079, "train_info/time_within_train_step": 2.3555643558502197, "step": 2079} {"train_info/time_between_train_steps": 0.003195047378540039, "step": 2079} {"info/global_step": 2080, "train_info/time_within_train_step": 2.3553597927093506, "step": 2080} {"train_info/time_between_train_steps": 0.0031936168670654297, "step": 2080} {"info/global_step": 2081, "train_info/time_within_train_step": 2.3556020259857178, "step": 2081} {"train_info/time_between_train_steps": 0.003253936767578125, "step": 2081} {"info/global_step": 2082, "train_info/time_within_train_step": 2.3560571670532227, "step": 2082} {"train_info/time_between_train_steps": 0.003201723098754883, "step": 2082} {"info/global_step": 2083, "train_info/time_within_train_step": 2.3543460369110107, "step": 2083} {"train_info/time_between_train_steps": 0.0032901763916015625, "step": 2083} {"info/global_step": 2084, "train_info/time_within_train_step": 2.3554763793945312, "step": 2084} {"train_info/time_between_train_steps": 0.0032508373260498047, "step": 2084} {"info/global_step": 2085, "train_info/time_within_train_step": 2.3553340435028076, "step": 2085} {"train_info/time_between_train_steps": 0.003207683563232422, "step": 2085} {"info/global_step": 2086, "train_info/time_within_train_step": 2.3542168140411377, "step": 2086} {"train_info/time_between_train_steps": 0.0031998157501220703, "step": 2086} {"info/global_step": 2087, "train_info/time_within_train_step": 2.355257749557495, "step": 2087} {"train_info/time_between_train_steps": 0.0031821727752685547, "step": 2087} {"info/global_step": 2088, "train_info/time_within_train_step": 2.3567116260528564, "step": 2088} {"train_info/time_between_train_steps": 0.0031766891479492188, "step": 2088} {"info/global_step": 2089, "train_info/time_within_train_step": 2.3550381660461426, "step": 2089} {"train_info/time_between_train_steps": 0.003158092498779297, "step": 2089} {"info/global_step": 2090, "train_info/time_within_train_step": 2.3552746772766113, "step": 2090} {"train_info/time_between_train_steps": 0.006641387939453125, "step": 2090} {"info/global_step": 2091, "train_info/time_within_train_step": 2.3562421798706055, "step": 2091} {"train_info/time_between_train_steps": 0.006598949432373047, "step": 2091} {"info/global_step": 2092, "train_info/time_within_train_step": 2.354849338531494, "step": 2092} {"train_info/time_between_train_steps": 0.0065555572509765625, "step": 2092} {"info/global_step": 2093, "train_info/time_within_train_step": 2.354731798171997, "step": 2093} {"train_info/time_between_train_steps": 0.003298521041870117, "step": 2093} {"info/global_step": 2094, "train_info/time_within_train_step": 2.355363368988037, "step": 2094} {"train_info/time_between_train_steps": 0.006566047668457031, "step": 2094} {"info/global_step": 2095, "train_info/time_within_train_step": 2.3550467491149902, "step": 2095} {"train_info/time_between_train_steps": 0.1314840316772461, "step": 2095} {"info/global_step": 2096, "train_info/time_within_train_step": 2.3741250038146973, "step": 2096} {"train_info/time_between_train_steps": 0.003213644027709961, "step": 2096} {"info/global_step": 2097, "train_info/time_within_train_step": 2.35457181930542, "step": 2097} {"train_info/time_between_train_steps": 0.0032143592834472656, "step": 2097} {"info/global_step": 2098, "train_info/time_within_train_step": 2.3542563915252686, "step": 2098} {"train_info/time_between_train_steps": 0.003179788589477539, "step": 2098} {"info/global_step": 2099, "train_info/time_within_train_step": 2.5900683403015137, "step": 2099} {"train_info/time_between_train_steps": 0.0031821727752685547, "step": 2099} {"info/global_step": 2100, "train_info/time_within_train_step": 2.3548519611358643, "step": 2100} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 8708.0, "train_info/memory_max_reserved": 8708.0, "_timestamp": 1746257603, "_runtime": 5422}, "step": 2100} {"logs": {"train/loss": 3.8651, "train/learning_rate": 0.00019999999999999998, "train/epoch": 2.13, "_timestamp": 1746257603, "_runtime": 5422}, "step": 2100} {"train_info/time_between_train_steps": 15.055116891860962, "step": 2100} {"info/global_step": 2101, "train_info/time_within_train_step": 2.1963279247283936, "step": 2101} {"train_info/time_between_train_steps": 0.003222942352294922, "step": 2101} {"info/global_step": 2102, "train_info/time_within_train_step": 2.1823952198028564, "step": 2102} {"train_info/time_between_train_steps": 0.0031790733337402344, "step": 2102} {"info/global_step": 2103, "train_info/time_within_train_step": 2.2789456844329834, "step": 2103} {"train_info/time_between_train_steps": 0.0032057762145996094, "step": 2103} {"info/global_step": 2104, "train_info/time_within_train_step": 2.3478140830993652, "step": 2104} {"train_info/time_between_train_steps": 0.003165721893310547, "step": 2104} {"info/global_step": 2105, "train_info/time_within_train_step": 2.3516435623168945, "step": 2105} {"train_info/time_between_train_steps": 0.0031843185424804688, "step": 2105} {"info/global_step": 2106, "train_info/time_within_train_step": 2.3548920154571533, "step": 2106} {"train_info/time_between_train_steps": 0.0032150745391845703, "step": 2106} {"info/global_step": 2107, "train_info/time_within_train_step": 2.3549835681915283, "step": 2107} {"train_info/time_between_train_steps": 0.0032072067260742188, "step": 2107} {"info/global_step": 2108, "train_info/time_within_train_step": 2.355109453201294, "step": 2108} {"train_info/time_between_train_steps": 0.00323486328125, "step": 2108} {"info/global_step": 2109, "train_info/time_within_train_step": 2.355365037918091, "step": 2109} {"train_info/time_between_train_steps": 0.0031893253326416016, "step": 2109} {"info/global_step": 2110, "train_info/time_within_train_step": 2.3558521270751953, "step": 2110} {"train_info/time_between_train_steps": 0.0031867027282714844, "step": 2110} {"info/global_step": 2111, "train_info/time_within_train_step": 2.356444835662842, "step": 2111} {"train_info/time_between_train_steps": 0.003162860870361328, "step": 2111} {"info/global_step": 2112, "train_info/time_within_train_step": 2.3568904399871826, "step": 2112} {"train_info/time_between_train_steps": 0.0031642913818359375, "step": 2112} {"info/global_step": 2113, "train_info/time_within_train_step": 2.356046438217163, "step": 2113} {"train_info/time_between_train_steps": 0.003196239471435547, "step": 2113} {"info/global_step": 2114, "train_info/time_within_train_step": 2.358102560043335, "step": 2114} {"train_info/time_between_train_steps": 0.0031931400299072266, "step": 2114} {"info/global_step": 2115, "train_info/time_within_train_step": 2.3566644191741943, "step": 2115} {"train_info/time_between_train_steps": 0.003187894821166992, "step": 2115} {"info/global_step": 2116, "train_info/time_within_train_step": 2.3563151359558105, "step": 2116} {"train_info/time_between_train_steps": 0.0032405853271484375, "step": 2116} {"info/global_step": 2117, "train_info/time_within_train_step": 2.357044219970703, "step": 2117} {"train_info/time_between_train_steps": 0.0031821727752685547, "step": 2117} {"info/global_step": 2118, "train_info/time_within_train_step": 2.3559775352478027, "step": 2118} {"train_info/time_between_train_steps": 0.003179788589477539, "step": 2118} {"info/global_step": 2119, "train_info/time_within_train_step": 2.3565001487731934, "step": 2119} {"train_info/time_between_train_steps": 0.003206491470336914, "step": 2119} {"info/global_step": 2120, "train_info/time_within_train_step": 2.3565478324890137, "step": 2120} {"train_info/time_between_train_steps": 0.003211498260498047, "step": 2120} {"info/global_step": 2121, "train_info/time_within_train_step": 2.3570711612701416, "step": 2121} {"train_info/time_between_train_steps": 0.0031919479370117188, "step": 2121} {"info/global_step": 2122, "train_info/time_within_train_step": 2.568153142929077, "step": 2122} {"train_info/time_between_train_steps": 0.003265857696533203, "step": 2122} {"info/global_step": 2123, "train_info/time_within_train_step": 2.356599807739258, "step": 2123} {"train_info/time_between_train_steps": 0.0031747817993164062, "step": 2123} {"info/global_step": 2124, "train_info/time_within_train_step": 2.357292413711548, "step": 2124} {"train_info/time_between_train_steps": 0.003171205520629883, "step": 2124} {"info/global_step": 2125, "train_info/time_within_train_step": 2.3551323413848877, "step": 2125} {"train_info/time_between_train_steps": 0.0032219886779785156, "step": 2125} {"info/global_step": 2126, "train_info/time_within_train_step": 2.3572144508361816, "step": 2126} {"train_info/time_between_train_steps": 0.003186464309692383, "step": 2126} {"info/global_step": 2127, "train_info/time_within_train_step": 2.356428384780884, "step": 2127} {"train_info/time_between_train_steps": 0.0032036304473876953, "step": 2127} {"info/global_step": 2128, "train_info/time_within_train_step": 2.357442617416382, "step": 2128} {"train_info/time_between_train_steps": 0.003213644027709961, "step": 2128} {"info/global_step": 2129, "train_info/time_within_train_step": 2.3567590713500977, "step": 2129} {"train_info/time_between_train_steps": 0.0031752586364746094, "step": 2129} {"info/global_step": 2130, "train_info/time_within_train_step": 2.356736183166504, "step": 2130} {"train_info/time_between_train_steps": 0.0031905174255371094, "step": 2130} {"info/global_step": 2131, "train_info/time_within_train_step": 2.3574116230010986, "step": 2131} {"train_info/time_between_train_steps": 0.0031664371490478516, "step": 2131} {"info/global_step": 2132, "train_info/time_within_train_step": 2.356567859649658, "step": 2132} {"train_info/time_between_train_steps": 0.0032236576080322266, "step": 2132} {"info/global_step": 2133, "train_info/time_within_train_step": 2.355928897857666, "step": 2133} {"train_info/time_between_train_steps": 0.003209829330444336, "step": 2133} {"info/global_step": 2134, "train_info/time_within_train_step": 2.3566834926605225, "step": 2134} {"train_info/time_between_train_steps": 0.0032203197479248047, "step": 2134} {"info/global_step": 2135, "train_info/time_within_train_step": 2.3560638427734375, "step": 2135} {"train_info/time_between_train_steps": 0.0031974315643310547, "step": 2135} {"info/global_step": 2136, "train_info/time_within_train_step": 2.3562982082366943, "step": 2136} {"train_info/time_between_train_steps": 0.0031533241271972656, "step": 2136} {"info/global_step": 2137, "train_info/time_within_train_step": 2.3560519218444824, "step": 2137} {"train_info/time_between_train_steps": 0.0031707286834716797, "step": 2137} {"info/global_step": 2138, "train_info/time_within_train_step": 2.3567914962768555, "step": 2138} {"train_info/time_between_train_steps": 0.003259897232055664, "step": 2138} {"info/global_step": 2139, "train_info/time_within_train_step": 2.3550589084625244, "step": 2139} {"train_info/time_between_train_steps": 0.0050754547119140625, "step": 2139} {"info/global_step": 2140, "train_info/time_within_train_step": 2.3570430278778076, "step": 2140} {"train_info/time_between_train_steps": 0.003173828125, "step": 2140} {"info/global_step": 2141, "train_info/time_within_train_step": 2.357041597366333, "step": 2141} {"train_info/time_between_train_steps": 0.0031991004943847656, "step": 2141} {"info/global_step": 2142, "train_info/time_within_train_step": 2.3563663959503174, "step": 2142} {"train_info/time_between_train_steps": 0.003163576126098633, "step": 2142} {"info/global_step": 2143, "train_info/time_within_train_step": 2.3620288372039795, "step": 2143} {"train_info/time_between_train_steps": 0.0031545162200927734, "step": 2143} {"info/global_step": 2144, "train_info/time_within_train_step": 2.3570590019226074, "step": 2144} {"train_info/time_between_train_steps": 0.003147602081298828, "step": 2144} {"info/global_step": 2145, "train_info/time_within_train_step": 2.3560919761657715, "step": 2145} {"train_info/time_between_train_steps": 0.0032415390014648438, "step": 2145} {"info/global_step": 2146, "train_info/time_within_train_step": 2.355759620666504, "step": 2146} {"train_info/time_between_train_steps": 0.0032815933227539062, "step": 2146} {"info/global_step": 2147, "train_info/time_within_train_step": 2.3563618659973145, "step": 2147} {"train_info/time_between_train_steps": 0.0031633377075195312, "step": 2147} {"info/global_step": 2148, "train_info/time_within_train_step": 2.5969715118408203, "step": 2148} {"train_info/time_between_train_steps": 0.0032265186309814453, "step": 2148} {"info/global_step": 2149, "train_info/time_within_train_step": 2.3556134700775146, "step": 2149} {"train_info/time_between_train_steps": 0.0031757354736328125, "step": 2149} {"info/global_step": 2150, "train_info/time_within_train_step": 2.3569204807281494, "step": 2150} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 8708.0, "train_info/memory_max_reserved": 8708.0, "_timestamp": 1746257737, "_runtime": 5556}, "step": 2150} {"logs": {"train/loss": 3.847, "train/learning_rate": 0.00018888888888888888, "train/epoch": 2.14, "_timestamp": 1746257737, "_runtime": 5556}, "step": 2150} {"train_info/time_between_train_steps": 0.02492547035217285, "step": 2150} {"info/global_step": 2151, "train_info/time_within_train_step": 2.3571979999542236, "step": 2151} {"train_info/time_between_train_steps": 0.003200531005859375, "step": 2151} {"info/global_step": 2152, "train_info/time_within_train_step": 2.356919050216675, "step": 2152} {"train_info/time_between_train_steps": 0.003175020217895508, "step": 2152} {"info/global_step": 2153, "train_info/time_within_train_step": 2.356419801712036, "step": 2153} {"train_info/time_between_train_steps": 0.0031578540802001953, "step": 2153} {"info/global_step": 2154, "train_info/time_within_train_step": 2.3567287921905518, "step": 2154} {"train_info/time_between_train_steps": 0.003161907196044922, "step": 2154} {"info/global_step": 2155, "train_info/time_within_train_step": 2.3560919761657715, "step": 2155} {"train_info/time_between_train_steps": 0.0031599998474121094, "step": 2155} {"info/global_step": 2156, "train_info/time_within_train_step": 2.355656385421753, "step": 2156} {"train_info/time_between_train_steps": 0.003218412399291992, "step": 2156} {"info/global_step": 2157, "train_info/time_within_train_step": 2.355593204498291, "step": 2157} {"train_info/time_between_train_steps": 0.003344297409057617, "step": 2157} {"info/global_step": 2158, "train_info/time_within_train_step": 2.4792592525482178, "step": 2158} {"train_info/time_between_train_steps": 0.0032341480255126953, "step": 2158} {"info/global_step": 2159, "train_info/time_within_train_step": 2.3566243648529053, "step": 2159} {"train_info/time_between_train_steps": 0.003177642822265625, "step": 2159} {"info/global_step": 2160, "train_info/time_within_train_step": 2.356764793395996, "step": 2160} {"train_info/time_between_train_steps": 0.003197193145751953, "step": 2160} {"info/global_step": 2161, "train_info/time_within_train_step": 2.3558921813964844, "step": 2161} {"train_info/time_between_train_steps": 0.003200531005859375, "step": 2161} {"info/global_step": 2162, "train_info/time_within_train_step": 2.354901075363159, "step": 2162} {"train_info/time_between_train_steps": 0.003169536590576172, "step": 2162} {"info/global_step": 2163, "train_info/time_within_train_step": 2.3553013801574707, "step": 2163} {"train_info/time_between_train_steps": 0.003530740737915039, "step": 2163} {"info/global_step": 2164, "train_info/time_within_train_step": 2.356088161468506, "step": 2164} {"train_info/time_between_train_steps": 0.00342559814453125, "step": 2164} {"info/global_step": 2165, "train_info/time_within_train_step": 2.3560543060302734, "step": 2165} {"train_info/time_between_train_steps": 0.003420591354370117, "step": 2165} {"info/global_step": 2166, "train_info/time_within_train_step": 2.356177806854248, "step": 2166} {"train_info/time_between_train_steps": 0.003421783447265625, "step": 2166} {"info/global_step": 2167, "train_info/time_within_train_step": 2.3572776317596436, "step": 2167} {"train_info/time_between_train_steps": 0.0034062862396240234, "step": 2167} {"info/global_step": 2168, "train_info/time_within_train_step": 2.3563730716705322, "step": 2168} {"train_info/time_between_train_steps": 0.0034554004669189453, "step": 2168} {"info/global_step": 2169, "train_info/time_within_train_step": 2.3567628860473633, "step": 2169} {"train_info/time_between_train_steps": 0.003457307815551758, "step": 2169} {"info/global_step": 2170, "train_info/time_within_train_step": 2.357008457183838, "step": 2170} {"train_info/time_between_train_steps": 0.003487110137939453, "step": 2170} {"info/global_step": 2171, "train_info/time_within_train_step": 2.35615873336792, "step": 2171} {"train_info/time_between_train_steps": 0.0034203529357910156, "step": 2171} {"info/global_step": 2172, "train_info/time_within_train_step": 2.3567471504211426, "step": 2172} {"train_info/time_between_train_steps": 0.0034165382385253906, "step": 2172} {"info/global_step": 2173, "train_info/time_within_train_step": 2.6795265674591064, "step": 2173} {"train_info/time_between_train_steps": 0.003190755844116211, "step": 2173} {"info/global_step": 2174, "train_info/time_within_train_step": 2.3551690578460693, "step": 2174} {"train_info/time_between_train_steps": 0.0032248497009277344, "step": 2174} {"info/global_step": 2175, "train_info/time_within_train_step": 2.356193780899048, "step": 2175} {"train_info/time_between_train_steps": 0.0032198429107666016, "step": 2175} {"info/global_step": 2176, "train_info/time_within_train_step": 2.3555445671081543, "step": 2176} {"train_info/time_between_train_steps": 0.0032401084899902344, "step": 2176} {"info/global_step": 2177, "train_info/time_within_train_step": 2.3546206951141357, "step": 2177} {"train_info/time_between_train_steps": 0.0032291412353515625, "step": 2177} {"info/global_step": 2178, "train_info/time_within_train_step": 2.3557772636413574, "step": 2178} {"train_info/time_between_train_steps": 0.003226041793823242, "step": 2178} {"info/global_step": 2179, "train_info/time_within_train_step": 2.356867790222168, "step": 2179} {"train_info/time_between_train_steps": 0.003201723098754883, "step": 2179} {"info/global_step": 2180, "train_info/time_within_train_step": 2.3558709621429443, "step": 2180} {"train_info/time_between_train_steps": 0.0031981468200683594, "step": 2180} {"info/global_step": 2181, "train_info/time_within_train_step": 2.3562369346618652, "step": 2181} {"train_info/time_between_train_steps": 0.0032584667205810547, "step": 2181} {"info/global_step": 2182, "train_info/time_within_train_step": 2.356752872467041, "step": 2182} {"train_info/time_between_train_steps": 0.0032401084899902344, "step": 2182} {"info/global_step": 2183, "train_info/time_within_train_step": 2.355729341506958, "step": 2183} {"train_info/time_between_train_steps": 0.0032570362091064453, "step": 2183} {"info/global_step": 2184, "train_info/time_within_train_step": 2.356865644454956, "step": 2184} {"train_info/time_between_train_steps": 0.0032126903533935547, "step": 2184} {"info/global_step": 2185, "train_info/time_within_train_step": 2.356351613998413, "step": 2185} {"train_info/time_between_train_steps": 0.003198862075805664, "step": 2185} {"info/global_step": 2186, "train_info/time_within_train_step": 2.3556151390075684, "step": 2186} {"train_info/time_between_train_steps": 0.0032405853271484375, "step": 2186} {"info/global_step": 2187, "train_info/time_within_train_step": 2.3570239543914795, "step": 2187} {"train_info/time_between_train_steps": 0.0032281875610351562, "step": 2187} {"info/global_step": 2188, "train_info/time_within_train_step": 2.3558883666992188, "step": 2188} {"train_info/time_between_train_steps": 0.0032320022583007812, "step": 2188} {"info/global_step": 2189, "train_info/time_within_train_step": 2.390212059020996, "step": 2189} {"train_info/time_between_train_steps": 0.0032720565795898438, "step": 2189} {"info/global_step": 2190, "train_info/time_within_train_step": 2.3568506240844727, "step": 2190} {"train_info/time_between_train_steps": 0.003244638442993164, "step": 2190} {"info/global_step": 2191, "train_info/time_within_train_step": 2.3559443950653076, "step": 2191} {"train_info/time_between_train_steps": 0.003302335739135742, "step": 2191} {"info/global_step": 2192, "train_info/time_within_train_step": 2.3563365936279297, "step": 2192} {"train_info/time_between_train_steps": 0.003429889678955078, "step": 2192} {"info/global_step": 2193, "train_info/time_within_train_step": 2.360846757888794, "step": 2193} {"train_info/time_between_train_steps": 0.0034246444702148438, "step": 2193} {"info/global_step": 2194, "train_info/time_within_train_step": 2.356414318084717, "step": 2194} {"train_info/time_between_train_steps": 0.003485441207885742, "step": 2194} {"info/global_step": 2195, "train_info/time_within_train_step": 2.3564553260803223, "step": 2195} {"train_info/time_between_train_steps": 0.0033843517303466797, "step": 2195} {"info/global_step": 2196, "train_info/time_within_train_step": 2.356397867202759, "step": 2196} {"train_info/time_between_train_steps": 0.003361940383911133, "step": 2196} {"info/global_step": 2197, "train_info/time_within_train_step": 2.3790810108184814, "step": 2197} {"train_info/time_between_train_steps": 0.003390789031982422, "step": 2197} {"info/global_step": 2198, "train_info/time_within_train_step": 2.667217493057251, "step": 2198} {"train_info/time_between_train_steps": 0.003270387649536133, "step": 2198} {"info/global_step": 2199, "train_info/time_within_train_step": 2.3566665649414062, "step": 2199} {"train_info/time_between_train_steps": 0.0038678646087646484, "step": 2199} {"info/global_step": 2200, "train_info/time_within_train_step": 2.3556103706359863, "step": 2200} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 8708.0, "train_info/memory_max_reserved": 8708.0, "_timestamp": 1746257857, "_runtime": 5676}, "step": 2200} {"logs": {"train/loss": 3.8403, "train/learning_rate": 0.00017777777777777776, "train/epoch": 2.16, "_timestamp": 1746257857, "_runtime": 5676}, "step": 2200} {"train_info/time_between_train_steps": 15.142832040786743, "step": 2200} {"info/global_step": 2201, "train_info/time_within_train_step": 2.1987597942352295, "step": 2201} {"train_info/time_between_train_steps": 0.0032455921173095703, "step": 2201} {"info/global_step": 2202, "train_info/time_within_train_step": 2.181131601333618, "step": 2202} {"train_info/time_between_train_steps": 0.003222227096557617, "step": 2202} {"info/global_step": 2203, "train_info/time_within_train_step": 2.2615644931793213, "step": 2203} {"train_info/time_between_train_steps": 0.003232717514038086, "step": 2203} {"info/global_step": 2204, "train_info/time_within_train_step": 2.349602222442627, "step": 2204} {"train_info/time_between_train_steps": 0.003273487091064453, "step": 2204} {"info/global_step": 2205, "train_info/time_within_train_step": 2.352391481399536, "step": 2205} {"train_info/time_between_train_steps": 0.0032362937927246094, "step": 2205} {"info/global_step": 2206, "train_info/time_within_train_step": 2.3547544479370117, "step": 2206} {"train_info/time_between_train_steps": 0.0031805038452148438, "step": 2206} {"info/global_step": 2207, "train_info/time_within_train_step": 2.3540661334991455, "step": 2207} {"train_info/time_between_train_steps": 0.0032241344451904297, "step": 2207} {"info/global_step": 2208, "train_info/time_within_train_step": 2.3865668773651123, "step": 2208} {"train_info/time_between_train_steps": 0.00324249267578125, "step": 2208} {"info/global_step": 2209, "train_info/time_within_train_step": 2.3549745082855225, "step": 2209} {"train_info/time_between_train_steps": 0.0032186508178710938, "step": 2209} {"info/global_step": 2210, "train_info/time_within_train_step": 2.355581045150757, "step": 2210} {"train_info/time_between_train_steps": 0.00321197509765625, "step": 2210} {"info/global_step": 2211, "train_info/time_within_train_step": 2.3549652099609375, "step": 2211} {"train_info/time_between_train_steps": 0.0032923221588134766, "step": 2211} {"info/global_step": 2212, "train_info/time_within_train_step": 2.3552308082580566, "step": 2212} {"train_info/time_between_train_steps": 0.0032820701599121094, "step": 2212} {"info/global_step": 2213, "train_info/time_within_train_step": 2.3561744689941406, "step": 2213} {"train_info/time_between_train_steps": 0.003213167190551758, "step": 2213} {"info/global_step": 2214, "train_info/time_within_train_step": 2.3559021949768066, "step": 2214} {"train_info/time_between_train_steps": 0.0032460689544677734, "step": 2214} {"info/global_step": 2215, "train_info/time_within_train_step": 2.356004476547241, "step": 2215} {"train_info/time_between_train_steps": 0.0031952857971191406, "step": 2215} {"info/global_step": 2216, "train_info/time_within_train_step": 2.3786189556121826, "step": 2216} {"train_info/time_between_train_steps": 0.0032482147216796875, "step": 2216} {"info/global_step": 2217, "train_info/time_within_train_step": 2.3554368019104004, "step": 2217} {"train_info/time_between_train_steps": 0.003228902816772461, "step": 2217} {"info/global_step": 2218, "train_info/time_within_train_step": 2.3555147647857666, "step": 2218} {"train_info/time_between_train_steps": 0.003245830535888672, "step": 2218} {"info/global_step": 2219, "train_info/time_within_train_step": 2.3564610481262207, "step": 2219} {"train_info/time_between_train_steps": 0.0031905174255371094, "step": 2219} {"info/global_step": 2220, "train_info/time_within_train_step": 2.356109619140625, "step": 2220} {"train_info/time_between_train_steps": 0.1096963882446289, "step": 2220} {"info/global_step": 2221, "train_info/time_within_train_step": 2.357252359390259, "step": 2221} {"train_info/time_between_train_steps": 0.003541707992553711, "step": 2221} {"info/global_step": 2222, "train_info/time_within_train_step": 2.356165647506714, "step": 2222} {"train_info/time_between_train_steps": 0.003225564956665039, "step": 2222} {"info/global_step": 2223, "train_info/time_within_train_step": 2.6075663566589355, "step": 2223} {"train_info/time_between_train_steps": 0.0032362937927246094, "step": 2223} {"info/global_step": 2224, "train_info/time_within_train_step": 2.356353998184204, "step": 2224} {"train_info/time_between_train_steps": 0.00322723388671875, "step": 2224} {"info/global_step": 2225, "train_info/time_within_train_step": 2.3556485176086426, "step": 2225} {"train_info/time_between_train_steps": 0.0032012462615966797, "step": 2225} {"info/global_step": 2226, "train_info/time_within_train_step": 2.356797695159912, "step": 2226} {"train_info/time_between_train_steps": 0.0032050609588623047, "step": 2226} {"info/global_step": 2227, "train_info/time_within_train_step": 2.3570516109466553, "step": 2227} {"train_info/time_between_train_steps": 0.003181934356689453, "step": 2227} {"info/global_step": 2228, "train_info/time_within_train_step": 2.35669207572937, "step": 2228} {"train_info/time_between_train_steps": 0.003183603286743164, "step": 2228} {"info/global_step": 2229, "train_info/time_within_train_step": 2.3940327167510986, "step": 2229} {"train_info/time_between_train_steps": 0.003206014633178711, "step": 2229} {"info/global_step": 2230, "train_info/time_within_train_step": 2.3563332557678223, "step": 2230} {"train_info/time_between_train_steps": 0.0032656192779541016, "step": 2230} {"info/global_step": 2231, "train_info/time_within_train_step": 2.356844902038574, "step": 2231} {"train_info/time_between_train_steps": 0.0032110214233398438, "step": 2231} {"info/global_step": 2232, "train_info/time_within_train_step": 2.357111692428589, "step": 2232} {"train_info/time_between_train_steps": 0.0032470226287841797, "step": 2232} {"info/global_step": 2233, "train_info/time_within_train_step": 2.3561954498291016, "step": 2233} {"train_info/time_between_train_steps": 0.0032205581665039062, "step": 2233} {"info/global_step": 2234, "train_info/time_within_train_step": 2.3557991981506348, "step": 2234} {"train_info/time_between_train_steps": 0.0031800270080566406, "step": 2234} {"info/global_step": 2235, "train_info/time_within_train_step": 2.3553431034088135, "step": 2235} {"train_info/time_between_train_steps": 0.003268718719482422, "step": 2235} {"info/global_step": 2236, "train_info/time_within_train_step": 2.356323719024658, "step": 2236} {"train_info/time_between_train_steps": 0.0032567977905273438, "step": 2236} {"info/global_step": 2237, "train_info/time_within_train_step": 2.360250234603882, "step": 2237} {"train_info/time_between_train_steps": 0.003219127655029297, "step": 2237} {"info/global_step": 2238, "train_info/time_within_train_step": 2.355539083480835, "step": 2238} {"train_info/time_between_train_steps": 0.0031926631927490234, "step": 2238} {"info/global_step": 2239, "train_info/time_within_train_step": 2.3554811477661133, "step": 2239} {"train_info/time_between_train_steps": 0.003179311752319336, "step": 2239} {"info/global_step": 2240, "train_info/time_within_train_step": 2.355381965637207, "step": 2240} {"train_info/time_between_train_steps": 0.0033991336822509766, "step": 2240} {"info/global_step": 2241, "train_info/time_within_train_step": 2.355506658554077, "step": 2241} {"train_info/time_between_train_steps": 0.0032863616943359375, "step": 2241} {"info/global_step": 2242, "train_info/time_within_train_step": 2.3553287982940674, "step": 2242} {"train_info/time_between_train_steps": 0.003246307373046875, "step": 2242} {"info/global_step": 2243, "train_info/time_within_train_step": 2.356039047241211, "step": 2243} {"train_info/time_between_train_steps": 0.0032417774200439453, "step": 2243} {"info/global_step": 2244, "train_info/time_within_train_step": 2.3561575412750244, "step": 2244} {"train_info/time_between_train_steps": 0.0031821727752685547, "step": 2244} {"info/global_step": 2245, "train_info/time_within_train_step": 2.355247974395752, "step": 2245} {"train_info/time_between_train_steps": 0.0031790733337402344, "step": 2245} {"info/global_step": 2246, "train_info/time_within_train_step": 2.3555285930633545, "step": 2246} {"train_info/time_between_train_steps": 0.0031614303588867188, "step": 2246} {"info/global_step": 2247, "train_info/time_within_train_step": 2.3545138835906982, "step": 2247} {"train_info/time_between_train_steps": 0.003168821334838867, "step": 2247} {"info/global_step": 2248, "train_info/time_within_train_step": 2.5989561080932617, "step": 2248} {"train_info/time_between_train_steps": 0.003244161605834961, "step": 2248} {"info/global_step": 2249, "train_info/time_within_train_step": 2.895986318588257, "step": 2249} {"train_info/time_between_train_steps": 0.003236532211303711, "step": 2249} {"info/global_step": 2250, "train_info/time_within_train_step": 2.355314016342163, "step": 2250} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 8708.0, "train_info/memory_max_reserved": 8708.0, "_timestamp": 1746257992, "_runtime": 5811}, "step": 2250} {"logs": {"train/loss": 3.8203, "train/learning_rate": 0.00016666666666666666, "train/epoch": 2.18, "_timestamp": 1746257992, "_runtime": 5811}, "step": 2250} {"train_info/time_between_train_steps": 0.024729490280151367, "step": 2250} {"info/global_step": 2251, "train_info/time_within_train_step": 2.356224298477173, "step": 2251} {"train_info/time_between_train_steps": 0.0032362937927246094, "step": 2251} {"info/global_step": 2252, "train_info/time_within_train_step": 2.3556649684906006, "step": 2252} {"train_info/time_between_train_steps": 0.0032317638397216797, "step": 2252} {"info/global_step": 2253, "train_info/time_within_train_step": 2.3555846214294434, "step": 2253} {"train_info/time_between_train_steps": 0.003203868865966797, "step": 2253} {"info/global_step": 2254, "train_info/time_within_train_step": 2.35483455657959, "step": 2254} {"train_info/time_between_train_steps": 0.0031900405883789062, "step": 2254} {"info/global_step": 2255, "train_info/time_within_train_step": 2.3555893898010254, "step": 2255} {"train_info/time_between_train_steps": 0.0031921863555908203, "step": 2255} {"info/global_step": 2256, "train_info/time_within_train_step": 2.3550643920898438, "step": 2256} {"train_info/time_between_train_steps": 0.0031614303588867188, "step": 2256} {"info/global_step": 2257, "train_info/time_within_train_step": 2.355473279953003, "step": 2257} {"train_info/time_between_train_steps": 0.003179311752319336, "step": 2257} {"info/global_step": 2258, "train_info/time_within_train_step": 2.3546628952026367, "step": 2258} {"train_info/time_between_train_steps": 0.00322723388671875, "step": 2258} {"info/global_step": 2259, "train_info/time_within_train_step": 2.354524850845337, "step": 2259} {"train_info/time_between_train_steps": 0.0032820701599121094, "step": 2259} {"info/global_step": 2260, "train_info/time_within_train_step": 2.3555996417999268, "step": 2260} {"train_info/time_between_train_steps": 0.0031960010528564453, "step": 2260} {"info/global_step": 2261, "train_info/time_within_train_step": 2.354631185531616, "step": 2261} {"train_info/time_between_train_steps": 0.0031795501708984375, "step": 2261} {"info/global_step": 2262, "train_info/time_within_train_step": 2.355152130126953, "step": 2262} {"train_info/time_between_train_steps": 0.0031919479370117188, "step": 2262} {"info/global_step": 2263, "train_info/time_within_train_step": 2.3553435802459717, "step": 2263} {"train_info/time_between_train_steps": 0.0031630992889404297, "step": 2263} {"info/global_step": 2264, "train_info/time_within_train_step": 2.356886148452759, "step": 2264} {"train_info/time_between_train_steps": 0.003224611282348633, "step": 2264} {"info/global_step": 2265, "train_info/time_within_train_step": 2.3559017181396484, "step": 2265} {"train_info/time_between_train_steps": 0.0032334327697753906, "step": 2265} {"info/global_step": 2266, "train_info/time_within_train_step": 2.3555848598480225, "step": 2266} {"train_info/time_between_train_steps": 0.0032396316528320312, "step": 2266} {"info/global_step": 2267, "train_info/time_within_train_step": 2.3546791076660156, "step": 2267} {"train_info/time_between_train_steps": 0.003192901611328125, "step": 2267} {"info/global_step": 2268, "train_info/time_within_train_step": 2.3738226890563965, "step": 2268} {"train_info/time_between_train_steps": 0.002885580062866211, "step": 2268} {"info/global_step": 2269, "train_info/time_within_train_step": 2.3548660278320312, "step": 2269} {"train_info/time_between_train_steps": 0.002887725830078125, "step": 2269} {"info/global_step": 2270, "train_info/time_within_train_step": 2.3541314601898193, "step": 2270} {"train_info/time_between_train_steps": 0.0028972625732421875, "step": 2270} {"info/global_step": 2271, "train_info/time_within_train_step": 2.353592872619629, "step": 2271} {"train_info/time_between_train_steps": 0.0029168128967285156, "step": 2271} {"info/global_step": 2272, "train_info/time_within_train_step": 2.3556935787200928, "step": 2272} {"train_info/time_between_train_steps": 0.0030176639556884766, "step": 2272} {"info/global_step": 2273, "train_info/time_within_train_step": 2.354226589202881, "step": 2273} {"train_info/time_between_train_steps": 0.0028984546661376953, "step": 2273} {"info/global_step": 2274, "train_info/time_within_train_step": 2.5718140602111816, "step": 2274} {"train_info/time_between_train_steps": 0.0029234886169433594, "step": 2274} {"info/global_step": 2275, "train_info/time_within_train_step": 2.354276180267334, "step": 2275} {"train_info/time_between_train_steps": 0.0029206275939941406, "step": 2275} {"info/global_step": 2276, "train_info/time_within_train_step": 2.3533236980438232, "step": 2276} {"train_info/time_between_train_steps": 0.0029754638671875, "step": 2276} {"info/global_step": 2277, "train_info/time_within_train_step": 2.3539581298828125, "step": 2277} {"train_info/time_between_train_steps": 0.0029184818267822266, "step": 2277} {"info/global_step": 2278, "train_info/time_within_train_step": 2.3543806076049805, "step": 2278} {"train_info/time_between_train_steps": 0.0029022693634033203, "step": 2278} {"info/global_step": 2279, "train_info/time_within_train_step": 2.3917770385742188, "step": 2279} {"train_info/time_between_train_steps": 0.0029053688049316406, "step": 2279} {"info/global_step": 2280, "train_info/time_within_train_step": 2.353905200958252, "step": 2280} {"train_info/time_between_train_steps": 0.002897977828979492, "step": 2280} {"info/global_step": 2281, "train_info/time_within_train_step": 2.354234218597412, "step": 2281} {"train_info/time_between_train_steps": 0.0028815269470214844, "step": 2281} {"info/global_step": 2282, "train_info/time_within_train_step": 2.35404372215271, "step": 2282} {"train_info/time_between_train_steps": 0.0029010772705078125, "step": 2282} {"info/global_step": 2283, "train_info/time_within_train_step": 2.3532462120056152, "step": 2283} {"train_info/time_between_train_steps": 0.002953052520751953, "step": 2283} {"info/global_step": 2284, "train_info/time_within_train_step": 2.3544511795043945, "step": 2284} {"train_info/time_between_train_steps": 0.0029675960540771484, "step": 2284} {"info/global_step": 2285, "train_info/time_within_train_step": 2.3542113304138184, "step": 2285} {"train_info/time_between_train_steps": 0.002893209457397461, "step": 2285} {"info/global_step": 2286, "train_info/time_within_train_step": 2.3534743785858154, "step": 2286} {"train_info/time_between_train_steps": 0.0029222965240478516, "step": 2286} {"info/global_step": 2287, "train_info/time_within_train_step": 2.358891248703003, "step": 2287} {"train_info/time_between_train_steps": 0.0028853416442871094, "step": 2287} {"info/global_step": 2288, "train_info/time_within_train_step": 2.3545725345611572, "step": 2288} {"train_info/time_between_train_steps": 0.002891063690185547, "step": 2288} {"info/global_step": 2289, "train_info/time_within_train_step": 2.3536760807037354, "step": 2289} {"train_info/time_between_train_steps": 0.002920389175415039, "step": 2289} {"info/global_step": 2290, "train_info/time_within_train_step": 2.35306715965271, "step": 2290} {"train_info/time_between_train_steps": 0.002899169921875, "step": 2290} {"info/global_step": 2291, "train_info/time_within_train_step": 2.3535478115081787, "step": 2291} {"train_info/time_between_train_steps": 0.0029478073120117188, "step": 2291} {"info/global_step": 2292, "train_info/time_within_train_step": 2.3537251949310303, "step": 2292} {"train_info/time_between_train_steps": 0.002900838851928711, "step": 2292} {"info/global_step": 2293, "train_info/time_within_train_step": 2.3539228439331055, "step": 2293} {"train_info/time_between_train_steps": 0.0028836727142333984, "step": 2293} {"info/global_step": 2294, "train_info/time_within_train_step": 2.3538453578948975, "step": 2294} {"train_info/time_between_train_steps": 0.0028998851776123047, "step": 2294} {"info/global_step": 2295, "train_info/time_within_train_step": 2.3539202213287354, "step": 2295} {"train_info/time_between_train_steps": 0.0028960704803466797, "step": 2295} {"info/global_step": 2296, "train_info/time_within_train_step": 2.353433132171631, "step": 2296} {"train_info/time_between_train_steps": 0.0029163360595703125, "step": 2296} {"info/global_step": 2297, "train_info/time_within_train_step": 2.3536689281463623, "step": 2297} {"train_info/time_between_train_steps": 0.0029244422912597656, "step": 2297} {"info/global_step": 2298, "train_info/time_within_train_step": 2.353830099105835, "step": 2298} {"train_info/time_between_train_steps": 0.002933979034423828, "step": 2298} {"info/global_step": 2299, "train_info/time_within_train_step": 2.5570948123931885, "step": 2299} {"train_info/time_between_train_steps": 0.002871274948120117, "step": 2299} {"info/global_step": 2300, "train_info/time_within_train_step": 2.353471279144287, "step": 2300} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 8708.0, "train_info/memory_max_reserved": 8708.0, "_timestamp": 1746258111, "_runtime": 5930}, "step": 2300} {"logs": {"train/loss": 3.7985, "train/learning_rate": 0.00015555555555555554, "train/epoch": 2.19, "_timestamp": 1746258111, "_runtime": 5930}, "step": 2300} {"train_info/time_between_train_steps": 23.91586208343506, "step": 2300} {"info/global_step": 2301, "train_info/time_within_train_step": 2.2011735439300537, "step": 2301} {"train_info/time_between_train_steps": 0.0029418468475341797, "step": 2301} {"info/global_step": 2302, "train_info/time_within_train_step": 2.181056261062622, "step": 2302} {"train_info/time_between_train_steps": 0.002908468246459961, "step": 2302} {"info/global_step": 2303, "train_info/time_within_train_step": 2.1802818775177, "step": 2303} {"train_info/time_between_train_steps": 0.002919912338256836, "step": 2303} {"info/global_step": 2304, "train_info/time_within_train_step": 2.3092687129974365, "step": 2304} {"train_info/time_between_train_steps": 0.0029311180114746094, "step": 2304} {"info/global_step": 2305, "train_info/time_within_train_step": 2.348875045776367, "step": 2305} {"train_info/time_between_train_steps": 0.002907276153564453, "step": 2305} {"info/global_step": 2306, "train_info/time_within_train_step": 2.35200572013855, "step": 2306} {"train_info/time_between_train_steps": 0.0029096603393554688, "step": 2306} {"info/global_step": 2307, "train_info/time_within_train_step": 2.354952812194824, "step": 2307} {"train_info/time_between_train_steps": 0.0029015541076660156, "step": 2307} {"info/global_step": 2308, "train_info/time_within_train_step": 2.356034994125366, "step": 2308} {"train_info/time_between_train_steps": 0.0028917789459228516, "step": 2308} {"info/global_step": 2309, "train_info/time_within_train_step": 2.3554694652557373, "step": 2309} {"train_info/time_between_train_steps": 0.0029153823852539062, "step": 2309} {"info/global_step": 2310, "train_info/time_within_train_step": 2.3561322689056396, "step": 2310} {"train_info/time_between_train_steps": 0.0028917789459228516, "step": 2310} {"info/global_step": 2311, "train_info/time_within_train_step": 2.356473684310913, "step": 2311} {"train_info/time_between_train_steps": 0.002887248992919922, "step": 2311} {"info/global_step": 2312, "train_info/time_within_train_step": 2.3559584617614746, "step": 2312} {"train_info/time_between_train_steps": 0.0029070377349853516, "step": 2312} {"info/global_step": 2313, "train_info/time_within_train_step": 2.355480194091797, "step": 2313} {"train_info/time_between_train_steps": 0.0029036998748779297, "step": 2313} {"info/global_step": 2314, "train_info/time_within_train_step": 2.356877088546753, "step": 2314} {"train_info/time_between_train_steps": 0.0029420852661132812, "step": 2314} {"info/global_step": 2315, "train_info/time_within_train_step": 2.3557088375091553, "step": 2315} {"train_info/time_between_train_steps": 0.0029036998748779297, "step": 2315} {"info/global_step": 2316, "train_info/time_within_train_step": 2.3557980060577393, "step": 2316} {"train_info/time_between_train_steps": 0.0028870105743408203, "step": 2316} {"info/global_step": 2317, "train_info/time_within_train_step": 2.354968309402466, "step": 2317} {"train_info/time_between_train_steps": 0.0028824806213378906, "step": 2317} {"info/global_step": 2318, "train_info/time_within_train_step": 2.356668710708618, "step": 2318} {"train_info/time_between_train_steps": 0.002932310104370117, "step": 2318} {"info/global_step": 2319, "train_info/time_within_train_step": 2.3562450408935547, "step": 2319} {"train_info/time_between_train_steps": 0.002904176712036133, "step": 2319} {"info/global_step": 2320, "train_info/time_within_train_step": 2.3565917015075684, "step": 2320} {"train_info/time_between_train_steps": 0.0029375553131103516, "step": 2320} {"info/global_step": 2321, "train_info/time_within_train_step": 2.3555655479431152, "step": 2321} {"train_info/time_between_train_steps": 0.0029060840606689453, "step": 2321} {"info/global_step": 2322, "train_info/time_within_train_step": 2.355560064315796, "step": 2322} {"train_info/time_between_train_steps": 0.002896547317504883, "step": 2322} {"info/global_step": 2323, "train_info/time_within_train_step": 2.3553812503814697, "step": 2323} {"train_info/time_between_train_steps": 0.002885580062866211, "step": 2323} {"info/global_step": 2324, "train_info/time_within_train_step": 2.544447422027588, "step": 2324} {"train_info/time_between_train_steps": 0.002898693084716797, "step": 2324} {"info/global_step": 2325, "train_info/time_within_train_step": 2.3568813800811768, "step": 2325} {"train_info/time_between_train_steps": 0.0028994083404541016, "step": 2325} {"info/global_step": 2326, "train_info/time_within_train_step": 2.3550608158111572, "step": 2326} {"train_info/time_between_train_steps": 0.002930164337158203, "step": 2326} {"info/global_step": 2327, "train_info/time_within_train_step": 2.355407238006592, "step": 2327} {"train_info/time_between_train_steps": 0.0029044151306152344, "step": 2327} {"info/global_step": 2328, "train_info/time_within_train_step": 2.3545455932617188, "step": 2328} {"train_info/time_between_train_steps": 0.0029332637786865234, "step": 2328} {"info/global_step": 2329, "train_info/time_within_train_step": 2.3556325435638428, "step": 2329} {"train_info/time_between_train_steps": 0.0028662681579589844, "step": 2329} {"info/global_step": 2330, "train_info/time_within_train_step": 2.3556854724884033, "step": 2330} {"train_info/time_between_train_steps": 0.0028798580169677734, "step": 2330} {"info/global_step": 2331, "train_info/time_within_train_step": 2.3550665378570557, "step": 2331} {"train_info/time_between_train_steps": 0.0028967857360839844, "step": 2331} {"info/global_step": 2332, "train_info/time_within_train_step": 2.3541152477264404, "step": 2332} {"train_info/time_between_train_steps": 0.002897024154663086, "step": 2332} {"info/global_step": 2333, "train_info/time_within_train_step": 2.354203224182129, "step": 2333} {"train_info/time_between_train_steps": 0.002935647964477539, "step": 2333} {"info/global_step": 2334, "train_info/time_within_train_step": 2.354717969894409, "step": 2334} {"train_info/time_between_train_steps": 0.002964496612548828, "step": 2334} {"info/global_step": 2335, "train_info/time_within_train_step": 2.3565235137939453, "step": 2335} {"train_info/time_between_train_steps": 0.0029342174530029297, "step": 2335} {"info/global_step": 2336, "train_info/time_within_train_step": 2.3552308082580566, "step": 2336} {"train_info/time_between_train_steps": 0.002887248992919922, "step": 2336} {"info/global_step": 2337, "train_info/time_within_train_step": 2.3551385402679443, "step": 2337} {"train_info/time_between_train_steps": 0.002972841262817383, "step": 2337} {"info/global_step": 2338, "train_info/time_within_train_step": 2.354658603668213, "step": 2338} {"train_info/time_between_train_steps": 0.0029053688049316406, "step": 2338} {"info/global_step": 2339, "train_info/time_within_train_step": 2.3553848266601562, "step": 2339} {"train_info/time_between_train_steps": 0.0029058456420898438, "step": 2339} {"info/global_step": 2340, "train_info/time_within_train_step": 2.355198621749878, "step": 2340} {"train_info/time_between_train_steps": 0.002884387969970703, "step": 2340} {"info/global_step": 2341, "train_info/time_within_train_step": 2.355829954147339, "step": 2341} {"train_info/time_between_train_steps": 0.002933502197265625, "step": 2341} {"info/global_step": 2342, "train_info/time_within_train_step": 2.354642868041992, "step": 2342} {"train_info/time_between_train_steps": 0.002891063690185547, "step": 2342} {"info/global_step": 2343, "train_info/time_within_train_step": 2.3559768199920654, "step": 2343} {"train_info/time_between_train_steps": 0.0028858184814453125, "step": 2343} {"info/global_step": 2344, "train_info/time_within_train_step": 2.3560593128204346, "step": 2344} {"train_info/time_between_train_steps": 0.0028946399688720703, "step": 2344} {"info/global_step": 2345, "train_info/time_within_train_step": 2.354686975479126, "step": 2345} {"train_info/time_between_train_steps": 0.0028848648071289062, "step": 2345} {"info/global_step": 2346, "train_info/time_within_train_step": 2.355539083480835, "step": 2346} {"train_info/time_between_train_steps": 0.0029578208923339844, "step": 2346} {"info/global_step": 2347, "train_info/time_within_train_step": 2.356255292892456, "step": 2347} {"train_info/time_between_train_steps": 0.0029184818267822266, "step": 2347} {"info/global_step": 2348, "train_info/time_within_train_step": 2.3572592735290527, "step": 2348} {"train_info/time_between_train_steps": 0.002884387969970703, "step": 2348} {"info/global_step": 2349, "train_info/time_within_train_step": 2.53096604347229, "step": 2349} {"train_info/time_between_train_steps": 0.0028717517852783203, "step": 2349} {"info/global_step": 2350, "train_info/time_within_train_step": 2.354863405227661, "step": 2350} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 8708.0, "train_info/memory_max_reserved": 8708.0, "_timestamp": 1746258254, "_runtime": 6073}, "step": 2350} {"logs": {"train/loss": 3.7979, "train/learning_rate": 0.0001444444444444444, "train/epoch": 2.21, "_timestamp": 1746258254, "_runtime": 6073}, "step": 2350} {"train_info/time_between_train_steps": 0.023746013641357422, "step": 2350} {"info/global_step": 2351, "train_info/time_within_train_step": 2.354687452316284, "step": 2351} {"train_info/time_between_train_steps": 0.0029306411743164062, "step": 2351} {"info/global_step": 2352, "train_info/time_within_train_step": 2.355635404586792, "step": 2352} {"train_info/time_between_train_steps": 0.002918243408203125, "step": 2352} {"info/global_step": 2353, "train_info/time_within_train_step": 2.355523109436035, "step": 2353} {"train_info/time_between_train_steps": 0.0028989315032958984, "step": 2353} {"info/global_step": 2354, "train_info/time_within_train_step": 2.3558762073516846, "step": 2354} {"train_info/time_between_train_steps": 0.0028924942016601562, "step": 2354} {"info/global_step": 2355, "train_info/time_within_train_step": 2.3569109439849854, "step": 2355} {"train_info/time_between_train_steps": 0.0029010772705078125, "step": 2355} {"info/global_step": 2356, "train_info/time_within_train_step": 2.3561363220214844, "step": 2356} {"train_info/time_between_train_steps": 0.0029053688049316406, "step": 2356} {"info/global_step": 2357, "train_info/time_within_train_step": 2.3559958934783936, "step": 2357} {"train_info/time_between_train_steps": 0.002980947494506836, "step": 2357} {"info/global_step": 2358, "train_info/time_within_train_step": 2.354726552963257, "step": 2358} {"train_info/time_between_train_steps": 0.0029532909393310547, "step": 2358} {"info/global_step": 2359, "train_info/time_within_train_step": 2.3557887077331543, "step": 2359} {"train_info/time_between_train_steps": 0.0028944015502929688, "step": 2359} {"info/global_step": 2360, "train_info/time_within_train_step": 2.3553271293640137, "step": 2360} {"train_info/time_between_train_steps": 0.002930164337158203, "step": 2360} {"info/global_step": 2361, "train_info/time_within_train_step": 2.3545212745666504, "step": 2361} {"train_info/time_between_train_steps": 0.00289154052734375, "step": 2361} {"info/global_step": 2362, "train_info/time_within_train_step": 2.354684591293335, "step": 2362} {"train_info/time_between_train_steps": 0.0029354095458984375, "step": 2362} {"info/global_step": 2363, "train_info/time_within_train_step": 2.3544530868530273, "step": 2363} {"train_info/time_between_train_steps": 0.002899169921875, "step": 2363} {"info/global_step": 2364, "train_info/time_within_train_step": 2.3542840480804443, "step": 2364} {"train_info/time_between_train_steps": 0.0029451847076416016, "step": 2364} {"info/global_step": 2365, "train_info/time_within_train_step": 2.3548145294189453, "step": 2365} {"train_info/time_between_train_steps": 0.0029392242431640625, "step": 2365} {"info/global_step": 2366, "train_info/time_within_train_step": 2.356137990951538, "step": 2366} {"train_info/time_between_train_steps": 0.002872467041015625, "step": 2366} {"info/global_step": 2367, "train_info/time_within_train_step": 2.3560807704925537, "step": 2367} {"train_info/time_between_train_steps": 0.0029320716857910156, "step": 2367} {"info/global_step": 2368, "train_info/time_within_train_step": 2.355578660964966, "step": 2368} {"train_info/time_between_train_steps": 0.0028884410858154297, "step": 2368} {"info/global_step": 2369, "train_info/time_within_train_step": 2.3552494049072266, "step": 2369} {"train_info/time_between_train_steps": 0.0029489994049072266, "step": 2369} {"info/global_step": 2370, "train_info/time_within_train_step": 2.3551852703094482, "step": 2370} {"train_info/time_between_train_steps": 0.0028960704803466797, "step": 2370} {"info/global_step": 2371, "train_info/time_within_train_step": 2.355285882949829, "step": 2371} {"train_info/time_between_train_steps": 0.0029435157775878906, "step": 2371} {"info/global_step": 2372, "train_info/time_within_train_step": 2.355842351913452, "step": 2372} {"train_info/time_between_train_steps": 0.002896547317504883, "step": 2372} {"info/global_step": 2373, "train_info/time_within_train_step": 2.3545963764190674, "step": 2373} {"train_info/time_between_train_steps": 0.002902507781982422, "step": 2373} {"info/global_step": 2374, "train_info/time_within_train_step": 2.5161049365997314, "step": 2374} {"train_info/time_between_train_steps": 0.0029268264770507812, "step": 2374} {"info/global_step": 2375, "train_info/time_within_train_step": 2.3556175231933594, "step": 2375} {"train_info/time_between_train_steps": 0.0029129981994628906, "step": 2375} {"info/global_step": 2376, "train_info/time_within_train_step": 2.355973958969116, "step": 2376} {"train_info/time_between_train_steps": 0.0029075145721435547, "step": 2376} {"info/global_step": 2377, "train_info/time_within_train_step": 2.3557848930358887, "step": 2377} {"train_info/time_between_train_steps": 0.003135204315185547, "step": 2377} {"info/global_step": 2378, "train_info/time_within_train_step": 2.3555307388305664, "step": 2378} {"train_info/time_between_train_steps": 0.0029175281524658203, "step": 2378} {"info/global_step": 2379, "train_info/time_within_train_step": 2.3543503284454346, "step": 2379} {"train_info/time_between_train_steps": 0.0029070377349853516, "step": 2379} {"info/global_step": 2380, "train_info/time_within_train_step": 2.3555119037628174, "step": 2380} {"train_info/time_between_train_steps": 0.0028998851776123047, "step": 2380} {"info/global_step": 2381, "train_info/time_within_train_step": 2.355161190032959, "step": 2381} {"train_info/time_between_train_steps": 0.002916097640991211, "step": 2381} {"info/global_step": 2382, "train_info/time_within_train_step": 2.355077028274536, "step": 2382} {"train_info/time_between_train_steps": 0.0029571056365966797, "step": 2382} {"info/global_step": 2383, "train_info/time_within_train_step": 2.355441093444824, "step": 2383} {"train_info/time_between_train_steps": 0.0029015541076660156, "step": 2383} {"info/global_step": 2384, "train_info/time_within_train_step": 2.3555941581726074, "step": 2384} {"train_info/time_between_train_steps": 0.002889871597290039, "step": 2384} {"info/global_step": 2385, "train_info/time_within_train_step": 2.354644775390625, "step": 2385} {"train_info/time_between_train_steps": 0.002904176712036133, "step": 2385} {"info/global_step": 2386, "train_info/time_within_train_step": 2.3562042713165283, "step": 2386} {"train_info/time_between_train_steps": 0.002928018569946289, "step": 2386} {"info/global_step": 2387, "train_info/time_within_train_step": 2.35548734664917, "step": 2387} {"train_info/time_between_train_steps": 0.002888917922973633, "step": 2387} {"info/global_step": 2388, "train_info/time_within_train_step": 2.3548355102539062, "step": 2388} {"train_info/time_between_train_steps": 0.0029578208923339844, "step": 2388} {"info/global_step": 2389, "train_info/time_within_train_step": 2.353919506072998, "step": 2389} {"train_info/time_between_train_steps": 0.002901792526245117, "step": 2389} {"info/global_step": 2390, "train_info/time_within_train_step": 2.3544700145721436, "step": 2390} {"train_info/time_between_train_steps": 0.0029497146606445312, "step": 2390} {"info/global_step": 2391, "train_info/time_within_train_step": 2.35394549369812, "step": 2391} {"train_info/time_between_train_steps": 0.002899169921875, "step": 2391} {"info/global_step": 2392, "train_info/time_within_train_step": 2.3542983531951904, "step": 2392} {"train_info/time_between_train_steps": 0.0029387474060058594, "step": 2392} {"info/global_step": 2393, "train_info/time_within_train_step": 2.355253219604492, "step": 2393} {"train_info/time_between_train_steps": 0.002881288528442383, "step": 2393} {"info/global_step": 2394, "train_info/time_within_train_step": 2.3546340465545654, "step": 2394} {"train_info/time_between_train_steps": 0.0029006004333496094, "step": 2394} {"info/global_step": 2395, "train_info/time_within_train_step": 2.354306936264038, "step": 2395} {"train_info/time_between_train_steps": 0.0029327869415283203, "step": 2395} {"info/global_step": 2396, "train_info/time_within_train_step": 2.3554134368896484, "step": 2396} {"train_info/time_between_train_steps": 0.002923727035522461, "step": 2396} {"info/global_step": 2397, "train_info/time_within_train_step": 2.355874538421631, "step": 2397} {"train_info/time_between_train_steps": 0.002942800521850586, "step": 2397} {"info/global_step": 2398, "train_info/time_within_train_step": 2.5014126300811768, "step": 2398} {"train_info/time_between_train_steps": 0.002944469451904297, "step": 2398} {"info/global_step": 2399, "train_info/time_within_train_step": 2.3550150394439697, "step": 2399} {"train_info/time_between_train_steps": 0.002871274948120117, "step": 2399} {"info/global_step": 2400, "train_info/time_within_train_step": 2.3554694652557373, "step": 2400} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 8708.0, "train_info/memory_max_reserved": 8708.0, "_timestamp": 1746258373, "_runtime": 6192}, "step": 2400} {"logs": {"train/loss": 3.7792, "train/learning_rate": 0.0001333333333333333, "train/epoch": 2.23, "_timestamp": 1746258373, "_runtime": 6192}, "step": 2400} {"train_info/time_between_train_steps": 29.675501108169556, "step": 2400} {"info/global_step": 2401, "train_info/time_within_train_step": 2.1998531818389893, "step": 2401} {"train_info/time_between_train_steps": 0.0029494762420654297, "step": 2401} {"info/global_step": 2402, "train_info/time_within_train_step": 2.181077480316162, "step": 2402} {"train_info/time_between_train_steps": 0.002955198287963867, "step": 2402} {"info/global_step": 2403, "train_info/time_within_train_step": 2.1817123889923096, "step": 2403} {"train_info/time_between_train_steps": 0.0029137134552001953, "step": 2403} {"info/global_step": 2404, "train_info/time_within_train_step": 2.2732436656951904, "step": 2404} {"train_info/time_between_train_steps": 0.0029077529907226562, "step": 2404} {"info/global_step": 2405, "train_info/time_within_train_step": 2.3488478660583496, "step": 2405} {"train_info/time_between_train_steps": 0.0028924942016601562, "step": 2405} {"info/global_step": 2406, "train_info/time_within_train_step": 2.353173017501831, "step": 2406} {"train_info/time_between_train_steps": 0.0029647350311279297, "step": 2406} {"info/global_step": 2407, "train_info/time_within_train_step": 2.3552322387695312, "step": 2407} {"train_info/time_between_train_steps": 0.002926349639892578, "step": 2407} {"info/global_step": 2408, "train_info/time_within_train_step": 2.356147289276123, "step": 2408} {"train_info/time_between_train_steps": 0.002959728240966797, "step": 2408} {"info/global_step": 2409, "train_info/time_within_train_step": 2.356816291809082, "step": 2409} {"train_info/time_between_train_steps": 0.002883434295654297, "step": 2409} {"info/global_step": 2410, "train_info/time_within_train_step": 2.3564679622650146, "step": 2410} {"train_info/time_between_train_steps": 0.003161907196044922, "step": 2410} {"info/global_step": 2411, "train_info/time_within_train_step": 2.3553895950317383, "step": 2411} {"train_info/time_between_train_steps": 0.002901315689086914, "step": 2411} {"info/global_step": 2412, "train_info/time_within_train_step": 2.356386184692383, "step": 2412} {"train_info/time_between_train_steps": 0.0029120445251464844, "step": 2412} {"info/global_step": 2413, "train_info/time_within_train_step": 2.3562140464782715, "step": 2413} {"train_info/time_between_train_steps": 0.0029075145721435547, "step": 2413} {"info/global_step": 2414, "train_info/time_within_train_step": 2.3571712970733643, "step": 2414} {"train_info/time_between_train_steps": 0.0029053688049316406, "step": 2414} {"info/global_step": 2415, "train_info/time_within_train_step": 2.3567416667938232, "step": 2415} {"train_info/time_between_train_steps": 0.0028769969940185547, "step": 2415} {"info/global_step": 2416, "train_info/time_within_train_step": 2.356091260910034, "step": 2416} {"train_info/time_between_train_steps": 0.0028798580169677734, "step": 2416} {"info/global_step": 2417, "train_info/time_within_train_step": 2.3576104640960693, "step": 2417} {"train_info/time_between_train_steps": 0.0028810501098632812, "step": 2417} {"info/global_step": 2418, "train_info/time_within_train_step": 2.3561739921569824, "step": 2418} {"train_info/time_between_train_steps": 0.0028901100158691406, "step": 2418} {"info/global_step": 2419, "train_info/time_within_train_step": 2.3570237159729004, "step": 2419} {"train_info/time_between_train_steps": 0.002918720245361328, "step": 2419} {"info/global_step": 2420, "train_info/time_within_train_step": 2.3566267490386963, "step": 2420} {"train_info/time_between_train_steps": 0.002898693084716797, "step": 2420} {"info/global_step": 2421, "train_info/time_within_train_step": 2.356205940246582, "step": 2421} {"train_info/time_between_train_steps": 0.002901792526245117, "step": 2421} {"info/global_step": 2422, "train_info/time_within_train_step": 2.4560940265655518, "step": 2422} {"train_info/time_between_train_steps": 0.002916097640991211, "step": 2422} {"info/global_step": 2423, "train_info/time_within_train_step": 2.3555948734283447, "step": 2423} {"train_info/time_between_train_steps": 0.0028901100158691406, "step": 2423} {"info/global_step": 2424, "train_info/time_within_train_step": 2.3554892539978027, "step": 2424} {"train_info/time_between_train_steps": 0.0028955936431884766, "step": 2424} {"info/global_step": 2425, "train_info/time_within_train_step": 2.357032537460327, "step": 2425} {"train_info/time_between_train_steps": 0.002949953079223633, "step": 2425} {"info/global_step": 2426, "train_info/time_within_train_step": 2.3574752807617188, "step": 2426} {"train_info/time_between_train_steps": 0.0030176639556884766, "step": 2426} {"info/global_step": 2427, "train_info/time_within_train_step": 2.356626272201538, "step": 2427} {"train_info/time_between_train_steps": 0.002877950668334961, "step": 2427} {"info/global_step": 2428, "train_info/time_within_train_step": 2.3565049171447754, "step": 2428} {"train_info/time_between_train_steps": 0.0029151439666748047, "step": 2428} {"info/global_step": 2429, "train_info/time_within_train_step": 2.354979991912842, "step": 2429} {"train_info/time_between_train_steps": 0.0029299259185791016, "step": 2429} {"info/global_step": 2430, "train_info/time_within_train_step": 2.3559441566467285, "step": 2430} {"train_info/time_between_train_steps": 0.0029175281524658203, "step": 2430} {"info/global_step": 2431, "train_info/time_within_train_step": 2.356067419052124, "step": 2431} {"train_info/time_between_train_steps": 0.0029418468475341797, "step": 2431} {"info/global_step": 2432, "train_info/time_within_train_step": 2.3562090396881104, "step": 2432} {"train_info/time_between_train_steps": 0.002920389175415039, "step": 2432} {"info/global_step": 2433, "train_info/time_within_train_step": 2.3551037311553955, "step": 2433} {"train_info/time_between_train_steps": 0.0028874874114990234, "step": 2433} {"info/global_step": 2434, "train_info/time_within_train_step": 2.3561131954193115, "step": 2434} {"train_info/time_between_train_steps": 0.0029065608978271484, "step": 2434} {"info/global_step": 2435, "train_info/time_within_train_step": 2.3571763038635254, "step": 2435} {"train_info/time_between_train_steps": 0.002905130386352539, "step": 2435} {"info/global_step": 2436, "train_info/time_within_train_step": 2.356003522872925, "step": 2436} {"train_info/time_between_train_steps": 0.002915620803833008, "step": 2436} {"info/global_step": 2437, "train_info/time_within_train_step": 2.355879306793213, "step": 2437} {"train_info/time_between_train_steps": 0.0029304027557373047, "step": 2437} {"info/global_step": 2438, "train_info/time_within_train_step": 2.3564260005950928, "step": 2438} {"train_info/time_between_train_steps": 0.002965688705444336, "step": 2438} {"info/global_step": 2439, "train_info/time_within_train_step": 2.3556461334228516, "step": 2439} {"train_info/time_between_train_steps": 0.0029141902923583984, "step": 2439} {"info/global_step": 2440, "train_info/time_within_train_step": 2.356245994567871, "step": 2440} {"train_info/time_between_train_steps": 0.002936124801635742, "step": 2440} {"info/global_step": 2441, "train_info/time_within_train_step": 2.356372356414795, "step": 2441} {"train_info/time_between_train_steps": 0.002910137176513672, "step": 2441} {"info/global_step": 2442, "train_info/time_within_train_step": 2.3558101654052734, "step": 2442} {"train_info/time_between_train_steps": 0.0029125213623046875, "step": 2442} {"info/global_step": 2443, "train_info/time_within_train_step": 2.3555634021759033, "step": 2443} {"train_info/time_between_train_steps": 0.0028786659240722656, "step": 2443} {"info/global_step": 2444, "train_info/time_within_train_step": 2.3553919792175293, "step": 2444} {"train_info/time_between_train_steps": 0.002911806106567383, "step": 2444} {"info/global_step": 2445, "train_info/time_within_train_step": 2.3560633659362793, "step": 2445} {"train_info/time_between_train_steps": 0.0029096603393554688, "step": 2445} {"info/global_step": 2446, "train_info/time_within_train_step": 2.3557403087615967, "step": 2446} {"train_info/time_between_train_steps": 0.0029325485229492188, "step": 2446} {"info/global_step": 2447, "train_info/time_within_train_step": 2.4688515663146973, "step": 2447} {"train_info/time_between_train_steps": 0.0028901100158691406, "step": 2447} {"info/global_step": 2448, "train_info/time_within_train_step": 2.3555545806884766, "step": 2448} {"train_info/time_between_train_steps": 0.0030813217163085938, "step": 2448} {"info/global_step": 2449, "train_info/time_within_train_step": 2.355560302734375, "step": 2449} {"train_info/time_between_train_steps": 0.002945423126220703, "step": 2449} {"info/global_step": 2450, "train_info/time_within_train_step": 2.3558101654052734, "step": 2450} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 8708.0, "train_info/memory_max_reserved": 8708.0, "_timestamp": 1746258521, "_runtime": 6340}, "step": 2450} {"logs": {"train/loss": 3.7544, "train/learning_rate": 0.00012222222222222221, "train/epoch": 2.24, "_timestamp": 1746258521, "_runtime": 6340}, "step": 2450} {"train_info/time_between_train_steps": 0.024584531784057617, "step": 2450} {"info/global_step": 2451, "train_info/time_within_train_step": 2.3561906814575195, "step": 2451} {"train_info/time_between_train_steps": 0.002901792526245117, "step": 2451} {"info/global_step": 2452, "train_info/time_within_train_step": 2.355600118637085, "step": 2452} {"train_info/time_between_train_steps": 0.0028886795043945312, "step": 2452} {"info/global_step": 2453, "train_info/time_within_train_step": 2.3547518253326416, "step": 2453} {"train_info/time_between_train_steps": 0.002906322479248047, "step": 2453} {"info/global_step": 2454, "train_info/time_within_train_step": 2.3555045127868652, "step": 2454} {"train_info/time_between_train_steps": 0.002874612808227539, "step": 2454} {"info/global_step": 2455, "train_info/time_within_train_step": 2.3557839393615723, "step": 2455} {"train_info/time_between_train_steps": 0.0029277801513671875, "step": 2455} {"info/global_step": 2456, "train_info/time_within_train_step": 2.354579210281372, "step": 2456} {"train_info/time_between_train_steps": 0.0029294490814208984, "step": 2456} {"info/global_step": 2457, "train_info/time_within_train_step": 2.356196165084839, "step": 2457} {"train_info/time_between_train_steps": 0.0029065608978271484, "step": 2457} {"info/global_step": 2458, "train_info/time_within_train_step": 2.3554115295410156, "step": 2458} {"train_info/time_between_train_steps": 0.0028929710388183594, "step": 2458} {"info/global_step": 2459, "train_info/time_within_train_step": 2.356736660003662, "step": 2459} {"train_info/time_between_train_steps": 0.0029299259185791016, "step": 2459} {"info/global_step": 2460, "train_info/time_within_train_step": 2.355954647064209, "step": 2460} {"train_info/time_between_train_steps": 0.00287628173828125, "step": 2460} {"info/global_step": 2461, "train_info/time_within_train_step": 2.3542990684509277, "step": 2461} {"train_info/time_between_train_steps": 0.0029108524322509766, "step": 2461} {"info/global_step": 2462, "train_info/time_within_train_step": 2.3558945655822754, "step": 2462} {"train_info/time_between_train_steps": 0.002878904342651367, "step": 2462} {"info/global_step": 2463, "train_info/time_within_train_step": 2.3559257984161377, "step": 2463} {"train_info/time_between_train_steps": 0.0029382705688476562, "step": 2463} {"info/global_step": 2464, "train_info/time_within_train_step": 2.3565521240234375, "step": 2464} {"train_info/time_between_train_steps": 0.002939939498901367, "step": 2464} {"info/global_step": 2465, "train_info/time_within_train_step": 2.3554766178131104, "step": 2465} {"train_info/time_between_train_steps": 0.0028810501098632812, "step": 2465} {"info/global_step": 2466, "train_info/time_within_train_step": 2.355708599090576, "step": 2466} {"train_info/time_between_train_steps": 0.0028984546661376953, "step": 2466} {"info/global_step": 2467, "train_info/time_within_train_step": 2.356902599334717, "step": 2467} {"train_info/time_between_train_steps": 0.0028977394104003906, "step": 2467} {"info/global_step": 2468, "train_info/time_within_train_step": 2.355775833129883, "step": 2468} {"train_info/time_between_train_steps": 0.002877950668334961, "step": 2468} {"info/global_step": 2469, "train_info/time_within_train_step": 2.3555660247802734, "step": 2469} {"train_info/time_between_train_steps": 0.0028803348541259766, "step": 2469} {"info/global_step": 2470, "train_info/time_within_train_step": 2.4260451793670654, "step": 2470} {"train_info/time_between_train_steps": 0.0029447078704833984, "step": 2470} {"info/global_step": 2471, "train_info/time_within_train_step": 2.3566107749938965, "step": 2471} {"train_info/time_between_train_steps": 0.0028874874114990234, "step": 2471} {"info/global_step": 2472, "train_info/time_within_train_step": 2.355509042739868, "step": 2472} {"train_info/time_between_train_steps": 0.002941131591796875, "step": 2472} {"info/global_step": 2473, "train_info/time_within_train_step": 2.3551578521728516, "step": 2473} {"train_info/time_between_train_steps": 0.002880096435546875, "step": 2473} {"info/global_step": 2474, "train_info/time_within_train_step": 2.3547523021698, "step": 2474} {"train_info/time_between_train_steps": 0.002861499786376953, "step": 2474} {"info/global_step": 2475, "train_info/time_within_train_step": 2.356724977493286, "step": 2475} {"train_info/time_between_train_steps": 0.0029006004333496094, "step": 2475} {"info/global_step": 2476, "train_info/time_within_train_step": 2.3564672470092773, "step": 2476} {"train_info/time_between_train_steps": 0.0028858184814453125, "step": 2476} {"info/global_step": 2477, "train_info/time_within_train_step": 2.3563930988311768, "step": 2477} {"train_info/time_between_train_steps": 0.0028884410858154297, "step": 2477} {"info/global_step": 2478, "train_info/time_within_train_step": 2.3561418056488037, "step": 2478} {"train_info/time_between_train_steps": 0.002931833267211914, "step": 2478} {"info/global_step": 2479, "train_info/time_within_train_step": 2.355069398880005, "step": 2479} {"train_info/time_between_train_steps": 0.002876758575439453, "step": 2479} {"info/global_step": 2480, "train_info/time_within_train_step": 2.3560354709625244, "step": 2480} {"train_info/time_between_train_steps": 0.0031309127807617188, "step": 2480} {"info/global_step": 2481, "train_info/time_within_train_step": 2.3549246788024902, "step": 2481} {"train_info/time_between_train_steps": 0.002875804901123047, "step": 2481} {"info/global_step": 2482, "train_info/time_within_train_step": 2.3556315898895264, "step": 2482} {"train_info/time_between_train_steps": 0.0029108524322509766, "step": 2482} {"info/global_step": 2483, "train_info/time_within_train_step": 2.356231927871704, "step": 2483} {"train_info/time_between_train_steps": 0.0029332637786865234, "step": 2483} {"info/global_step": 2484, "train_info/time_within_train_step": 2.3563785552978516, "step": 2484} {"train_info/time_between_train_steps": 0.0028967857360839844, "step": 2484} {"info/global_step": 2485, "train_info/time_within_train_step": 2.3548953533172607, "step": 2485} {"train_info/time_between_train_steps": 0.0029337406158447266, "step": 2485} {"info/global_step": 2486, "train_info/time_within_train_step": 2.3556160926818848, "step": 2486} {"train_info/time_between_train_steps": 0.002885580062866211, "step": 2486} {"info/global_step": 2487, "train_info/time_within_train_step": 2.3551809787750244, "step": 2487} {"train_info/time_between_train_steps": 0.0029006004333496094, "step": 2487} {"info/global_step": 2488, "train_info/time_within_train_step": 2.355210781097412, "step": 2488} {"train_info/time_between_train_steps": 0.00290679931640625, "step": 2488} {"info/global_step": 2489, "train_info/time_within_train_step": 2.3553977012634277, "step": 2489} {"train_info/time_between_train_steps": 0.002941608428955078, "step": 2489} {"info/global_step": 2490, "train_info/time_within_train_step": 2.355475425720215, "step": 2490} {"train_info/time_between_train_steps": 0.0028870105743408203, "step": 2490} {"info/global_step": 2491, "train_info/time_within_train_step": 2.3558619022369385, "step": 2491} {"train_info/time_between_train_steps": 0.002900362014770508, "step": 2491} {"info/global_step": 2492, "train_info/time_within_train_step": 2.3559341430664062, "step": 2492} {"train_info/time_between_train_steps": 0.002899646759033203, "step": 2492} {"info/global_step": 2493, "train_info/time_within_train_step": 2.355835437774658, "step": 2493} {"train_info/time_between_train_steps": 0.002930879592895508, "step": 2493} {"info/global_step": 2494, "train_info/time_within_train_step": 2.413334608078003, "step": 2494} {"train_info/time_between_train_steps": 0.002882719039916992, "step": 2494} {"info/global_step": 2495, "train_info/time_within_train_step": 2.3546388149261475, "step": 2495} {"train_info/time_between_train_steps": 0.002931356430053711, "step": 2495} {"info/global_step": 2496, "train_info/time_within_train_step": 2.354703187942505, "step": 2496} {"train_info/time_between_train_steps": 0.0029082298278808594, "step": 2496} {"info/global_step": 2497, "train_info/time_within_train_step": 2.3552544116973877, "step": 2497} {"train_info/time_between_train_steps": 0.0029065608978271484, "step": 2497} {"info/global_step": 2498, "train_info/time_within_train_step": 2.3539681434631348, "step": 2498} {"train_info/time_between_train_steps": 0.002882242202758789, "step": 2498} {"info/global_step": 2499, "train_info/time_within_train_step": 2.911245346069336, "step": 2499} {"train_info/time_between_train_steps": 0.0029506683349609375, "step": 2499} {"info/global_step": 2500, "train_info/time_within_train_step": 2.3561413288116455, "step": 2500} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 8708.0, "train_info/memory_max_reserved": 8708.0, "_timestamp": 1746258641, "_runtime": 6460}, "step": 2500} {"logs": {"train/loss": 3.7501, "train/learning_rate": 0.00011111111111111109, "train/epoch": 2.26, "_timestamp": 1746258641, "_runtime": 6460}, "step": 2500} {"train_info/time_between_train_steps": 15.285306215286255, "step": 2500} {"info/global_step": 2501, "train_info/time_within_train_step": 2.196168899536133, "step": 2501} {"train_info/time_between_train_steps": 0.002875804901123047, "step": 2501} {"info/global_step": 2502, "train_info/time_within_train_step": 2.1812210083007812, "step": 2502} {"train_info/time_between_train_steps": 0.002893209457397461, "step": 2502} {"info/global_step": 2503, "train_info/time_within_train_step": 2.267653703689575, "step": 2503} {"train_info/time_between_train_steps": 0.002889871597290039, "step": 2503} {"info/global_step": 2504, "train_info/time_within_train_step": 2.3467509746551514, "step": 2504} {"train_info/time_between_train_steps": 0.002930164337158203, "step": 2504} {"info/global_step": 2505, "train_info/time_within_train_step": 2.350531578063965, "step": 2505} {"train_info/time_between_train_steps": 0.002888917922973633, "step": 2505} {"info/global_step": 2506, "train_info/time_within_train_step": 2.3522064685821533, "step": 2506} {"train_info/time_between_train_steps": 0.002893209457397461, "step": 2506} {"info/global_step": 2507, "train_info/time_within_train_step": 2.3538782596588135, "step": 2507} {"train_info/time_between_train_steps": 0.0028839111328125, "step": 2507} {"info/global_step": 2508, "train_info/time_within_train_step": 2.354264259338379, "step": 2508} {"train_info/time_between_train_steps": 0.002869844436645508, "step": 2508} {"info/global_step": 2509, "train_info/time_within_train_step": 2.354949474334717, "step": 2509} {"train_info/time_between_train_steps": 0.002874135971069336, "step": 2509} {"info/global_step": 2510, "train_info/time_within_train_step": 2.355473756790161, "step": 2510} {"train_info/time_between_train_steps": 0.0028693675994873047, "step": 2510} {"info/global_step": 2511, "train_info/time_within_train_step": 2.359675884246826, "step": 2511} {"train_info/time_between_train_steps": 0.0029036998748779297, "step": 2511} {"info/global_step": 2512, "train_info/time_within_train_step": 2.3549745082855225, "step": 2512} {"train_info/time_between_train_steps": 0.002975940704345703, "step": 2512} {"info/global_step": 2513, "train_info/time_within_train_step": 2.355877161026001, "step": 2513} {"train_info/time_between_train_steps": 0.0028862953186035156, "step": 2513} {"info/global_step": 2514, "train_info/time_within_train_step": 2.355368137359619, "step": 2514} {"train_info/time_between_train_steps": 0.0029134750366210938, "step": 2514} {"info/global_step": 2515, "train_info/time_within_train_step": 2.3560900688171387, "step": 2515} {"train_info/time_between_train_steps": 0.002866983413696289, "step": 2515} {"info/global_step": 2516, "train_info/time_within_train_step": 2.355264663696289, "step": 2516} {"train_info/time_between_train_steps": 0.0028777122497558594, "step": 2516} {"info/global_step": 2517, "train_info/time_within_train_step": 2.3963139057159424, "step": 2517} {"train_info/time_between_train_steps": 0.0029103755950927734, "step": 2517} {"info/global_step": 2518, "train_info/time_within_train_step": 2.356224298477173, "step": 2518} {"train_info/time_between_train_steps": 0.002895355224609375, "step": 2518} {"info/global_step": 2519, "train_info/time_within_train_step": 2.354691743850708, "step": 2519} {"train_info/time_between_train_steps": 0.002888917922973633, "step": 2519} {"info/global_step": 2520, "train_info/time_within_train_step": 2.3563649654388428, "step": 2520} {"train_info/time_between_train_steps": 0.002879619598388672, "step": 2520} {"info/global_step": 2521, "train_info/time_within_train_step": 2.3553848266601562, "step": 2521} {"train_info/time_between_train_steps": 0.0029244422912597656, "step": 2521} {"info/global_step": 2522, "train_info/time_within_train_step": 2.3539326190948486, "step": 2522} {"train_info/time_between_train_steps": 0.002904176712036133, "step": 2522} {"info/global_step": 2523, "train_info/time_within_train_step": 2.354841947555542, "step": 2523} {"train_info/time_between_train_steps": 0.0028955936431884766, "step": 2523} {"info/global_step": 2524, "train_info/time_within_train_step": 2.3558156490325928, "step": 2524} {"train_info/time_between_train_steps": 0.0028810501098632812, "step": 2524} {"info/global_step": 2525, "train_info/time_within_train_step": 2.356151819229126, "step": 2525} {"train_info/time_between_train_steps": 0.0028951168060302734, "step": 2525} {"info/global_step": 2526, "train_info/time_within_train_step": 2.356658697128296, "step": 2526} {"train_info/time_between_train_steps": 0.0029087066650390625, "step": 2526} {"info/global_step": 2527, "train_info/time_within_train_step": 2.355499267578125, "step": 2527} {"train_info/time_between_train_steps": 0.0029442310333251953, "step": 2527} {"info/global_step": 2528, "train_info/time_within_train_step": 2.356091260910034, "step": 2528} {"train_info/time_between_train_steps": 0.002889394760131836, "step": 2528} {"info/global_step": 2529, "train_info/time_within_train_step": 2.3540539741516113, "step": 2529} {"train_info/time_between_train_steps": 0.002886056900024414, "step": 2529} {"info/global_step": 2530, "train_info/time_within_train_step": 2.3551793098449707, "step": 2530} {"train_info/time_between_train_steps": 0.0029535293579101562, "step": 2530} {"info/global_step": 2531, "train_info/time_within_train_step": 2.354491710662842, "step": 2531} {"train_info/time_between_train_steps": 0.0029058456420898438, "step": 2531} {"info/global_step": 2532, "train_info/time_within_train_step": 2.3558623790740967, "step": 2532} {"train_info/time_between_train_steps": 0.0028896331787109375, "step": 2532} {"info/global_step": 2533, "train_info/time_within_train_step": 2.354429006576538, "step": 2533} {"train_info/time_between_train_steps": 0.002891063690185547, "step": 2533} {"info/global_step": 2534, "train_info/time_within_train_step": 2.355792760848999, "step": 2534} {"train_info/time_between_train_steps": 0.0029070377349853516, "step": 2534} {"info/global_step": 2535, "train_info/time_within_train_step": 2.3553683757781982, "step": 2535} {"train_info/time_between_train_steps": 0.0028536319732666016, "step": 2535} {"info/global_step": 2536, "train_info/time_within_train_step": 2.355556011199951, "step": 2536} {"train_info/time_between_train_steps": 0.0029315948486328125, "step": 2536} {"info/global_step": 2537, "train_info/time_within_train_step": 2.3554234504699707, "step": 2537} {"train_info/time_between_train_steps": 0.0029511451721191406, "step": 2537} {"info/global_step": 2538, "train_info/time_within_train_step": 2.355164051055908, "step": 2538} {"train_info/time_between_train_steps": 0.0029854774475097656, "step": 2538} {"info/global_step": 2539, "train_info/time_within_train_step": 2.355642318725586, "step": 2539} {"train_info/time_between_train_steps": 0.002954244613647461, "step": 2539} {"info/global_step": 2540, "train_info/time_within_train_step": 2.355679512023926, "step": 2540} {"train_info/time_between_train_steps": 0.0028998851776123047, "step": 2540} {"info/global_step": 2541, "train_info/time_within_train_step": 2.4117021560668945, "step": 2541} {"train_info/time_between_train_steps": 0.0029592514038085938, "step": 2541} {"info/global_step": 2542, "train_info/time_within_train_step": 2.355182647705078, "step": 2542} {"train_info/time_between_train_steps": 0.002946138381958008, "step": 2542} {"info/global_step": 2543, "train_info/time_within_train_step": 2.356494426727295, "step": 2543} {"train_info/time_between_train_steps": 0.002943754196166992, "step": 2543} {"info/global_step": 2544, "train_info/time_within_train_step": 2.3561480045318604, "step": 2544} {"train_info/time_between_train_steps": 0.002931356430053711, "step": 2544} {"info/global_step": 2545, "train_info/time_within_train_step": 2.3557639122009277, "step": 2545} {"train_info/time_between_train_steps": 0.002965688705444336, "step": 2545} {"info/global_step": 2546, "train_info/time_within_train_step": 2.3563525676727295, "step": 2546} {"train_info/time_between_train_steps": 0.002909421920776367, "step": 2546} {"info/global_step": 2547, "train_info/time_within_train_step": 2.355886697769165, "step": 2547} {"train_info/time_between_train_steps": 0.002926349639892578, "step": 2547} {"info/global_step": 2548, "train_info/time_within_train_step": 2.355600595474243, "step": 2548} {"train_info/time_between_train_steps": 0.0029664039611816406, "step": 2548} {"info/global_step": 2549, "train_info/time_within_train_step": 2.3550572395324707, "step": 2549} {"train_info/time_between_train_steps": 0.002990245819091797, "step": 2549} {"info/global_step": 2550, "train_info/time_within_train_step": 2.354841709136963, "step": 2550} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 8708.0, "train_info/memory_max_reserved": 8708.0, "_timestamp": 1746258775, "_runtime": 6594}, "step": 2550} {"logs": {"train/loss": 3.7408, "train/learning_rate": 9.999999999999999e-05, "train/epoch": 2.28, "_timestamp": 1746258775, "_runtime": 6594}, "step": 2550} {"train_info/time_between_train_steps": 0.024853944778442383, "step": 2550} {"info/global_step": 2551, "train_info/time_within_train_step": 2.3555567264556885, "step": 2551} {"train_info/time_between_train_steps": 0.003023386001586914, "step": 2551} {"info/global_step": 2552, "train_info/time_within_train_step": 2.3548665046691895, "step": 2552} {"train_info/time_between_train_steps": 0.002912282943725586, "step": 2552} {"info/global_step": 2553, "train_info/time_within_train_step": 2.354283094406128, "step": 2553} {"train_info/time_between_train_steps": 0.00298309326171875, "step": 2553} {"info/global_step": 2554, "train_info/time_within_train_step": 2.355543851852417, "step": 2554} {"train_info/time_between_train_steps": 0.0029418468475341797, "step": 2554} {"info/global_step": 2555, "train_info/time_within_train_step": 2.355625867843628, "step": 2555} {"train_info/time_between_train_steps": 0.0030498504638671875, "step": 2555} {"info/global_step": 2556, "train_info/time_within_train_step": 2.3551833629608154, "step": 2556} {"train_info/time_between_train_steps": 0.003064393997192383, "step": 2556} {"info/global_step": 2557, "train_info/time_within_train_step": 2.355386734008789, "step": 2557} {"train_info/time_between_train_steps": 0.0030515193939208984, "step": 2557} {"info/global_step": 2558, "train_info/time_within_train_step": 2.3558695316314697, "step": 2558} {"train_info/time_between_train_steps": 0.0031261444091796875, "step": 2558} {"info/global_step": 2559, "train_info/time_within_train_step": 2.3557493686676025, "step": 2559} {"train_info/time_between_train_steps": 0.0032167434692382812, "step": 2559} {"info/global_step": 2560, "train_info/time_within_train_step": 2.3558144569396973, "step": 2560} {"train_info/time_between_train_steps": 0.0030176639556884766, "step": 2560} {"info/global_step": 2561, "train_info/time_within_train_step": 2.3550424575805664, "step": 2561} {"train_info/time_between_train_steps": 0.00304412841796875, "step": 2561} {"info/global_step": 2562, "train_info/time_within_train_step": 2.355907440185547, "step": 2562} {"train_info/time_between_train_steps": 0.002975940704345703, "step": 2562} {"info/global_step": 2563, "train_info/time_within_train_step": 2.356052875518799, "step": 2563} {"train_info/time_between_train_steps": 0.0031282901763916016, "step": 2563} {"info/global_step": 2564, "train_info/time_within_train_step": 2.396463394165039, "step": 2564} {"train_info/time_between_train_steps": 0.003171205520629883, "step": 2564} {"info/global_step": 2565, "train_info/time_within_train_step": 2.3552467823028564, "step": 2565} {"train_info/time_between_train_steps": 0.003113269805908203, "step": 2565} {"info/global_step": 2566, "train_info/time_within_train_step": 2.354949712753296, "step": 2566} {"train_info/time_between_train_steps": 0.003080129623413086, "step": 2566} {"info/global_step": 2567, "train_info/time_within_train_step": 2.356886625289917, "step": 2567} {"train_info/time_between_train_steps": 0.003228902816772461, "step": 2567} {"info/global_step": 2568, "train_info/time_within_train_step": 2.3552398681640625, "step": 2568} {"train_info/time_between_train_steps": 0.003116607666015625, "step": 2568} {"info/global_step": 2569, "train_info/time_within_train_step": 2.355895757675171, "step": 2569} {"train_info/time_between_train_steps": 0.0031280517578125, "step": 2569} {"info/global_step": 2570, "train_info/time_within_train_step": 2.3548924922943115, "step": 2570} {"train_info/time_between_train_steps": 0.0031337738037109375, "step": 2570} {"info/global_step": 2571, "train_info/time_within_train_step": 2.354482650756836, "step": 2571} {"train_info/time_between_train_steps": 0.003232717514038086, "step": 2571} {"info/global_step": 2572, "train_info/time_within_train_step": 2.355471134185791, "step": 2572} {"train_info/time_between_train_steps": 0.003301382064819336, "step": 2572} {"info/global_step": 2573, "train_info/time_within_train_step": 2.3550832271575928, "step": 2573} {"train_info/time_between_train_steps": 0.0034639835357666016, "step": 2573} {"info/global_step": 2574, "train_info/time_within_train_step": 2.357118606567383, "step": 2574} {"train_info/time_between_train_steps": 0.003148317337036133, "step": 2574} {"info/global_step": 2575, "train_info/time_within_train_step": 2.356614351272583, "step": 2575} {"train_info/time_between_train_steps": 0.003336668014526367, "step": 2575} {"info/global_step": 2576, "train_info/time_within_train_step": 2.3564562797546387, "step": 2576} {"train_info/time_between_train_steps": 0.0034513473510742188, "step": 2576} {"info/global_step": 2577, "train_info/time_within_train_step": 2.356619358062744, "step": 2577} {"train_info/time_between_train_steps": 0.003681182861328125, "step": 2577} {"info/global_step": 2578, "train_info/time_within_train_step": 2.357154130935669, "step": 2578} {"train_info/time_between_train_steps": 0.0035500526428222656, "step": 2578} {"info/global_step": 2579, "train_info/time_within_train_step": 2.356318712234497, "step": 2579} {"train_info/time_between_train_steps": 0.0036995410919189453, "step": 2579} {"info/global_step": 2580, "train_info/time_within_train_step": 2.3561766147613525, "step": 2580} {"train_info/time_between_train_steps": 0.0036880970001220703, "step": 2580} {"train_info/time_between_train_steps": 2.692291736602783, "step": 2580} {"info/global_step": 2581, "train_info/time_within_train_step": 2.352452039718628, "step": 2581} {"train_info/time_between_train_steps": 0.003156900405883789, "step": 2581} {"info/global_step": 2582, "train_info/time_within_train_step": 2.3546035289764404, "step": 2582} {"train_info/time_between_train_steps": 0.0031511783599853516, "step": 2582} {"info/global_step": 2583, "train_info/time_within_train_step": 2.355271816253662, "step": 2583} {"train_info/time_between_train_steps": 0.0031023025512695312, "step": 2583} {"info/global_step": 2584, "train_info/time_within_train_step": 2.3552963733673096, "step": 2584} {"train_info/time_between_train_steps": 0.0031409263610839844, "step": 2584} {"info/global_step": 2585, "train_info/time_within_train_step": 2.353790521621704, "step": 2585} {"train_info/time_between_train_steps": 0.0031545162200927734, "step": 2585} {"info/global_step": 2586, "train_info/time_within_train_step": 2.354152202606201, "step": 2586} {"train_info/time_between_train_steps": 0.0031824111938476562, "step": 2586} {"info/global_step": 2587, "train_info/time_within_train_step": 2.35461163520813, "step": 2587} {"train_info/time_between_train_steps": 0.00311279296875, "step": 2587} {"info/global_step": 2588, "train_info/time_within_train_step": 2.3555850982666016, "step": 2588} {"train_info/time_between_train_steps": 0.0031507015228271484, "step": 2588} {"info/global_step": 2589, "train_info/time_within_train_step": 2.354426383972168, "step": 2589} {"train_info/time_between_train_steps": 0.0030951499938964844, "step": 2589} {"info/global_step": 2590, "train_info/time_within_train_step": 2.3553307056427, "step": 2590} {"train_info/time_between_train_steps": 0.003178119659423828, "step": 2590} {"info/global_step": 2591, "train_info/time_within_train_step": 2.356362819671631, "step": 2591} {"train_info/time_between_train_steps": 0.0031273365020751953, "step": 2591} {"info/global_step": 2592, "train_info/time_within_train_step": 2.354349136352539, "step": 2592} {"train_info/time_between_train_steps": 0.003173351287841797, "step": 2592} {"info/global_step": 2593, "train_info/time_within_train_step": 2.3548061847686768, "step": 2593} {"train_info/time_between_train_steps": 0.0032470226287841797, "step": 2593} {"info/global_step": 2594, "train_info/time_within_train_step": 2.354537010192871, "step": 2594} {"train_info/time_between_train_steps": 0.0031392574310302734, "step": 2594} {"info/global_step": 2595, "train_info/time_within_train_step": 2.5535941123962402, "step": 2595} {"train_info/time_between_train_steps": 0.0031766891479492188, "step": 2595} {"info/global_step": 2596, "train_info/time_within_train_step": 2.356550455093384, "step": 2596} {"train_info/time_between_train_steps": 0.003113985061645508, "step": 2596} {"info/global_step": 2597, "train_info/time_within_train_step": 2.3548977375030518, "step": 2597} {"train_info/time_between_train_steps": 0.003138303756713867, "step": 2597} {"info/global_step": 2598, "train_info/time_within_train_step": 2.3561458587646484, "step": 2598} {"train_info/time_between_train_steps": 0.003167867660522461, "step": 2598} {"info/global_step": 2599, "train_info/time_within_train_step": 2.3565714359283447, "step": 2599} {"train_info/time_between_train_steps": 0.003148794174194336, "step": 2599} {"info/global_step": 2600, "train_info/time_within_train_step": 2.3551366329193115, "step": 2600} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 8708.0, "train_info/memory_max_reserved": 8708.0, "_timestamp": 1746258897, "_runtime": 6716}, "step": 2600} {"logs": {"train/loss": 3.7642, "train/learning_rate": 8.888888888888888e-05, "train/epoch": 3.01, "_timestamp": 1746258897, "_runtime": 6716}, "step": 2600} {"train_info/time_between_train_steps": 14.144765377044678, "step": 2600} {"info/global_step": 2601, "train_info/time_within_train_step": 2.1962392330169678, "step": 2601} {"train_info/time_between_train_steps": 0.003127574920654297, "step": 2601} {"info/global_step": 2602, "train_info/time_within_train_step": 2.182636260986328, "step": 2602} {"train_info/time_between_train_steps": 0.0031270980834960938, "step": 2602} {"info/global_step": 2603, "train_info/time_within_train_step": 2.279914140701294, "step": 2603} {"train_info/time_between_train_steps": 0.003133058547973633, "step": 2603} {"info/global_step": 2604, "train_info/time_within_train_step": 2.350792169570923, "step": 2604} {"train_info/time_between_train_steps": 0.003114938735961914, "step": 2604} {"info/global_step": 2605, "train_info/time_within_train_step": 2.4264328479766846, "step": 2605} {"train_info/time_between_train_steps": 0.0031185150146484375, "step": 2605} {"info/global_step": 2606, "train_info/time_within_train_step": 2.355628728866577, "step": 2606} {"train_info/time_between_train_steps": 0.003186464309692383, "step": 2606} {"info/global_step": 2607, "train_info/time_within_train_step": 2.3553972244262695, "step": 2607} {"train_info/time_between_train_steps": 0.0031654834747314453, "step": 2607} {"info/global_step": 2608, "train_info/time_within_train_step": 2.355787992477417, "step": 2608} {"train_info/time_between_train_steps": 0.0031163692474365234, "step": 2608} {"info/global_step": 2609, "train_info/time_within_train_step": 2.3568661212921143, "step": 2609} {"train_info/time_between_train_steps": 0.0031418800354003906, "step": 2609} {"info/global_step": 2610, "train_info/time_within_train_step": 2.35504412651062, "step": 2610} {"train_info/time_between_train_steps": 0.0031821727752685547, "step": 2610} {"info/global_step": 2611, "train_info/time_within_train_step": 2.3560447692871094, "step": 2611} {"train_info/time_between_train_steps": 0.0031118392944335938, "step": 2611} {"info/global_step": 2612, "train_info/time_within_train_step": 2.3553831577301025, "step": 2612} {"train_info/time_between_train_steps": 0.003113985061645508, "step": 2612} {"info/global_step": 2613, "train_info/time_within_train_step": 2.356336832046509, "step": 2613} {"train_info/time_between_train_steps": 0.0031256675720214844, "step": 2613} {"info/global_step": 2614, "train_info/time_within_train_step": 2.355647563934326, "step": 2614} {"train_info/time_between_train_steps": 0.0031409263610839844, "step": 2614} {"info/global_step": 2615, "train_info/time_within_train_step": 2.356332540512085, "step": 2615} {"train_info/time_between_train_steps": 0.003135204315185547, "step": 2615} {"info/global_step": 2616, "train_info/time_within_train_step": 2.356816291809082, "step": 2616} {"train_info/time_between_train_steps": 0.003162384033203125, "step": 2616} {"info/global_step": 2617, "train_info/time_within_train_step": 2.356842517852783, "step": 2617} {"train_info/time_between_train_steps": 0.003121614456176758, "step": 2617} {"info/global_step": 2618, "train_info/time_within_train_step": 2.357023000717163, "step": 2618} {"train_info/time_between_train_steps": 0.003119230270385742, "step": 2618} {"info/global_step": 2619, "train_info/time_within_train_step": 2.5569045543670654, "step": 2619} {"train_info/time_between_train_steps": 0.003185272216796875, "step": 2619} {"info/global_step": 2620, "train_info/time_within_train_step": 2.3564493656158447, "step": 2620} {"train_info/time_between_train_steps": 0.0031456947326660156, "step": 2620} {"info/global_step": 2621, "train_info/time_within_train_step": 2.3564510345458984, "step": 2621} {"train_info/time_between_train_steps": 0.0031566619873046875, "step": 2621} {"info/global_step": 2622, "train_info/time_within_train_step": 2.357226610183716, "step": 2622} {"train_info/time_between_train_steps": 0.0031118392944335938, "step": 2622} {"info/global_step": 2623, "train_info/time_within_train_step": 2.356292963027954, "step": 2623} {"train_info/time_between_train_steps": 0.0031540393829345703, "step": 2623} {"info/global_step": 2624, "train_info/time_within_train_step": 2.3553285598754883, "step": 2624} {"train_info/time_between_train_steps": 0.003099679946899414, "step": 2624} {"info/global_step": 2625, "train_info/time_within_train_step": 2.357482671737671, "step": 2625} {"train_info/time_between_train_steps": 0.003238201141357422, "step": 2625} {"info/global_step": 2626, "train_info/time_within_train_step": 2.3571956157684326, "step": 2626} {"train_info/time_between_train_steps": 0.0031409263610839844, "step": 2626} {"info/global_step": 2627, "train_info/time_within_train_step": 2.356544017791748, "step": 2627} {"train_info/time_between_train_steps": 0.0031592845916748047, "step": 2627} {"info/global_step": 2628, "train_info/time_within_train_step": 2.3570408821105957, "step": 2628} {"train_info/time_between_train_steps": 0.0031099319458007812, "step": 2628} {"info/global_step": 2629, "train_info/time_within_train_step": 2.356255292892456, "step": 2629} {"train_info/time_between_train_steps": 0.003131389617919922, "step": 2629} {"info/global_step": 2630, "train_info/time_within_train_step": 2.356243848800659, "step": 2630} {"train_info/time_between_train_steps": 0.003111124038696289, "step": 2630} {"info/global_step": 2631, "train_info/time_within_train_step": 2.356398582458496, "step": 2631} {"train_info/time_between_train_steps": 0.0031523704528808594, "step": 2631} {"info/global_step": 2632, "train_info/time_within_train_step": 2.3559534549713135, "step": 2632} {"train_info/time_between_train_steps": 0.003180980682373047, "step": 2632} {"info/global_step": 2633, "train_info/time_within_train_step": 2.3561925888061523, "step": 2633} {"train_info/time_between_train_steps": 0.003307819366455078, "step": 2633} {"info/global_step": 2634, "train_info/time_within_train_step": 2.355468273162842, "step": 2634} {"train_info/time_between_train_steps": 0.003106355667114258, "step": 2634} {"info/global_step": 2635, "train_info/time_within_train_step": 2.3559556007385254, "step": 2635} {"train_info/time_between_train_steps": 0.0030825138092041016, "step": 2635} {"info/global_step": 2636, "train_info/time_within_train_step": 2.3558034896850586, "step": 2636} {"train_info/time_between_train_steps": 0.0030989646911621094, "step": 2636} {"info/global_step": 2637, "train_info/time_within_train_step": 2.3556065559387207, "step": 2637} {"train_info/time_between_train_steps": 0.0031104087829589844, "step": 2637} {"info/global_step": 2638, "train_info/time_within_train_step": 2.3551247119903564, "step": 2638} {"train_info/time_between_train_steps": 0.0031480789184570312, "step": 2638} {"info/global_step": 2639, "train_info/time_within_train_step": 2.35622239112854, "step": 2639} {"train_info/time_between_train_steps": 0.003144979476928711, "step": 2639} {"info/global_step": 2640, "train_info/time_within_train_step": 2.3549256324768066, "step": 2640} {"train_info/time_between_train_steps": 0.0031359195709228516, "step": 2640} {"info/global_step": 2641, "train_info/time_within_train_step": 2.3792645931243896, "step": 2641} {"train_info/time_between_train_steps": 0.00310516357421875, "step": 2641} {"info/global_step": 2642, "train_info/time_within_train_step": 2.3560855388641357, "step": 2642} {"train_info/time_between_train_steps": 0.0030965805053710938, "step": 2642} {"info/global_step": 2643, "train_info/time_within_train_step": 2.4739153385162354, "step": 2643} {"train_info/time_between_train_steps": 0.0032227039337158203, "step": 2643} {"info/global_step": 2644, "train_info/time_within_train_step": 2.355682849884033, "step": 2644} {"train_info/time_between_train_steps": 0.0031752586364746094, "step": 2644} {"info/global_step": 2645, "train_info/time_within_train_step": 2.5591506958007812, "step": 2645} {"train_info/time_between_train_steps": 0.003142833709716797, "step": 2645} {"info/global_step": 2646, "train_info/time_within_train_step": 2.354957103729248, "step": 2646} {"train_info/time_between_train_steps": 0.0031175613403320312, "step": 2646} {"info/global_step": 2647, "train_info/time_within_train_step": 2.354527473449707, "step": 2647} {"train_info/time_between_train_steps": 0.003155231475830078, "step": 2647} {"info/global_step": 2648, "train_info/time_within_train_step": 2.3550381660461426, "step": 2648} {"train_info/time_between_train_steps": 0.003122091293334961, "step": 2648} {"info/global_step": 2649, "train_info/time_within_train_step": 2.35526967048645, "step": 2649} {"train_info/time_between_train_steps": 0.003158092498779297, "step": 2649} {"info/global_step": 2650, "train_info/time_within_train_step": 2.35524582862854, "step": 2650} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 8708.0, "train_info/memory_max_reserved": 8708.0, "_timestamp": 1746259030, "_runtime": 6849}, "step": 2650} {"logs": {"train/loss": 3.7206, "train/learning_rate": 7.777777777777777e-05, "train/epoch": 3.02, "_timestamp": 1746259030, "_runtime": 6849}, "step": 2650} {"train_info/time_between_train_steps": 0.024163246154785156, "step": 2650} {"info/global_step": 2651, "train_info/time_within_train_step": 2.3552069664001465, "step": 2651} {"train_info/time_between_train_steps": 0.0033354759216308594, "step": 2651} {"info/global_step": 2652, "train_info/time_within_train_step": 2.355862617492676, "step": 2652} {"train_info/time_between_train_steps": 0.0033147335052490234, "step": 2652} {"info/global_step": 2653, "train_info/time_within_train_step": 2.354928731918335, "step": 2653} {"train_info/time_between_train_steps": 0.0031752586364746094, "step": 2653} {"info/global_step": 2654, "train_info/time_within_train_step": 2.3563733100891113, "step": 2654} {"train_info/time_between_train_steps": 0.003143787384033203, "step": 2654} {"info/global_step": 2655, "train_info/time_within_train_step": 2.3558976650238037, "step": 2655} {"train_info/time_between_train_steps": 0.0031278133392333984, "step": 2655} {"info/global_step": 2656, "train_info/time_within_train_step": 2.355358123779297, "step": 2656} {"train_info/time_between_train_steps": 0.003156423568725586, "step": 2656} {"info/global_step": 2657, "train_info/time_within_train_step": 2.3561131954193115, "step": 2657} {"train_info/time_between_train_steps": 0.00321197509765625, "step": 2657} {"info/global_step": 2658, "train_info/time_within_train_step": 2.3556807041168213, "step": 2658} {"train_info/time_between_train_steps": 0.0031423568725585938, "step": 2658} {"info/global_step": 2659, "train_info/time_within_train_step": 2.355522632598877, "step": 2659} {"train_info/time_between_train_steps": 0.003156900405883789, "step": 2659} {"info/global_step": 2660, "train_info/time_within_train_step": 2.3564555644989014, "step": 2660} {"train_info/time_between_train_steps": 0.003127574920654297, "step": 2660} {"info/global_step": 2661, "train_info/time_within_train_step": 2.354987621307373, "step": 2661} {"train_info/time_between_train_steps": 0.0031769275665283203, "step": 2661} {"info/global_step": 2662, "train_info/time_within_train_step": 2.3554744720458984, "step": 2662} {"train_info/time_between_train_steps": 0.0031676292419433594, "step": 2662} {"info/global_step": 2663, "train_info/time_within_train_step": 2.3558192253112793, "step": 2663} {"train_info/time_between_train_steps": 0.003146648406982422, "step": 2663} {"info/global_step": 2664, "train_info/time_within_train_step": 2.3560686111450195, "step": 2664} {"train_info/time_between_train_steps": 0.0031375885009765625, "step": 2664} {"info/global_step": 2665, "train_info/time_within_train_step": 2.355438232421875, "step": 2665} {"train_info/time_between_train_steps": 0.0031843185424804688, "step": 2665} {"info/global_step": 2666, "train_info/time_within_train_step": 2.356710910797119, "step": 2666} {"train_info/time_between_train_steps": 0.0031392574310302734, "step": 2666} {"info/global_step": 2667, "train_info/time_within_train_step": 2.3549644947052, "step": 2667} {"train_info/time_between_train_steps": 0.0031349658966064453, "step": 2667} {"info/global_step": 2668, "train_info/time_within_train_step": 2.3551759719848633, "step": 2668} {"train_info/time_between_train_steps": 0.0031671524047851562, "step": 2668} {"info/global_step": 2669, "train_info/time_within_train_step": 2.5693910121917725, "step": 2669} {"train_info/time_between_train_steps": 0.0032112598419189453, "step": 2669} {"info/global_step": 2670, "train_info/time_within_train_step": 2.3559439182281494, "step": 2670} {"train_info/time_between_train_steps": 0.0031702518463134766, "step": 2670} {"info/global_step": 2671, "train_info/time_within_train_step": 2.3561511039733887, "step": 2671} {"train_info/time_between_train_steps": 0.003138303756713867, "step": 2671} {"info/global_step": 2672, "train_info/time_within_train_step": 2.3553307056427, "step": 2672} {"train_info/time_between_train_steps": 0.0031461715698242188, "step": 2672} {"info/global_step": 2673, "train_info/time_within_train_step": 2.3547632694244385, "step": 2673} {"train_info/time_between_train_steps": 0.003215312957763672, "step": 2673} {"info/global_step": 2674, "train_info/time_within_train_step": 2.3552920818328857, "step": 2674} {"train_info/time_between_train_steps": 0.0031974315643310547, "step": 2674} {"info/global_step": 2675, "train_info/time_within_train_step": 2.354264974594116, "step": 2675} {"train_info/time_between_train_steps": 0.003163576126098633, "step": 2675} {"info/global_step": 2676, "train_info/time_within_train_step": 2.3553051948547363, "step": 2676} {"train_info/time_between_train_steps": 0.0031566619873046875, "step": 2676} {"info/global_step": 2677, "train_info/time_within_train_step": 2.3564352989196777, "step": 2677} {"train_info/time_between_train_steps": 0.0031538009643554688, "step": 2677} {"info/global_step": 2678, "train_info/time_within_train_step": 2.3553359508514404, "step": 2678} {"train_info/time_between_train_steps": 0.003141641616821289, "step": 2678} {"info/global_step": 2679, "train_info/time_within_train_step": 2.3555877208709717, "step": 2679} {"train_info/time_between_train_steps": 0.0031251907348632812, "step": 2679} {"info/global_step": 2680, "train_info/time_within_train_step": 2.3551712036132812, "step": 2680} {"train_info/time_between_train_steps": 0.0031478404998779297, "step": 2680} {"info/global_step": 2681, "train_info/time_within_train_step": 2.3555188179016113, "step": 2681} {"train_info/time_between_train_steps": 0.0031244754791259766, "step": 2681} {"info/global_step": 2682, "train_info/time_within_train_step": 2.3542046546936035, "step": 2682} {"train_info/time_between_train_steps": 0.0031824111938476562, "step": 2682} {"info/global_step": 2683, "train_info/time_within_train_step": 2.354661226272583, "step": 2683} {"train_info/time_between_train_steps": 0.0031194686889648438, "step": 2683} {"info/global_step": 2684, "train_info/time_within_train_step": 2.3547427654266357, "step": 2684} {"train_info/time_between_train_steps": 0.003104686737060547, "step": 2684} {"info/global_step": 2685, "train_info/time_within_train_step": 2.3544559478759766, "step": 2685} {"train_info/time_between_train_steps": 0.0031075477600097656, "step": 2685} {"info/global_step": 2686, "train_info/time_within_train_step": 2.3548450469970703, "step": 2686} {"train_info/time_between_train_steps": 0.003119230270385742, "step": 2686} {"info/global_step": 2687, "train_info/time_within_train_step": 2.3559701442718506, "step": 2687} {"train_info/time_between_train_steps": 0.0031800270080566406, "step": 2687} {"info/global_step": 2688, "train_info/time_within_train_step": 2.354808807373047, "step": 2688} {"train_info/time_between_train_steps": 0.003126859664916992, "step": 2688} {"info/global_step": 2689, "train_info/time_within_train_step": 2.356010913848877, "step": 2689} {"train_info/time_between_train_steps": 0.003161907196044922, "step": 2689} {"info/global_step": 2690, "train_info/time_within_train_step": 2.3550822734832764, "step": 2690} {"train_info/time_between_train_steps": 0.0031197071075439453, "step": 2690} {"info/global_step": 2691, "train_info/time_within_train_step": 2.356194257736206, "step": 2691} {"train_info/time_between_train_steps": 0.0031082630157470703, "step": 2691} {"info/global_step": 2692, "train_info/time_within_train_step": 2.3560903072357178, "step": 2692} {"train_info/time_between_train_steps": 0.003104686737060547, "step": 2692} {"info/global_step": 2693, "train_info/time_within_train_step": 2.3541009426116943, "step": 2693} {"train_info/time_between_train_steps": 0.0031518936157226562, "step": 2693} {"info/global_step": 2694, "train_info/time_within_train_step": 2.5651683807373047, "step": 2694} {"train_info/time_between_train_steps": 0.003160238265991211, "step": 2694} {"info/global_step": 2695, "train_info/time_within_train_step": 2.3543143272399902, "step": 2695} {"train_info/time_between_train_steps": 0.003147125244140625, "step": 2695} {"info/global_step": 2696, "train_info/time_within_train_step": 2.353349447250366, "step": 2696} {"train_info/time_between_train_steps": 0.0031425952911376953, "step": 2696} {"info/global_step": 2697, "train_info/time_within_train_step": 2.3551013469696045, "step": 2697} {"train_info/time_between_train_steps": 0.003142833709716797, "step": 2697} {"info/global_step": 2698, "train_info/time_within_train_step": 2.354938268661499, "step": 2698} {"train_info/time_between_train_steps": 0.0031218528747558594, "step": 2698} {"info/global_step": 2699, "train_info/time_within_train_step": 2.355727195739746, "step": 2699} {"train_info/time_between_train_steps": 0.00316619873046875, "step": 2699} {"info/global_step": 2700, "train_info/time_within_train_step": 2.3554251194000244, "step": 2700} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 8708.0, "train_info/memory_max_reserved": 8708.0, "_timestamp": 1746259150, "_runtime": 6969}, "step": 2700} {"logs": {"train/loss": 3.7077, "train/learning_rate": 6.666666666666666e-05, "train/epoch": 3.04, "_timestamp": 1746259150, "_runtime": 6969}, "step": 2700} {"train_info/time_between_train_steps": 18.525125980377197, "step": 2700} {"info/global_step": 2701, "train_info/time_within_train_step": 2.204319715499878, "step": 2701} {"train_info/time_between_train_steps": 0.003161907196044922, "step": 2701} {"info/global_step": 2702, "train_info/time_within_train_step": 2.1813621520996094, "step": 2702} {"train_info/time_between_train_steps": 0.0032281875610351562, "step": 2702} {"info/global_step": 2703, "train_info/time_within_train_step": 2.2295751571655273, "step": 2703} {"train_info/time_between_train_steps": 0.0031452178955078125, "step": 2703} {"info/global_step": 2704, "train_info/time_within_train_step": 2.348335027694702, "step": 2704} {"train_info/time_between_train_steps": 0.003183603286743164, "step": 2704} {"info/global_step": 2705, "train_info/time_within_train_step": 2.351865291595459, "step": 2705} {"train_info/time_between_train_steps": 0.12287282943725586, "step": 2705} {"info/global_step": 2706, "train_info/time_within_train_step": 2.371678113937378, "step": 2706} {"train_info/time_between_train_steps": 0.003180265426635742, "step": 2706} {"info/global_step": 2707, "train_info/time_within_train_step": 2.3549766540527344, "step": 2707} {"train_info/time_between_train_steps": 0.00321197509765625, "step": 2707} {"info/global_step": 2708, "train_info/time_within_train_step": 2.3553402423858643, "step": 2708} {"train_info/time_between_train_steps": 0.003211498260498047, "step": 2708} {"info/global_step": 2709, "train_info/time_within_train_step": 2.3567535877227783, "step": 2709} {"train_info/time_between_train_steps": 0.0031969547271728516, "step": 2709} {"info/global_step": 2710, "train_info/time_within_train_step": 2.3567659854888916, "step": 2710} {"train_info/time_between_train_steps": 0.0031621456146240234, "step": 2710} {"info/global_step": 2711, "train_info/time_within_train_step": 2.356602430343628, "step": 2711} {"train_info/time_between_train_steps": 0.0031261444091796875, "step": 2711} {"info/global_step": 2712, "train_info/time_within_train_step": 2.3556125164031982, "step": 2712} {"train_info/time_between_train_steps": 0.003148794174194336, "step": 2712} {"info/global_step": 2713, "train_info/time_within_train_step": 2.356523036956787, "step": 2713} {"train_info/time_between_train_steps": 0.0031676292419433594, "step": 2713} {"info/global_step": 2714, "train_info/time_within_train_step": 2.3571815490722656, "step": 2714} {"train_info/time_between_train_steps": 0.0031795501708984375, "step": 2714} {"info/global_step": 2715, "train_info/time_within_train_step": 2.356968402862549, "step": 2715} {"train_info/time_between_train_steps": 0.003185272216796875, "step": 2715} {"info/global_step": 2716, "train_info/time_within_train_step": 2.357203245162964, "step": 2716} {"train_info/time_between_train_steps": 0.003229856491088867, "step": 2716} {"info/global_step": 2717, "train_info/time_within_train_step": 2.357438802719116, "step": 2717} {"train_info/time_between_train_steps": 0.003145456314086914, "step": 2717} {"info/global_step": 2718, "train_info/time_within_train_step": 2.357232093811035, "step": 2718} {"train_info/time_between_train_steps": 0.003129243850708008, "step": 2718} {"info/global_step": 2719, "train_info/time_within_train_step": 2.539531946182251, "step": 2719} {"train_info/time_between_train_steps": 0.003221273422241211, "step": 2719} {"info/global_step": 2720, "train_info/time_within_train_step": 2.356771230697632, "step": 2720} {"train_info/time_between_train_steps": 0.0031838417053222656, "step": 2720} {"info/global_step": 2721, "train_info/time_within_train_step": 2.3564674854278564, "step": 2721} {"train_info/time_between_train_steps": 0.003139972686767578, "step": 2721} {"info/global_step": 2722, "train_info/time_within_train_step": 2.3570563793182373, "step": 2722} {"train_info/time_between_train_steps": 0.0031828880310058594, "step": 2722} {"info/global_step": 2723, "train_info/time_within_train_step": 2.3569998741149902, "step": 2723} {"train_info/time_between_train_steps": 0.003144502639770508, "step": 2723} {"info/global_step": 2724, "train_info/time_within_train_step": 2.3570990562438965, "step": 2724} {"train_info/time_between_train_steps": 0.0032129287719726562, "step": 2724} {"info/global_step": 2725, "train_info/time_within_train_step": 2.356614351272583, "step": 2725} {"train_info/time_between_train_steps": 0.0031642913818359375, "step": 2725} {"info/global_step": 2726, "train_info/time_within_train_step": 2.356311798095703, "step": 2726} {"train_info/time_between_train_steps": 0.0032279491424560547, "step": 2726} {"info/global_step": 2727, "train_info/time_within_train_step": 2.356170892715454, "step": 2727} {"train_info/time_between_train_steps": 0.0032265186309814453, "step": 2727} {"info/global_step": 2728, "train_info/time_within_train_step": 2.3563945293426514, "step": 2728} {"train_info/time_between_train_steps": 0.003163576126098633, "step": 2728} {"info/global_step": 2729, "train_info/time_within_train_step": 2.35701322555542, "step": 2729} {"train_info/time_between_train_steps": 0.0031309127807617188, "step": 2729} {"info/global_step": 2730, "train_info/time_within_train_step": 2.3571319580078125, "step": 2730} {"train_info/time_between_train_steps": 0.003147602081298828, "step": 2730} {"info/global_step": 2731, "train_info/time_within_train_step": 2.356194496154785, "step": 2731} {"train_info/time_between_train_steps": 0.003155231475830078, "step": 2731} {"info/global_step": 2732, "train_info/time_within_train_step": 2.357032299041748, "step": 2732} {"train_info/time_between_train_steps": 0.0031838417053222656, "step": 2732} {"info/global_step": 2733, "train_info/time_within_train_step": 2.3563005924224854, "step": 2733} {"train_info/time_between_train_steps": 0.003173351287841797, "step": 2733} {"info/global_step": 2734, "train_info/time_within_train_step": 2.3790643215179443, "step": 2734} {"train_info/time_between_train_steps": 0.0031609535217285156, "step": 2734} {"info/global_step": 2735, "train_info/time_within_train_step": 2.356501579284668, "step": 2735} {"train_info/time_between_train_steps": 0.0031554698944091797, "step": 2735} {"info/global_step": 2736, "train_info/time_within_train_step": 2.356330156326294, "step": 2736} {"train_info/time_between_train_steps": 0.0031418800354003906, "step": 2736} {"info/global_step": 2737, "train_info/time_within_train_step": 2.3568482398986816, "step": 2737} {"train_info/time_between_train_steps": 0.003182649612426758, "step": 2737} {"info/global_step": 2738, "train_info/time_within_train_step": 2.3566811084747314, "step": 2738} {"train_info/time_between_train_steps": 0.0031747817993164062, "step": 2738} {"info/global_step": 2739, "train_info/time_within_train_step": 2.3556618690490723, "step": 2739} {"train_info/time_between_train_steps": 0.003210783004760742, "step": 2739} {"info/global_step": 2740, "train_info/time_within_train_step": 2.356609582901001, "step": 2740} {"train_info/time_between_train_steps": 0.0031273365020751953, "step": 2740} {"info/global_step": 2741, "train_info/time_within_train_step": 2.3554985523223877, "step": 2741} {"train_info/time_between_train_steps": 0.0031595230102539062, "step": 2741} {"info/global_step": 2742, "train_info/time_within_train_step": 2.35575532913208, "step": 2742} {"train_info/time_between_train_steps": 0.003117084503173828, "step": 2742} {"info/global_step": 2743, "train_info/time_within_train_step": 2.35654354095459, "step": 2743} {"train_info/time_between_train_steps": 0.003148794174194336, "step": 2743} {"info/global_step": 2744, "train_info/time_within_train_step": 2.3556299209594727, "step": 2744} {"train_info/time_between_train_steps": 0.003127574920654297, "step": 2744} {"info/global_step": 2745, "train_info/time_within_train_step": 2.548229694366455, "step": 2745} {"train_info/time_between_train_steps": 0.003203153610229492, "step": 2745} {"info/global_step": 2746, "train_info/time_within_train_step": 2.3562235832214355, "step": 2746} {"train_info/time_between_train_steps": 0.0031185150146484375, "step": 2746} {"info/global_step": 2747, "train_info/time_within_train_step": 2.3557474613189697, "step": 2747} {"train_info/time_between_train_steps": 0.003108501434326172, "step": 2747} {"info/global_step": 2748, "train_info/time_within_train_step": 2.35671329498291, "step": 2748} {"train_info/time_between_train_steps": 0.0031135082244873047, "step": 2748} {"info/global_step": 2749, "train_info/time_within_train_step": 2.915468454360962, "step": 2749} {"train_info/time_between_train_steps": 0.0034410953521728516, "step": 2749} {"info/global_step": 2750, "train_info/time_within_train_step": 2.355818748474121, "step": 2750} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 8708.0, "train_info/memory_max_reserved": 8708.0, "_timestamp": 1746259288, "_runtime": 7107}, "step": 2750} {"logs": {"train/loss": 3.6924, "train/learning_rate": 5.5555555555555545e-05, "train/epoch": 3.06, "_timestamp": 1746259288, "_runtime": 7107}, "step": 2750} {"train_info/time_between_train_steps": 0.024300098419189453, "step": 2750} {"info/global_step": 2751, "train_info/time_within_train_step": 2.3569252490997314, "step": 2751} {"train_info/time_between_train_steps": 0.0031397342681884766, "step": 2751} {"info/global_step": 2752, "train_info/time_within_train_step": 2.3549141883850098, "step": 2752} {"train_info/time_between_train_steps": 0.003121614456176758, "step": 2752} {"info/global_step": 2753, "train_info/time_within_train_step": 2.3562755584716797, "step": 2753} {"train_info/time_between_train_steps": 0.0031626224517822266, "step": 2753} {"info/global_step": 2754, "train_info/time_within_train_step": 2.3572452068328857, "step": 2754} {"train_info/time_between_train_steps": 0.003119230270385742, "step": 2754} {"info/global_step": 2755, "train_info/time_within_train_step": 2.354877471923828, "step": 2755} {"train_info/time_between_train_steps": 0.003206491470336914, "step": 2755} {"info/global_step": 2756, "train_info/time_within_train_step": 2.356687068939209, "step": 2756} {"train_info/time_between_train_steps": 0.003179311752319336, "step": 2756} {"info/global_step": 2757, "train_info/time_within_train_step": 2.3565056324005127, "step": 2757} {"train_info/time_between_train_steps": 0.003145933151245117, "step": 2757} {"info/global_step": 2758, "train_info/time_within_train_step": 2.355031728744507, "step": 2758} {"train_info/time_between_train_steps": 0.0031287670135498047, "step": 2758} {"info/global_step": 2759, "train_info/time_within_train_step": 2.355947971343994, "step": 2759} {"train_info/time_between_train_steps": 0.0031099319458007812, "step": 2759} {"info/global_step": 2760, "train_info/time_within_train_step": 2.356513500213623, "step": 2760} {"train_info/time_between_train_steps": 0.003111600875854492, "step": 2760} {"info/global_step": 2761, "train_info/time_within_train_step": 2.35493803024292, "step": 2761} {"train_info/time_between_train_steps": 0.00308990478515625, "step": 2761} {"info/global_step": 2762, "train_info/time_within_train_step": 2.355586528778076, "step": 2762} {"train_info/time_between_train_steps": 0.003179311752319336, "step": 2762} {"info/global_step": 2763, "train_info/time_within_train_step": 2.355010509490967, "step": 2763} {"train_info/time_between_train_steps": 0.003177165985107422, "step": 2763} {"info/global_step": 2764, "train_info/time_within_train_step": 2.355905294418335, "step": 2764} {"train_info/time_between_train_steps": 0.0031745433807373047, "step": 2764} {"info/global_step": 2765, "train_info/time_within_train_step": 2.3551719188690186, "step": 2765} {"train_info/time_between_train_steps": 0.003108501434326172, "step": 2765} {"info/global_step": 2766, "train_info/time_within_train_step": 2.3555374145507812, "step": 2766} {"train_info/time_between_train_steps": 0.003112316131591797, "step": 2766} {"info/global_step": 2767, "train_info/time_within_train_step": 2.355834484100342, "step": 2767} {"train_info/time_between_train_steps": 0.0030918121337890625, "step": 2767} {"info/global_step": 2768, "train_info/time_within_train_step": 2.4920461177825928, "step": 2768} {"train_info/time_between_train_steps": 0.0031468868255615234, "step": 2768} {"info/global_step": 2769, "train_info/time_within_train_step": 2.3556602001190186, "step": 2769} {"train_info/time_between_train_steps": 0.003195047378540039, "step": 2769} {"info/global_step": 2770, "train_info/time_within_train_step": 2.572103500366211, "step": 2770} {"train_info/time_between_train_steps": 0.0031099319458007812, "step": 2770} {"info/global_step": 2771, "train_info/time_within_train_step": 2.3570291996002197, "step": 2771} {"train_info/time_between_train_steps": 0.0031280517578125, "step": 2771} {"info/global_step": 2772, "train_info/time_within_train_step": 2.3557353019714355, "step": 2772} {"train_info/time_between_train_steps": 0.0031528472900390625, "step": 2772} {"info/global_step": 2773, "train_info/time_within_train_step": 2.3550827503204346, "step": 2773} {"train_info/time_between_train_steps": 0.0031151771545410156, "step": 2773} {"info/global_step": 2774, "train_info/time_within_train_step": 2.3555989265441895, "step": 2774} {"train_info/time_between_train_steps": 0.0031728744506835938, "step": 2774} {"info/global_step": 2775, "train_info/time_within_train_step": 2.355922222137451, "step": 2775} {"train_info/time_between_train_steps": 0.0031485557556152344, "step": 2775} {"info/global_step": 2776, "train_info/time_within_train_step": 2.3555805683135986, "step": 2776} {"train_info/time_between_train_steps": 0.0031404495239257812, "step": 2776} {"info/global_step": 2777, "train_info/time_within_train_step": 2.3547449111938477, "step": 2777} {"train_info/time_between_train_steps": 0.0031156539916992188, "step": 2777} {"info/global_step": 2778, "train_info/time_within_train_step": 2.3560450077056885, "step": 2778} {"train_info/time_between_train_steps": 0.0031576156616210938, "step": 2778} {"info/global_step": 2779, "train_info/time_within_train_step": 2.3564722537994385, "step": 2779} {"train_info/time_between_train_steps": 0.0032024383544921875, "step": 2779} {"info/global_step": 2780, "train_info/time_within_train_step": 2.356031656265259, "step": 2780} {"train_info/time_between_train_steps": 0.003148317337036133, "step": 2780} {"info/global_step": 2781, "train_info/time_within_train_step": 2.3559505939483643, "step": 2781} {"train_info/time_between_train_steps": 0.0031812191009521484, "step": 2781} {"info/global_step": 2782, "train_info/time_within_train_step": 2.355543613433838, "step": 2782} {"train_info/time_between_train_steps": 0.0031735897064208984, "step": 2782} {"info/global_step": 2783, "train_info/time_within_train_step": 2.3559329509735107, "step": 2783} {"train_info/time_between_train_steps": 0.003122568130493164, "step": 2783} {"info/global_step": 2784, "train_info/time_within_train_step": 2.3783679008483887, "step": 2784} {"train_info/time_between_train_steps": 0.003108978271484375, "step": 2784} {"info/global_step": 2785, "train_info/time_within_train_step": 2.3557543754577637, "step": 2785} {"train_info/time_between_train_steps": 0.0031251907348632812, "step": 2785} {"info/global_step": 2786, "train_info/time_within_train_step": 2.3566296100616455, "step": 2786} {"train_info/time_between_train_steps": 0.0031278133392333984, "step": 2786} {"info/global_step": 2787, "train_info/time_within_train_step": 2.3561043739318848, "step": 2787} {"train_info/time_between_train_steps": 0.003193378448486328, "step": 2787} {"info/global_step": 2788, "train_info/time_within_train_step": 2.355071783065796, "step": 2788} {"train_info/time_between_train_steps": 0.003143310546875, "step": 2788} {"info/global_step": 2789, "train_info/time_within_train_step": 2.3563661575317383, "step": 2789} {"train_info/time_between_train_steps": 0.003123044967651367, "step": 2789} {"info/global_step": 2790, "train_info/time_within_train_step": 2.3561832904815674, "step": 2790} {"train_info/time_between_train_steps": 0.003103494644165039, "step": 2790} {"info/global_step": 2791, "train_info/time_within_train_step": 2.3556642532348633, "step": 2791} {"train_info/time_between_train_steps": 0.0030975341796875, "step": 2791} {"info/global_step": 2792, "train_info/time_within_train_step": 2.3565869331359863, "step": 2792} {"train_info/time_between_train_steps": 0.00311279296875, "step": 2792} {"info/global_step": 2793, "train_info/time_within_train_step": 2.3567090034484863, "step": 2793} {"train_info/time_between_train_steps": 0.003147602081298828, "step": 2793} {"info/global_step": 2794, "train_info/time_within_train_step": 2.3559372425079346, "step": 2794} {"train_info/time_between_train_steps": 0.0031576156616210938, "step": 2794} {"info/global_step": 2795, "train_info/time_within_train_step": 2.5728704929351807, "step": 2795} {"train_info/time_between_train_steps": 0.003168821334838867, "step": 2795} {"info/global_step": 2796, "train_info/time_within_train_step": 2.35617733001709, "step": 2796} {"train_info/time_between_train_steps": 0.003102540969848633, "step": 2796} {"info/global_step": 2797, "train_info/time_within_train_step": 2.35587477684021, "step": 2797} {"train_info/time_between_train_steps": 0.003100156784057617, "step": 2797} {"info/global_step": 2798, "train_info/time_within_train_step": 2.3544297218322754, "step": 2798} {"train_info/time_between_train_steps": 0.0031485557556152344, "step": 2798} {"info/global_step": 2799, "train_info/time_within_train_step": 2.3549723625183105, "step": 2799} {"train_info/time_between_train_steps": 0.003155946731567383, "step": 2799} {"info/global_step": 2800, "train_info/time_within_train_step": 2.3546035289764404, "step": 2800} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 8708.0, "train_info/memory_max_reserved": 8708.0, "_timestamp": 1746259407, "_runtime": 7226}, "step": 2800} {"logs": {"train/loss": 3.6905, "train/learning_rate": 4.444444444444444e-05, "train/epoch": 3.07, "_timestamp": 1746259407, "_runtime": 7226}, "step": 2800} {"train_info/time_between_train_steps": 19.83733558654785, "step": 2800} {"info/global_step": 2801, "train_info/time_within_train_step": 2.202332019805908, "step": 2801} {"train_info/time_between_train_steps": 0.0031545162200927734, "step": 2801} {"info/global_step": 2802, "train_info/time_within_train_step": 2.1799564361572266, "step": 2802} {"train_info/time_between_train_steps": 0.003194570541381836, "step": 2802} {"info/global_step": 2803, "train_info/time_within_train_step": 2.188382625579834, "step": 2803} {"train_info/time_between_train_steps": 0.00316619873046875, "step": 2803} {"info/global_step": 2804, "train_info/time_within_train_step": 2.3288280963897705, "step": 2804} {"train_info/time_between_train_steps": 0.003173351287841797, "step": 2804} {"info/global_step": 2805, "train_info/time_within_train_step": 2.3513295650482178, "step": 2805} {"train_info/time_between_train_steps": 0.0031442642211914062, "step": 2805} {"info/global_step": 2806, "train_info/time_within_train_step": 2.3541066646575928, "step": 2806} {"train_info/time_between_train_steps": 0.0031867027282714844, "step": 2806} {"info/global_step": 2807, "train_info/time_within_train_step": 2.3561954498291016, "step": 2807} {"train_info/time_between_train_steps": 0.0031652450561523438, "step": 2807} {"info/global_step": 2808, "train_info/time_within_train_step": 2.355384349822998, "step": 2808} {"train_info/time_between_train_steps": 0.0031774044036865234, "step": 2808} {"info/global_step": 2809, "train_info/time_within_train_step": 2.3572096824645996, "step": 2809} {"train_info/time_between_train_steps": 0.003171682357788086, "step": 2809} {"info/global_step": 2810, "train_info/time_within_train_step": 2.355830669403076, "step": 2810} {"train_info/time_between_train_steps": 0.0031747817993164062, "step": 2810} {"info/global_step": 2811, "train_info/time_within_train_step": 2.3562262058258057, "step": 2811} {"train_info/time_between_train_steps": 0.0031142234802246094, "step": 2811} {"info/global_step": 2812, "train_info/time_within_train_step": 2.3566644191741943, "step": 2812} {"train_info/time_between_train_steps": 0.003101348876953125, "step": 2812} {"info/global_step": 2813, "train_info/time_within_train_step": 2.3562605381011963, "step": 2813} {"train_info/time_between_train_steps": 0.0031113624572753906, "step": 2813} {"info/global_step": 2814, "train_info/time_within_train_step": 2.3554835319519043, "step": 2814} {"train_info/time_between_train_steps": 0.003103494644165039, "step": 2814} {"info/global_step": 2815, "train_info/time_within_train_step": 2.355545997619629, "step": 2815} {"train_info/time_between_train_steps": 0.00315093994140625, "step": 2815} {"info/global_step": 2816, "train_info/time_within_train_step": 2.3668808937072754, "step": 2816} {"train_info/time_between_train_steps": 0.0031838417053222656, "step": 2816} {"info/global_step": 2817, "train_info/time_within_train_step": 2.3559248447418213, "step": 2817} {"train_info/time_between_train_steps": 0.0031228065490722656, "step": 2817} {"info/global_step": 2818, "train_info/time_within_train_step": 2.3563387393951416, "step": 2818} {"train_info/time_between_train_steps": 0.003117084503173828, "step": 2818} {"info/global_step": 2819, "train_info/time_within_train_step": 2.356184244155884, "step": 2819} {"train_info/time_between_train_steps": 0.0030927658081054688, "step": 2819} {"info/global_step": 2820, "train_info/time_within_train_step": 2.5724120140075684, "step": 2820} {"train_info/time_between_train_steps": 0.003097057342529297, "step": 2820} {"info/global_step": 2821, "train_info/time_within_train_step": 2.354921817779541, "step": 2821} {"train_info/time_between_train_steps": 0.003251314163208008, "step": 2821} {"info/global_step": 2822, "train_info/time_within_train_step": 2.3566510677337646, "step": 2822} {"train_info/time_between_train_steps": 0.003174304962158203, "step": 2822} {"info/global_step": 2823, "train_info/time_within_train_step": 2.356414794921875, "step": 2823} {"train_info/time_between_train_steps": 0.003147125244140625, "step": 2823} {"info/global_step": 2824, "train_info/time_within_train_step": 2.3562848567962646, "step": 2824} {"train_info/time_between_train_steps": 0.0031723976135253906, "step": 2824} {"info/global_step": 2825, "train_info/time_within_train_step": 2.3570914268493652, "step": 2825} {"train_info/time_between_train_steps": 0.003191709518432617, "step": 2825} {"info/global_step": 2826, "train_info/time_within_train_step": 2.3569793701171875, "step": 2826} {"train_info/time_between_train_steps": 0.0031697750091552734, "step": 2826} {"info/global_step": 2827, "train_info/time_within_train_step": 2.3566644191741943, "step": 2827} {"train_info/time_between_train_steps": 0.0031096935272216797, "step": 2827} {"info/global_step": 2828, "train_info/time_within_train_step": 2.357140064239502, "step": 2828} {"train_info/time_between_train_steps": 0.003139495849609375, "step": 2828} {"info/global_step": 2829, "train_info/time_within_train_step": 2.357125759124756, "step": 2829} {"train_info/time_between_train_steps": 0.003163576126098633, "step": 2829} {"info/global_step": 2830, "train_info/time_within_train_step": 2.356532335281372, "step": 2830} {"train_info/time_between_train_steps": 0.12181735038757324, "step": 2830} {"info/global_step": 2831, "train_info/time_within_train_step": 2.357609748840332, "step": 2831} {"train_info/time_between_train_steps": 0.003122091293334961, "step": 2831} {"info/global_step": 2832, "train_info/time_within_train_step": 2.355785608291626, "step": 2832} {"train_info/time_between_train_steps": 0.0031423568725585938, "step": 2832} {"info/global_step": 2833, "train_info/time_within_train_step": 2.35630202293396, "step": 2833} {"train_info/time_between_train_steps": 0.0031549930572509766, "step": 2833} {"info/global_step": 2834, "train_info/time_within_train_step": 2.3560800552368164, "step": 2834} {"train_info/time_between_train_steps": 0.0032095909118652344, "step": 2834} {"info/global_step": 2835, "train_info/time_within_train_step": 2.3565735816955566, "step": 2835} {"train_info/time_between_train_steps": 0.003176450729370117, "step": 2835} {"info/global_step": 2836, "train_info/time_within_train_step": 2.3559978008270264, "step": 2836} {"train_info/time_between_train_steps": 0.0031473636627197266, "step": 2836} {"info/global_step": 2837, "train_info/time_within_train_step": 2.3553030490875244, "step": 2837} {"train_info/time_between_train_steps": 0.003138303756713867, "step": 2837} {"info/global_step": 2838, "train_info/time_within_train_step": 2.3564701080322266, "step": 2838} {"train_info/time_between_train_steps": 0.003160715103149414, "step": 2838} {"info/global_step": 2839, "train_info/time_within_train_step": 2.356351852416992, "step": 2839} {"train_info/time_between_train_steps": 0.003466367721557617, "step": 2839} {"info/global_step": 2840, "train_info/time_within_train_step": 2.355546474456787, "step": 2840} {"train_info/time_between_train_steps": 0.0031986236572265625, "step": 2840} {"info/global_step": 2841, "train_info/time_within_train_step": 2.356843948364258, "step": 2841} {"train_info/time_between_train_steps": 0.003234386444091797, "step": 2841} {"info/global_step": 2842, "train_info/time_within_train_step": 2.3564114570617676, "step": 2842} {"train_info/time_between_train_steps": 0.003254413604736328, "step": 2842} {"info/global_step": 2843, "train_info/time_within_train_step": 2.355050563812256, "step": 2843} {"train_info/time_between_train_steps": 0.0032045841217041016, "step": 2843} {"info/global_step": 2844, "train_info/time_within_train_step": 2.356241464614868, "step": 2844} {"train_info/time_between_train_steps": 0.0031728744506835938, "step": 2844} {"info/global_step": 2845, "train_info/time_within_train_step": 2.595177173614502, "step": 2845} {"train_info/time_between_train_steps": 0.0031266212463378906, "step": 2845} {"info/global_step": 2846, "train_info/time_within_train_step": 2.355041742324829, "step": 2846} {"train_info/time_between_train_steps": 0.003151416778564453, "step": 2846} {"info/global_step": 2847, "train_info/time_within_train_step": 2.3556361198425293, "step": 2847} {"train_info/time_between_train_steps": 0.0032083988189697266, "step": 2847} {"info/global_step": 2848, "train_info/time_within_train_step": 2.3559348583221436, "step": 2848} {"train_info/time_between_train_steps": 0.0031354427337646484, "step": 2848} {"info/global_step": 2849, "train_info/time_within_train_step": 2.3566668033599854, "step": 2849} {"train_info/time_between_train_steps": 0.0031876564025878906, "step": 2849} {"info/global_step": 2850, "train_info/time_within_train_step": 2.3563194274902344, "step": 2850} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 8708.0, "train_info/memory_max_reserved": 8708.0, "_timestamp": 1746259546, "_runtime": 7365}, "step": 2850} {"logs": {"train/loss": 3.677, "train/learning_rate": 3.333333333333333e-05, "train/epoch": 3.09, "_timestamp": 1746259546, "_runtime": 7365}, "step": 2850} {"train_info/time_between_train_steps": 0.024022817611694336, "step": 2850} {"info/global_step": 2851, "train_info/time_within_train_step": 2.3564159870147705, "step": 2851} {"train_info/time_between_train_steps": 0.00313568115234375, "step": 2851} {"info/global_step": 2852, "train_info/time_within_train_step": 2.356706142425537, "step": 2852} {"train_info/time_between_train_steps": 0.003161191940307617, "step": 2852} {"info/global_step": 2853, "train_info/time_within_train_step": 2.3556089401245117, "step": 2853} {"train_info/time_between_train_steps": 0.003167390823364258, "step": 2853} {"info/global_step": 2854, "train_info/time_within_train_step": 2.356051445007324, "step": 2854} {"train_info/time_between_train_steps": 0.003139495849609375, "step": 2854} {"info/global_step": 2855, "train_info/time_within_train_step": 2.3573825359344482, "step": 2855} {"train_info/time_between_train_steps": 0.0031273365020751953, "step": 2855} {"info/global_step": 2856, "train_info/time_within_train_step": 2.3556387424468994, "step": 2856} {"train_info/time_between_train_steps": 0.0031468868255615234, "step": 2856} {"info/global_step": 2857, "train_info/time_within_train_step": 2.3553247451782227, "step": 2857} {"train_info/time_between_train_steps": 0.0032019615173339844, "step": 2857} {"info/global_step": 2858, "train_info/time_within_train_step": 2.356567621231079, "step": 2858} {"train_info/time_between_train_steps": 0.0031778812408447266, "step": 2858} {"info/global_step": 2859, "train_info/time_within_train_step": 2.3559091091156006, "step": 2859} {"train_info/time_between_train_steps": 0.0031311511993408203, "step": 2859} {"info/global_step": 2860, "train_info/time_within_train_step": 2.3555164337158203, "step": 2860} {"train_info/time_between_train_steps": 0.003163576126098633, "step": 2860} {"info/global_step": 2861, "train_info/time_within_train_step": 2.3558244705200195, "step": 2861} {"train_info/time_between_train_steps": 0.003124237060546875, "step": 2861} {"info/global_step": 2862, "train_info/time_within_train_step": 2.3562369346618652, "step": 2862} {"train_info/time_between_train_steps": 0.003133058547973633, "step": 2862} {"info/global_step": 2863, "train_info/time_within_train_step": 2.354630947113037, "step": 2863} {"train_info/time_between_train_steps": 0.0031194686889648438, "step": 2863} {"info/global_step": 2864, "train_info/time_within_train_step": 2.3562214374542236, "step": 2864} {"train_info/time_between_train_steps": 0.00311279296875, "step": 2864} {"info/global_step": 2865, "train_info/time_within_train_step": 2.3560967445373535, "step": 2865} {"train_info/time_between_train_steps": 0.003144502639770508, "step": 2865} {"info/global_step": 2866, "train_info/time_within_train_step": 2.3564095497131348, "step": 2866} {"train_info/time_between_train_steps": 0.0031523704528808594, "step": 2866} {"info/global_step": 2867, "train_info/time_within_train_step": 2.3556289672851562, "step": 2867} {"train_info/time_between_train_steps": 0.0031414031982421875, "step": 2867} {"info/global_step": 2868, "train_info/time_within_train_step": 2.356234550476074, "step": 2868} {"train_info/time_between_train_steps": 0.0031690597534179688, "step": 2868} {"info/global_step": 2869, "train_info/time_within_train_step": 2.5754380226135254, "step": 2869} {"train_info/time_between_train_steps": 0.0031714439392089844, "step": 2869} {"info/global_step": 2870, "train_info/time_within_train_step": 2.3553082942962646, "step": 2870} {"train_info/time_between_train_steps": 0.0031325817108154297, "step": 2870} {"info/global_step": 2871, "train_info/time_within_train_step": 2.356095790863037, "step": 2871} {"train_info/time_between_train_steps": 0.003152132034301758, "step": 2871} {"info/global_step": 2872, "train_info/time_within_train_step": 2.356694221496582, "step": 2872} {"train_info/time_between_train_steps": 0.003186464309692383, "step": 2872} {"info/global_step": 2873, "train_info/time_within_train_step": 2.3565125465393066, "step": 2873} {"train_info/time_between_train_steps": 0.0031232833862304688, "step": 2873} {"info/global_step": 2874, "train_info/time_within_train_step": 2.3550126552581787, "step": 2874} {"train_info/time_between_train_steps": 0.0032377243041992188, "step": 2874} {"info/global_step": 2875, "train_info/time_within_train_step": 2.355673313140869, "step": 2875} {"train_info/time_between_train_steps": 0.00322723388671875, "step": 2875} {"info/global_step": 2876, "train_info/time_within_train_step": 2.355909824371338, "step": 2876} {"train_info/time_between_train_steps": 0.0033257007598876953, "step": 2876} {"info/global_step": 2877, "train_info/time_within_train_step": 2.356269359588623, "step": 2877} {"train_info/time_between_train_steps": 0.0032837390899658203, "step": 2877} {"info/global_step": 2878, "train_info/time_within_train_step": 2.3564364910125732, "step": 2878} {"train_info/time_between_train_steps": 0.003226041793823242, "step": 2878} {"info/global_step": 2879, "train_info/time_within_train_step": 2.3565146923065186, "step": 2879} {"train_info/time_between_train_steps": 0.0032236576080322266, "step": 2879} {"info/global_step": 2880, "train_info/time_within_train_step": 2.356133460998535, "step": 2880} {"train_info/time_between_train_steps": 0.003163576126098633, "step": 2880} {"info/global_step": 2881, "train_info/time_within_train_step": 2.3570632934570312, "step": 2881} {"train_info/time_between_train_steps": 0.0032219886779785156, "step": 2881} {"info/global_step": 2882, "train_info/time_within_train_step": 2.356760025024414, "step": 2882} {"train_info/time_between_train_steps": 0.0031714439392089844, "step": 2882} {"info/global_step": 2883, "train_info/time_within_train_step": 2.3561060428619385, "step": 2883} {"train_info/time_between_train_steps": 0.0032253265380859375, "step": 2883} {"info/global_step": 2884, "train_info/time_within_train_step": 2.3550186157226562, "step": 2884} {"train_info/time_between_train_steps": 0.003225088119506836, "step": 2884} {"info/global_step": 2885, "train_info/time_within_train_step": 2.355815887451172, "step": 2885} {"train_info/time_between_train_steps": 0.003217935562133789, "step": 2885} {"info/global_step": 2886, "train_info/time_within_train_step": 2.3556602001190186, "step": 2886} {"train_info/time_between_train_steps": 0.003247976303100586, "step": 2886} {"info/global_step": 2887, "train_info/time_within_train_step": 2.354732036590576, "step": 2887} {"train_info/time_between_train_steps": 0.0031805038452148438, "step": 2887} {"info/global_step": 2888, "train_info/time_within_train_step": 2.3562440872192383, "step": 2888} {"train_info/time_between_train_steps": 0.0031549930572509766, "step": 2888} {"info/global_step": 2889, "train_info/time_within_train_step": 2.3559422492980957, "step": 2889} {"train_info/time_between_train_steps": 0.0032224655151367188, "step": 2889} {"info/global_step": 2890, "train_info/time_within_train_step": 2.355832815170288, "step": 2890} {"train_info/time_between_train_steps": 0.003287792205810547, "step": 2890} {"info/global_step": 2891, "train_info/time_within_train_step": 2.354262351989746, "step": 2891} {"train_info/time_between_train_steps": 0.003212451934814453, "step": 2891} {"info/global_step": 2892, "train_info/time_within_train_step": 2.356740713119507, "step": 2892} {"train_info/time_between_train_steps": 0.0031960010528564453, "step": 2892} {"info/global_step": 2893, "train_info/time_within_train_step": 2.7306129932403564, "step": 2893} {"train_info/time_between_train_steps": 0.0031845569610595703, "step": 2893} {"info/global_step": 2894, "train_info/time_within_train_step": 2.355848789215088, "step": 2894} {"train_info/time_between_train_steps": 0.0031442642211914062, "step": 2894} {"info/global_step": 2895, "train_info/time_within_train_step": 2.3551440238952637, "step": 2895} {"train_info/time_between_train_steps": 0.0031702518463134766, "step": 2895} {"info/global_step": 2896, "train_info/time_within_train_step": 2.425959825515747, "step": 2896} {"train_info/time_between_train_steps": 0.003146648406982422, "step": 2896} {"info/global_step": 2897, "train_info/time_within_train_step": 2.355511426925659, "step": 2897} {"train_info/time_between_train_steps": 0.003153085708618164, "step": 2897} {"info/global_step": 2898, "train_info/time_within_train_step": 2.3557791709899902, "step": 2898} {"train_info/time_between_train_steps": 0.003137826919555664, "step": 2898} {"info/global_step": 2899, "train_info/time_within_train_step": 2.3559978008270264, "step": 2899} {"train_info/time_between_train_steps": 0.003215312957763672, "step": 2899} {"info/global_step": 2900, "train_info/time_within_train_step": 2.3550689220428467, "step": 2900} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 8708.0, "train_info/memory_max_reserved": 8708.0, "_timestamp": 1746259666, "_runtime": 7485}, "step": 2900} {"logs": {"train/loss": 3.6732, "train/learning_rate": 2.222222222222222e-05, "train/epoch": 3.11, "_timestamp": 1746259666, "_runtime": 7485}, "step": 2900} {"train_info/time_between_train_steps": 18.834516763687134, "step": 2900} {"info/global_step": 2901, "train_info/time_within_train_step": 2.2097091674804688, "step": 2901} {"train_info/time_between_train_steps": 0.0033202171325683594, "step": 2901} {"info/global_step": 2902, "train_info/time_within_train_step": 2.1824183464050293, "step": 2902} {"train_info/time_between_train_steps": 0.003304719924926758, "step": 2902} {"info/global_step": 2903, "train_info/time_within_train_step": 2.2389488220214844, "step": 2903} {"train_info/time_between_train_steps": 0.003293275833129883, "step": 2903} {"info/global_step": 2904, "train_info/time_within_train_step": 2.350276470184326, "step": 2904} {"train_info/time_between_train_steps": 0.003245115280151367, "step": 2904} {"info/global_step": 2905, "train_info/time_within_train_step": 2.3536736965179443, "step": 2905} {"train_info/time_between_train_steps": 0.003258943557739258, "step": 2905} {"info/global_step": 2906, "train_info/time_within_train_step": 2.3562591075897217, "step": 2906} {"train_info/time_between_train_steps": 0.0032575130462646484, "step": 2906} {"info/global_step": 2907, "train_info/time_within_train_step": 2.356156587600708, "step": 2907} {"train_info/time_between_train_steps": 0.003163576126098633, "step": 2907} {"info/global_step": 2908, "train_info/time_within_train_step": 2.356832504272461, "step": 2908} {"train_info/time_between_train_steps": 0.0032989978790283203, "step": 2908} {"info/global_step": 2909, "train_info/time_within_train_step": 2.3663108348846436, "step": 2909} {"train_info/time_between_train_steps": 0.0032455921173095703, "step": 2909} {"info/global_step": 2910, "train_info/time_within_train_step": 2.3581340312957764, "step": 2910} {"train_info/time_between_train_steps": 0.0031900405883789062, "step": 2910} {"info/global_step": 2911, "train_info/time_within_train_step": 2.357736110687256, "step": 2911} {"train_info/time_between_train_steps": 0.0031936168670654297, "step": 2911} {"info/global_step": 2912, "train_info/time_within_train_step": 2.356544256210327, "step": 2912} {"train_info/time_between_train_steps": 0.0032737255096435547, "step": 2912} {"info/global_step": 2913, "train_info/time_within_train_step": 2.3581244945526123, "step": 2913} {"train_info/time_between_train_steps": 0.003210306167602539, "step": 2913} {"info/global_step": 2914, "train_info/time_within_train_step": 2.358565092086792, "step": 2914} {"train_info/time_between_train_steps": 0.0032644271850585938, "step": 2914} {"info/global_step": 2915, "train_info/time_within_train_step": 2.3582043647766113, "step": 2915} {"train_info/time_between_train_steps": 0.003252744674682617, "step": 2915} {"info/global_step": 2916, "train_info/time_within_train_step": 2.3582029342651367, "step": 2916} {"train_info/time_between_train_steps": 0.0032396316528320312, "step": 2916} {"info/global_step": 2917, "train_info/time_within_train_step": 2.358309745788574, "step": 2917} {"train_info/time_between_train_steps": 0.003182649612426758, "step": 2917} {"info/global_step": 2918, "train_info/time_within_train_step": 2.587745189666748, "step": 2918} {"train_info/time_between_train_steps": 0.0031473636627197266, "step": 2918} {"info/global_step": 2919, "train_info/time_within_train_step": 2.357726573944092, "step": 2919} {"train_info/time_between_train_steps": 0.003133058547973633, "step": 2919} {"info/global_step": 2920, "train_info/time_within_train_step": 2.358232259750366, "step": 2920} {"train_info/time_between_train_steps": 0.003190755844116211, "step": 2920} {"info/global_step": 2921, "train_info/time_within_train_step": 2.3583180904388428, "step": 2921} {"train_info/time_between_train_steps": 0.0031633377075195312, "step": 2921} {"info/global_step": 2922, "train_info/time_within_train_step": 2.3578221797943115, "step": 2922} {"train_info/time_between_train_steps": 0.003183603286743164, "step": 2922} {"info/global_step": 2923, "train_info/time_within_train_step": 2.3583900928497314, "step": 2923} {"train_info/time_between_train_steps": 0.003133535385131836, "step": 2923} {"info/global_step": 2924, "train_info/time_within_train_step": 2.3576407432556152, "step": 2924} {"train_info/time_between_train_steps": 0.0033245086669921875, "step": 2924} {"info/global_step": 2925, "train_info/time_within_train_step": 2.3574678897857666, "step": 2925} {"train_info/time_between_train_steps": 0.003135204315185547, "step": 2925} {"info/global_step": 2926, "train_info/time_within_train_step": 2.3581011295318604, "step": 2926} {"train_info/time_between_train_steps": 0.0031948089599609375, "step": 2926} {"info/global_step": 2927, "train_info/time_within_train_step": 2.3573594093322754, "step": 2927} {"train_info/time_between_train_steps": 0.0031900405883789062, "step": 2927} {"info/global_step": 2928, "train_info/time_within_train_step": 2.357564926147461, "step": 2928} {"train_info/time_between_train_steps": 0.003222227096557617, "step": 2928} {"info/global_step": 2929, "train_info/time_within_train_step": 2.3574750423431396, "step": 2929} {"train_info/time_between_train_steps": 0.0031876564025878906, "step": 2929} {"info/global_step": 2930, "train_info/time_within_train_step": 2.3576149940490723, "step": 2930} {"train_info/time_between_train_steps": 0.0031490325927734375, "step": 2930} {"info/global_step": 2931, "train_info/time_within_train_step": 2.3571906089782715, "step": 2931} {"train_info/time_between_train_steps": 0.0031890869140625, "step": 2931} {"info/global_step": 2932, "train_info/time_within_train_step": 2.35768461227417, "step": 2932} {"train_info/time_between_train_steps": 0.0031478404998779297, "step": 2932} {"info/global_step": 2933, "train_info/time_within_train_step": 2.358079433441162, "step": 2933} {"train_info/time_between_train_steps": 0.003217458724975586, "step": 2933} {"info/global_step": 2934, "train_info/time_within_train_step": 2.3581981658935547, "step": 2934} {"train_info/time_between_train_steps": 0.003213167190551758, "step": 2934} {"info/global_step": 2935, "train_info/time_within_train_step": 2.356778144836426, "step": 2935} {"train_info/time_between_train_steps": 0.0031540393829345703, "step": 2935} {"info/global_step": 2936, "train_info/time_within_train_step": 2.357117176055908, "step": 2936} {"train_info/time_between_train_steps": 0.0032377243041992188, "step": 2936} {"info/global_step": 2937, "train_info/time_within_train_step": 2.357219934463501, "step": 2937} {"train_info/time_between_train_steps": 0.0032258033752441406, "step": 2937} {"info/global_step": 2938, "train_info/time_within_train_step": 2.35768985748291, "step": 2938} {"train_info/time_between_train_steps": 0.003233194351196289, "step": 2938} {"info/global_step": 2939, "train_info/time_within_train_step": 2.357404947280884, "step": 2939} {"train_info/time_between_train_steps": 0.0031774044036865234, "step": 2939} {"info/global_step": 2940, "train_info/time_within_train_step": 2.357229232788086, "step": 2940} {"train_info/time_between_train_steps": 0.0032362937927246094, "step": 2940} {"info/global_step": 2941, "train_info/time_within_train_step": 2.357649564743042, "step": 2941} {"train_info/time_between_train_steps": 0.00323486328125, "step": 2941} {"info/global_step": 2942, "train_info/time_within_train_step": 2.356679677963257, "step": 2942} {"train_info/time_between_train_steps": 0.0032501220703125, "step": 2942} {"info/global_step": 2943, "train_info/time_within_train_step": 2.5900349617004395, "step": 2943} {"train_info/time_between_train_steps": 0.00312042236328125, "step": 2943} {"info/global_step": 2944, "train_info/time_within_train_step": 2.3566207885742188, "step": 2944} {"train_info/time_between_train_steps": 0.0031206607818603516, "step": 2944} {"info/global_step": 2945, "train_info/time_within_train_step": 2.3576629161834717, "step": 2945} {"train_info/time_between_train_steps": 0.0031735897064208984, "step": 2945} {"info/global_step": 2946, "train_info/time_within_train_step": 2.3570263385772705, "step": 2946} {"train_info/time_between_train_steps": 0.0031490325927734375, "step": 2946} {"info/global_step": 2947, "train_info/time_within_train_step": 2.3576409816741943, "step": 2947} {"train_info/time_between_train_steps": 0.003122091293334961, "step": 2947} {"info/global_step": 2948, "train_info/time_within_train_step": 2.357020139694214, "step": 2948} {"train_info/time_between_train_steps": 0.003172636032104492, "step": 2948} {"info/global_step": 2949, "train_info/time_within_train_step": 2.35640287399292, "step": 2949} {"train_info/time_between_train_steps": 0.0031092166900634766, "step": 2949} {"info/global_step": 2950, "train_info/time_within_train_step": 2.356717824935913, "step": 2950} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 8708.0, "train_info/memory_max_reserved": 8708.0, "_timestamp": 1746259804, "_runtime": 7623}, "step": 2950} {"logs": {"train/loss": 3.652, "train/learning_rate": 1.111111111111111e-05, "train/epoch": 3.12, "_timestamp": 1746259804, "_runtime": 7623}, "step": 2950} {"train_info/time_between_train_steps": 0.023977041244506836, "step": 2950} {"info/global_step": 2951, "train_info/time_within_train_step": 2.35587739944458, "step": 2951} {"train_info/time_between_train_steps": 0.003103017807006836, "step": 2951} {"info/global_step": 2952, "train_info/time_within_train_step": 2.3571345806121826, "step": 2952} {"train_info/time_between_train_steps": 0.003145456314086914, "step": 2952} {"info/global_step": 2953, "train_info/time_within_train_step": 2.3587794303894043, "step": 2953} {"train_info/time_between_train_steps": 0.0031652450561523438, "step": 2953} {"info/global_step": 2954, "train_info/time_within_train_step": 2.3573551177978516, "step": 2954} {"train_info/time_between_train_steps": 0.0031800270080566406, "step": 2954} {"info/global_step": 2955, "train_info/time_within_train_step": 2.356837034225464, "step": 2955} {"train_info/time_between_train_steps": 0.1318674087524414, "step": 2955} {"info/global_step": 2956, "train_info/time_within_train_step": 2.3582563400268555, "step": 2956} {"train_info/time_between_train_steps": 0.003204822540283203, "step": 2956} {"info/global_step": 2957, "train_info/time_within_train_step": 2.3579676151275635, "step": 2957} {"train_info/time_between_train_steps": 0.003163576126098633, "step": 2957} {"info/global_step": 2958, "train_info/time_within_train_step": 2.358060598373413, "step": 2958} {"train_info/time_between_train_steps": 0.003195047378540039, "step": 2958} {"info/global_step": 2959, "train_info/time_within_train_step": 2.3572182655334473, "step": 2959} {"train_info/time_between_train_steps": 0.0031859874725341797, "step": 2959} {"info/global_step": 2960, "train_info/time_within_train_step": 2.3566176891326904, "step": 2960} {"train_info/time_between_train_steps": 0.0031867027282714844, "step": 2960} {"info/global_step": 2961, "train_info/time_within_train_step": 2.357633352279663, "step": 2961} {"train_info/time_between_train_steps": 0.003144502639770508, "step": 2961} {"info/global_step": 2962, "train_info/time_within_train_step": 2.3577752113342285, "step": 2962} {"train_info/time_between_train_steps": 0.003183603286743164, "step": 2962} {"info/global_step": 2963, "train_info/time_within_train_step": 2.3576323986053467, "step": 2963} {"train_info/time_between_train_steps": 0.003147602081298828, "step": 2963} {"info/global_step": 2964, "train_info/time_within_train_step": 2.4361400604248047, "step": 2964} {"train_info/time_between_train_steps": 0.003207683563232422, "step": 2964} {"info/global_step": 2965, "train_info/time_within_train_step": 2.3574018478393555, "step": 2965} {"train_info/time_between_train_steps": 0.0032150745391845703, "step": 2965} {"info/global_step": 2966, "train_info/time_within_train_step": 2.355443239212036, "step": 2966} {"train_info/time_between_train_steps": 0.0031189918518066406, "step": 2966} {"info/global_step": 2967, "train_info/time_within_train_step": 2.3562726974487305, "step": 2967} {"train_info/time_between_train_steps": 0.0031354427337646484, "step": 2967} {"info/global_step": 2968, "train_info/time_within_train_step": 2.5814759731292725, "step": 2968} {"train_info/time_between_train_steps": 0.0031266212463378906, "step": 2968} {"info/global_step": 2969, "train_info/time_within_train_step": 2.357085704803467, "step": 2969} {"train_info/time_between_train_steps": 0.0032203197479248047, "step": 2969} {"info/global_step": 2970, "train_info/time_within_train_step": 2.3574740886688232, "step": 2970} {"train_info/time_between_train_steps": 0.003148794174194336, "step": 2970} {"info/global_step": 2971, "train_info/time_within_train_step": 2.35693359375, "step": 2971} {"train_info/time_between_train_steps": 0.003185272216796875, "step": 2971} {"info/global_step": 2972, "train_info/time_within_train_step": 2.357008457183838, "step": 2972} {"train_info/time_between_train_steps": 0.0031273365020751953, "step": 2972} {"info/global_step": 2973, "train_info/time_within_train_step": 2.3568501472473145, "step": 2973} {"train_info/time_between_train_steps": 0.003119945526123047, "step": 2973} {"info/global_step": 2974, "train_info/time_within_train_step": 2.3562138080596924, "step": 2974} {"train_info/time_between_train_steps": 0.0031528472900390625, "step": 2974} {"info/global_step": 2975, "train_info/time_within_train_step": 2.3568341732025146, "step": 2975} {"train_info/time_between_train_steps": 0.003167867660522461, "step": 2975} {"info/global_step": 2976, "train_info/time_within_train_step": 2.356274366378784, "step": 2976} {"train_info/time_between_train_steps": 0.0031731128692626953, "step": 2976} {"info/global_step": 2977, "train_info/time_within_train_step": 2.3572282791137695, "step": 2977} {"train_info/time_between_train_steps": 0.0034635066986083984, "step": 2977} {"info/global_step": 2978, "train_info/time_within_train_step": 2.3567779064178467, "step": 2978} {"train_info/time_between_train_steps": 0.0031332969665527344, "step": 2978} {"info/global_step": 2979, "train_info/time_within_train_step": 2.3576931953430176, "step": 2979} {"train_info/time_between_train_steps": 0.0031003952026367188, "step": 2979} {"info/global_step": 2980, "train_info/time_within_train_step": 2.357644557952881, "step": 2980} {"train_info/time_between_train_steps": 0.0031337738037109375, "step": 2980} {"info/global_step": 2981, "train_info/time_within_train_step": 2.3561623096466064, "step": 2981} {"train_info/time_between_train_steps": 0.003117084503173828, "step": 2981} {"info/global_step": 2982, "train_info/time_within_train_step": 2.3570659160614014, "step": 2982} {"train_info/time_between_train_steps": 0.0032014846801757812, "step": 2982} {"info/global_step": 2983, "train_info/time_within_train_step": 2.356555938720703, "step": 2983} {"train_info/time_between_train_steps": 0.0031642913818359375, "step": 2983} {"info/global_step": 2984, "train_info/time_within_train_step": 2.35752534866333, "step": 2984} {"train_info/time_between_train_steps": 0.0031211376190185547, "step": 2984} {"info/global_step": 2985, "train_info/time_within_train_step": 2.356330394744873, "step": 2985} {"train_info/time_between_train_steps": 0.0031278133392333984, "step": 2985} {"info/global_step": 2986, "train_info/time_within_train_step": 2.3551580905914307, "step": 2986} {"train_info/time_between_train_steps": 0.0031316280364990234, "step": 2986} {"info/global_step": 2987, "train_info/time_within_train_step": 2.3562583923339844, "step": 2987} {"train_info/time_between_train_steps": 0.003167390823364258, "step": 2987} {"info/global_step": 2988, "train_info/time_within_train_step": 2.3571176528930664, "step": 2988} {"train_info/time_between_train_steps": 0.0031707286834716797, "step": 2988} {"info/global_step": 2989, "train_info/time_within_train_step": 2.356623411178589, "step": 2989} {"train_info/time_between_train_steps": 0.003250598907470703, "step": 2989} {"info/global_step": 2990, "train_info/time_within_train_step": 2.356706142425537, "step": 2990} {"train_info/time_between_train_steps": 0.0031280517578125, "step": 2990} {"info/global_step": 2991, "train_info/time_within_train_step": 2.35650897026062, "step": 2991} {"train_info/time_between_train_steps": 0.003117084503173828, "step": 2991} {"info/global_step": 2992, "train_info/time_within_train_step": 2.3570151329040527, "step": 2992} {"train_info/time_between_train_steps": 0.003137826919555664, "step": 2992} {"info/global_step": 2993, "train_info/time_within_train_step": 2.583444356918335, "step": 2993} {"train_info/time_between_train_steps": 0.0031464099884033203, "step": 2993} {"info/global_step": 2994, "train_info/time_within_train_step": 2.3571505546569824, "step": 2994} {"train_info/time_between_train_steps": 0.003130197525024414, "step": 2994} {"info/global_step": 2995, "train_info/time_within_train_step": 2.3568267822265625, "step": 2995} {"train_info/time_between_train_steps": 0.0031282901763916016, "step": 2995} {"info/global_step": 2996, "train_info/time_within_train_step": 2.3559482097625732, "step": 2996} {"train_info/time_between_train_steps": 0.0031461715698242188, "step": 2996} {"info/global_step": 2997, "train_info/time_within_train_step": 2.356170892715454, "step": 2997} {"train_info/time_between_train_steps": 0.0031185150146484375, "step": 2997} {"info/global_step": 2998, "train_info/time_within_train_step": 2.356518030166626, "step": 2998} {"train_info/time_between_train_steps": 0.0031092166900634766, "step": 2998} {"info/global_step": 2999, "train_info/time_within_train_step": 2.91709041595459, "step": 2999} {"train_info/time_between_train_steps": 0.003279447555541992, "step": 2999} {"info/global_step": 3000, "train_info/time_within_train_step": 2.357013463973999, "step": 3000} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 8708.0, "train_info/memory_max_reserved": 8708.0, "_timestamp": 1746259924, "_runtime": 7743}, "step": 3000} {"logs": {"train/loss": 3.645, "train/learning_rate": 0.0, "train/epoch": 3.14, "_timestamp": 1746259924, "_runtime": 7743}, "step": 3000} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 8708.0, "train_info/memory_max_reserved": 8708.0, "_timestamp": 1746259928, "_runtime": 7747}, "step": 3000} {"logs": {"eval/loss": 4.248782157897949, "eval/runtime": 4.1346, "eval/samples_per_second": 48.372, "eval/steps_per_second": 1.209, "train/epoch": 3.14, "_timestamp": 1746259928, "_runtime": 7747}, "step": 3000} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 8708.0, "train_info/memory_max_reserved": 8708.0, "_timestamp": 1746259928, "_runtime": 7747}, "step": 3000} {"logs": {"eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_loss": 4.248782157897949, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_ppl": 70.02008699090153, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_runtime": 4.1346, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_samples_per_second": 48.372, "train/epoch": 3.14, "_timestamp": 1746259928, "_runtime": 7747}, "step": 3000} {"train_info": {"train_info/memory_allocated": 1675.0859375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 8708.0, "train_info/memory_max_reserved": 8708.0, "_timestamp": 1746259963, "_runtime": 7782}, "step": 3000} {"logs": {"train/train_runtime": 7782.6575, "train/train_samples_per_second": 37.005, "train/train_steps_per_second": 0.385, "train/total_flos": 2.509187383296e+16, "train/train_loss": 4.281885763168335, "train/epoch": 3.14, "_timestamp": 1746259963, "_runtime": 7782}, "step": 3000} {"train_info": {"train_info/memory_allocated": 1675.0849609375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 8708.0, "train_info/memory_max_reserved": 8708.0, "_timestamp": 1746259972, "_runtime": 7791}, "step": 3000} {"logs": {"eval/loss": 4.248782157897949, "eval/runtime": 3.8013, "eval/samples_per_second": 52.614, "eval/steps_per_second": 1.315, "train/epoch": 3.14, "_timestamp": 1746259972, "_runtime": 7791}, "step": 3000} {"train_info": {"train_info/memory_allocated": 1675.0849609375, "train_info/memory_max_allocated": 4479.62744140625, "train_info/memory_reserved": 8708.0, "train_info/memory_max_reserved": 8708.0, "_timestamp": 1746259972, "_runtime": 7791}, "step": 3000} {"logs": {"eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_loss": 4.248782157897949, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_ppl": 70.02008699090153, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_runtime": 3.8013, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_samples_per_second": 52.614, "train/epoch": 3.14, "_timestamp": 1746259972, "_runtime": 7791}, "step": 3000}