DNAN_EN / metrics.json
xiulinyang's picture
Adding model checkpoints and config files
26a4811
{"num_parameters": 124439808, "trainable_parameters": 124439808, "step": 0}
{"train_info/time_between_train_steps": 3.7880611419677734, "step": 0}
{"info/global_step": 1, "train_info/time_within_train_step": 28.245509386062622, "step": 1}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 19761.71484375, "train_info/memory_reserved": 22624.0, "train_info/memory_max_reserved": 22624.0, "_timestamp": 1740824103, "_runtime": 52}, "step": 1}
{"logs": {"train/loss": 11.0218, "train/learning_rate": 4.9999999999999996e-06, "train/epoch": 0.0, "_timestamp": 1740824103, "_runtime": 52}, "step": 1}
{"train_info/time_between_train_steps": 0.026770353317260742, "step": 1}
{"info/global_step": 2, "train_info/time_within_train_step": 27.87890863418579, "step": 2}
{"train_info/time_between_train_steps": 0.005446434020996094, "step": 2}
{"info/global_step": 3, "train_info/time_within_train_step": 27.714547395706177, "step": 3}
{"train_info/time_between_train_steps": 0.005309581756591797, "step": 3}
{"info/global_step": 4, "train_info/time_within_train_step": 27.873948097229004, "step": 4}
{"train_info/time_between_train_steps": 0.0055294036865234375, "step": 4}
{"info/global_step": 5, "train_info/time_within_train_step": 27.747509241104126, "step": 5}
{"train_info/time_between_train_steps": 0.0058400630950927734, "step": 5}
{"info/global_step": 6, "train_info/time_within_train_step": 27.868066549301147, "step": 6}
{"train_info/time_between_train_steps": 0.005422353744506836, "step": 6}
{"info/global_step": 7, "train_info/time_within_train_step": 27.72815752029419, "step": 7}
{"train_info/time_between_train_steps": 0.006606101989746094, "step": 7}
{"info/global_step": 8, "train_info/time_within_train_step": 27.752501487731934, "step": 8}
{"train_info/time_between_train_steps": 0.005498409271240234, "step": 8}
{"info/global_step": 9, "train_info/time_within_train_step": 27.771718978881836, "step": 9}
{"train_info/time_between_train_steps": 0.005301237106323242, "step": 9}
{"info/global_step": 10, "train_info/time_within_train_step": 27.69246006011963, "step": 10}
{"train_info/time_between_train_steps": 0.005982875823974609, "step": 10}
{"info/global_step": 11, "train_info/time_within_train_step": 27.705485820770264, "step": 11}
{"train_info/time_between_train_steps": 0.006503582000732422, "step": 11}
{"info/global_step": 12, "train_info/time_within_train_step": 27.706249952316284, "step": 12}
{"train_info/time_between_train_steps": 0.005203962326049805, "step": 12}
{"info/global_step": 13, "train_info/time_within_train_step": 27.734382390975952, "step": 13}
{"train_info/time_between_train_steps": 0.006273031234741211, "step": 13}
{"info/global_step": 14, "train_info/time_within_train_step": 27.726340532302856, "step": 14}
{"train_info/time_between_train_steps": 0.005394935607910156, "step": 14}
{"info/global_step": 15, "train_info/time_within_train_step": 27.75440740585327, "step": 15}
{"train_info/time_between_train_steps": 0.005065202713012695, "step": 15}
{"info/global_step": 16, "train_info/time_within_train_step": 27.809078216552734, "step": 16}
{"train_info/time_between_train_steps": 0.0055561065673828125, "step": 16}
{"info/global_step": 17, "train_info/time_within_train_step": 27.74449610710144, "step": 17}
{"train_info/time_between_train_steps": 0.011729717254638672, "step": 17}
{"info/global_step": 18, "train_info/time_within_train_step": 27.704740047454834, "step": 18}
{"train_info/time_between_train_steps": 0.005122184753417969, "step": 18}
{"info/global_step": 19, "train_info/time_within_train_step": 27.701870679855347, "step": 19}
{"train_info/time_between_train_steps": 0.005314350128173828, "step": 19}
{"info/global_step": 20, "train_info/time_within_train_step": 27.705451250076294, "step": 20}
{"train_info/time_between_train_steps": 0.00513768196105957, "step": 20}
{"info/global_step": 21, "train_info/time_within_train_step": 27.701735496520996, "step": 21}
{"train_info/time_between_train_steps": 0.005435943603515625, "step": 21}
{"info/global_step": 22, "train_info/time_within_train_step": 27.733572959899902, "step": 22}
{"train_info/time_between_train_steps": 0.005304098129272461, "step": 22}
{"info/global_step": 23, "train_info/time_within_train_step": 27.71440815925598, "step": 23}
{"train_info/time_between_train_steps": 0.005193948745727539, "step": 23}
{"info/global_step": 24, "train_info/time_within_train_step": 27.756873846054077, "step": 24}
{"train_info/time_between_train_steps": 0.005127906799316406, "step": 24}
{"info/global_step": 25, "train_info/time_within_train_step": 27.71349811553955, "step": 25}
{"train_info/time_between_train_steps": 0.005140781402587891, "step": 25}
{"info/global_step": 26, "train_info/time_within_train_step": 27.713382720947266, "step": 26}
{"train_info/time_between_train_steps": 0.005600452423095703, "step": 26}
{"info/global_step": 27, "train_info/time_within_train_step": 27.714730739593506, "step": 27}
{"train_info/time_between_train_steps": 0.005333900451660156, "step": 27}
{"train_info/time_between_train_steps": 29.786367416381836, "step": 27}
{"info/global_step": 28, "train_info/time_within_train_step": 27.70686984062195, "step": 28}
{"train_info/time_between_train_steps": 0.005510091781616211, "step": 28}
{"info/global_step": 29, "train_info/time_within_train_step": 27.89784002304077, "step": 29}
{"train_info/time_between_train_steps": 0.0059356689453125, "step": 29}
{"info/global_step": 30, "train_info/time_within_train_step": 27.718737840652466, "step": 30}
{"train_info/time_between_train_steps": 0.005293607711791992, "step": 30}
{"info/global_step": 31, "train_info/time_within_train_step": 28.026788473129272, "step": 31}
{"train_info/time_between_train_steps": 0.0055425167083740234, "step": 31}
{"info/global_step": 32, "train_info/time_within_train_step": 27.74660015106201, "step": 32}
{"train_info/time_between_train_steps": 0.005425453186035156, "step": 32}
{"info/global_step": 33, "train_info/time_within_train_step": 27.89497995376587, "step": 33}
{"train_info/time_between_train_steps": 0.0055332183837890625, "step": 33}
{"info/global_step": 34, "train_info/time_within_train_step": 27.742093324661255, "step": 34}
{"train_info/time_between_train_steps": 0.005185127258300781, "step": 34}
{"info/global_step": 35, "train_info/time_within_train_step": 27.765562772750854, "step": 35}
{"train_info/time_between_train_steps": 0.005435466766357422, "step": 35}
{"info/global_step": 36, "train_info/time_within_train_step": 27.716415882110596, "step": 36}
{"train_info/time_between_train_steps": 0.005165576934814453, "step": 36}
{"info/global_step": 37, "train_info/time_within_train_step": 27.683839321136475, "step": 37}
{"train_info/time_between_train_steps": 0.005215167999267578, "step": 37}
{"info/global_step": 38, "train_info/time_within_train_step": 27.72301173210144, "step": 38}
{"train_info/time_between_train_steps": 0.005124568939208984, "step": 38}
{"info/global_step": 39, "train_info/time_within_train_step": 27.701402187347412, "step": 39}
{"train_info/time_between_train_steps": 0.0050923824310302734, "step": 39}
{"info/global_step": 40, "train_info/time_within_train_step": 27.74090552330017, "step": 40}
{"train_info/time_between_train_steps": 0.0051996707916259766, "step": 40}
{"info/global_step": 41, "train_info/time_within_train_step": 27.718098402023315, "step": 41}
{"train_info/time_between_train_steps": 0.0051898956298828125, "step": 41}
{"info/global_step": 42, "train_info/time_within_train_step": 27.69398307800293, "step": 42}
{"train_info/time_between_train_steps": 0.005246400833129883, "step": 42}
{"info/global_step": 43, "train_info/time_within_train_step": 27.724716663360596, "step": 43}
{"train_info/time_between_train_steps": 0.005392551422119141, "step": 43}
{"info/global_step": 44, "train_info/time_within_train_step": 27.723763704299927, "step": 44}
{"train_info/time_between_train_steps": 0.0053653717041015625, "step": 44}
{"info/global_step": 45, "train_info/time_within_train_step": 27.714212894439697, "step": 45}
{"train_info/time_between_train_steps": 0.0053253173828125, "step": 45}
{"info/global_step": 46, "train_info/time_within_train_step": 27.803465843200684, "step": 46}
{"train_info/time_between_train_steps": 0.005133152008056641, "step": 46}
{"info/global_step": 47, "train_info/time_within_train_step": 27.701971292495728, "step": 47}
{"train_info/time_between_train_steps": 0.005021095275878906, "step": 47}
{"info/global_step": 48, "train_info/time_within_train_step": 27.688178539276123, "step": 48}
{"train_info/time_between_train_steps": 0.005251884460449219, "step": 48}
{"info/global_step": 49, "train_info/time_within_train_step": 27.703673601150513, "step": 49}
{"train_info/time_between_train_steps": 0.005212068557739258, "step": 49}
{"info/global_step": 50, "train_info/time_within_train_step": 27.70495319366455, "step": 50}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740825493, "_runtime": 1442}, "step": 50}
{"logs": {"train/loss": 7.9982, "train/learning_rate": 0.00025, "train/epoch": 1.02, "_timestamp": 1740825493, "_runtime": 1442}, "step": 50}
{"train_info/time_between_train_steps": 0.026431560516357422, "step": 50}
{"info/global_step": 51, "train_info/time_within_train_step": 27.7627694606781, "step": 51}
{"train_info/time_between_train_steps": 0.005071401596069336, "step": 51}
{"info/global_step": 52, "train_info/time_within_train_step": 27.727630138397217, "step": 52}
{"train_info/time_between_train_steps": 0.005377054214477539, "step": 52}
{"info/global_step": 53, "train_info/time_within_train_step": 27.698277950286865, "step": 53}
{"train_info/time_between_train_steps": 0.005599021911621094, "step": 53}
{"info/global_step": 54, "train_info/time_within_train_step": 27.729766845703125, "step": 54}
{"train_info/time_between_train_steps": 0.005549907684326172, "step": 54}
{"train_info/time_between_train_steps": 29.669888496398926, "step": 54}
{"info/global_step": 55, "train_info/time_within_train_step": 27.71361541748047, "step": 55}
{"train_info/time_between_train_steps": 0.005017518997192383, "step": 55}
{"info/global_step": 56, "train_info/time_within_train_step": 27.823082208633423, "step": 56}
{"train_info/time_between_train_steps": 0.005087375640869141, "step": 56}
{"info/global_step": 57, "train_info/time_within_train_step": 27.702436685562134, "step": 57}
{"train_info/time_between_train_steps": 0.005762815475463867, "step": 57}
{"info/global_step": 58, "train_info/time_within_train_step": 27.824201822280884, "step": 58}
{"train_info/time_between_train_steps": 0.005498170852661133, "step": 58}
{"info/global_step": 59, "train_info/time_within_train_step": 27.705023527145386, "step": 59}
{"train_info/time_between_train_steps": 0.005738973617553711, "step": 59}
{"info/global_step": 60, "train_info/time_within_train_step": 27.87265110015869, "step": 60}
{"train_info/time_between_train_steps": 0.00543522834777832, "step": 60}
{"info/global_step": 61, "train_info/time_within_train_step": 27.939080476760864, "step": 61}
{"train_info/time_between_train_steps": 0.005414009094238281, "step": 61}
{"info/global_step": 62, "train_info/time_within_train_step": 27.787308931350708, "step": 62}
{"train_info/time_between_train_steps": 0.005358695983886719, "step": 62}
{"info/global_step": 63, "train_info/time_within_train_step": 27.905927658081055, "step": 63}
{"train_info/time_between_train_steps": 0.005109548568725586, "step": 63}
{"info/global_step": 64, "train_info/time_within_train_step": 27.74005699157715, "step": 64}
{"train_info/time_between_train_steps": 0.005379438400268555, "step": 64}
{"info/global_step": 65, "train_info/time_within_train_step": 27.714900493621826, "step": 65}
{"train_info/time_between_train_steps": 0.0051991939544677734, "step": 65}
{"info/global_step": 66, "train_info/time_within_train_step": 27.688419818878174, "step": 66}
{"train_info/time_between_train_steps": 0.005120515823364258, "step": 66}
{"info/global_step": 67, "train_info/time_within_train_step": 27.680577278137207, "step": 67}
{"train_info/time_between_train_steps": 0.005227327346801758, "step": 67}
{"info/global_step": 68, "train_info/time_within_train_step": 27.681684970855713, "step": 68}
{"train_info/time_between_train_steps": 0.005062103271484375, "step": 68}
{"info/global_step": 69, "train_info/time_within_train_step": 27.70560359954834, "step": 69}
{"train_info/time_between_train_steps": 0.005250692367553711, "step": 69}
{"info/global_step": 70, "train_info/time_within_train_step": 27.698724269866943, "step": 70}
{"train_info/time_between_train_steps": 0.005117177963256836, "step": 70}
{"info/global_step": 71, "train_info/time_within_train_step": 27.695756196975708, "step": 71}
{"train_info/time_between_train_steps": 0.005283832550048828, "step": 71}
{"info/global_step": 72, "train_info/time_within_train_step": 27.713040351867676, "step": 72}
{"train_info/time_between_train_steps": 0.005185127258300781, "step": 72}
{"info/global_step": 73, "train_info/time_within_train_step": 27.68972420692444, "step": 73}
{"train_info/time_between_train_steps": 0.005155086517333984, "step": 73}
{"info/global_step": 74, "train_info/time_within_train_step": 27.687261819839478, "step": 74}
{"train_info/time_between_train_steps": 0.005108833312988281, "step": 74}
{"info/global_step": 75, "train_info/time_within_train_step": 27.681994438171387, "step": 75}
{"train_info/time_between_train_steps": 0.005167484283447266, "step": 75}
{"info/global_step": 76, "train_info/time_within_train_step": 27.74064826965332, "step": 76}
{"train_info/time_between_train_steps": 0.005753993988037109, "step": 76}
{"info/global_step": 77, "train_info/time_within_train_step": 27.817914724349976, "step": 77}
{"train_info/time_between_train_steps": 0.011017084121704102, "step": 77}
{"info/global_step": 78, "train_info/time_within_train_step": 27.699766874313354, "step": 78}
{"train_info/time_between_train_steps": 0.0052030086517333984, "step": 78}
{"info/global_step": 79, "train_info/time_within_train_step": 27.697784662246704, "step": 79}
{"train_info/time_between_train_steps": 0.0052759647369384766, "step": 79}
{"info/global_step": 80, "train_info/time_within_train_step": 27.706557989120483, "step": 80}
{"train_info/time_between_train_steps": 0.005483150482177734, "step": 80}
{"info/global_step": 81, "train_info/time_within_train_step": 27.737077713012695, "step": 81}
{"train_info/time_between_train_steps": 0.00672459602355957, "step": 81}
{"train_info/time_between_train_steps": 29.999504566192627, "step": 81}
{"info/global_step": 82, "train_info/time_within_train_step": 27.693124771118164, "step": 82}
{"train_info/time_between_train_steps": 0.0054988861083984375, "step": 82}
{"info/global_step": 83, "train_info/time_within_train_step": 27.870315313339233, "step": 83}
{"train_info/time_between_train_steps": 0.0053081512451171875, "step": 83}
{"info/global_step": 84, "train_info/time_within_train_step": 27.695530891418457, "step": 84}
{"train_info/time_between_train_steps": 0.005259990692138672, "step": 84}
{"info/global_step": 85, "train_info/time_within_train_step": 27.857964754104614, "step": 85}
{"train_info/time_between_train_steps": 0.00534367561340332, "step": 85}
{"info/global_step": 86, "train_info/time_within_train_step": 27.69622230529785, "step": 86}
{"train_info/time_between_train_steps": 0.005288600921630859, "step": 86}
{"info/global_step": 87, "train_info/time_within_train_step": 27.861531972885132, "step": 87}
{"train_info/time_between_train_steps": 0.005279064178466797, "step": 87}
{"info/global_step": 88, "train_info/time_within_train_step": 27.752924919128418, "step": 88}
{"train_info/time_between_train_steps": 0.005209684371948242, "step": 88}
{"info/global_step": 89, "train_info/time_within_train_step": 27.75864267349243, "step": 89}
{"train_info/time_between_train_steps": 0.005182743072509766, "step": 89}
{"info/global_step": 90, "train_info/time_within_train_step": 27.713009357452393, "step": 90}
{"train_info/time_between_train_steps": 0.005054950714111328, "step": 90}
{"info/global_step": 91, "train_info/time_within_train_step": 27.80310606956482, "step": 91}
{"train_info/time_between_train_steps": 0.004907369613647461, "step": 91}
{"info/global_step": 92, "train_info/time_within_train_step": 27.732232332229614, "step": 92}
{"train_info/time_between_train_steps": 0.0051991939544677734, "step": 92}
{"info/global_step": 93, "train_info/time_within_train_step": 27.69894313812256, "step": 93}
{"train_info/time_between_train_steps": 0.005001068115234375, "step": 93}
{"info/global_step": 94, "train_info/time_within_train_step": 27.740082502365112, "step": 94}
{"train_info/time_between_train_steps": 0.005225181579589844, "step": 94}
{"info/global_step": 95, "train_info/time_within_train_step": 27.71693444252014, "step": 95}
{"train_info/time_between_train_steps": 0.005131244659423828, "step": 95}
{"info/global_step": 96, "train_info/time_within_train_step": 27.743969440460205, "step": 96}
{"train_info/time_between_train_steps": 0.005102396011352539, "step": 96}
{"info/global_step": 97, "train_info/time_within_train_step": 27.715368032455444, "step": 97}
{"train_info/time_between_train_steps": 0.005327701568603516, "step": 97}
{"info/global_step": 98, "train_info/time_within_train_step": 27.717996835708618, "step": 98}
{"train_info/time_between_train_steps": 0.005067586898803711, "step": 98}
{"info/global_step": 99, "train_info/time_within_train_step": 27.728034734725952, "step": 99}
{"train_info/time_between_train_steps": 0.005372285842895508, "step": 99}
{"info/global_step": 100, "train_info/time_within_train_step": 27.704466819763184, "step": 100}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740826942, "_runtime": 2891}, "step": 100}
{"logs": {"train/loss": 5.8003, "train/learning_rate": 0.0005, "train/epoch": 3.02, "_timestamp": 1740826942, "_runtime": 2891}, "step": 100}
{"train_info/time_between_train_steps": 73.18370079994202, "step": 100}
{"info/global_step": 101, "train_info/time_within_train_step": 27.70071578025818, "step": 101}
{"train_info/time_between_train_steps": 0.0050547122955322266, "step": 101}
{"info/global_step": 102, "train_info/time_within_train_step": 27.704102993011475, "step": 102}
{"train_info/time_between_train_steps": 0.005181312561035156, "step": 102}
{"info/global_step": 103, "train_info/time_within_train_step": 27.687839031219482, "step": 103}
{"train_info/time_between_train_steps": 0.005050182342529297, "step": 103}
{"info/global_step": 104, "train_info/time_within_train_step": 27.69083285331726, "step": 104}
{"train_info/time_between_train_steps": 0.005153179168701172, "step": 104}
{"info/global_step": 105, "train_info/time_within_train_step": 27.684593200683594, "step": 105}
{"train_info/time_between_train_steps": 0.0050051212310791016, "step": 105}
{"info/global_step": 106, "train_info/time_within_train_step": 27.701864004135132, "step": 106}
{"train_info/time_between_train_steps": 0.005112648010253906, "step": 106}
{"info/global_step": 107, "train_info/time_within_train_step": 27.822410583496094, "step": 107}
{"train_info/time_between_train_steps": 0.005424022674560547, "step": 107}
{"info/global_step": 108, "train_info/time_within_train_step": 27.744323015213013, "step": 108}
{"train_info/time_between_train_steps": 0.005571126937866211, "step": 108}
{"train_info/time_between_train_steps": 29.649384021759033, "step": 108}
{"info/global_step": 109, "train_info/time_within_train_step": 27.70844078063965, "step": 109}
{"train_info/time_between_train_steps": 0.0049898624420166016, "step": 109}
{"info/global_step": 110, "train_info/time_within_train_step": 27.83847403526306, "step": 110}
{"train_info/time_between_train_steps": 0.005169391632080078, "step": 110}
{"info/global_step": 111, "train_info/time_within_train_step": 27.718424797058105, "step": 111}
{"train_info/time_between_train_steps": 0.006288051605224609, "step": 111}
{"info/global_step": 112, "train_info/time_within_train_step": 27.86815881729126, "step": 112}
{"train_info/time_between_train_steps": 0.006147623062133789, "step": 112}
{"info/global_step": 113, "train_info/time_within_train_step": 27.709745407104492, "step": 113}
{"train_info/time_between_train_steps": 0.0065190792083740234, "step": 113}
{"info/global_step": 114, "train_info/time_within_train_step": 27.847676277160645, "step": 114}
{"train_info/time_between_train_steps": 0.005347490310668945, "step": 114}
{"info/global_step": 115, "train_info/time_within_train_step": 27.72253918647766, "step": 115}
{"train_info/time_between_train_steps": 0.0054378509521484375, "step": 115}
{"info/global_step": 116, "train_info/time_within_train_step": 27.778765201568604, "step": 116}
{"train_info/time_between_train_steps": 0.005368232727050781, "step": 116}
{"info/global_step": 117, "train_info/time_within_train_step": 27.698750734329224, "step": 117}
{"train_info/time_between_train_steps": 0.00494384765625, "step": 117}
{"info/global_step": 118, "train_info/time_within_train_step": 27.740641355514526, "step": 118}
{"train_info/time_between_train_steps": 0.009716272354125977, "step": 118}
{"info/global_step": 119, "train_info/time_within_train_step": 27.79171395301819, "step": 119}
{"train_info/time_between_train_steps": 0.010639429092407227, "step": 119}
{"info/global_step": 120, "train_info/time_within_train_step": 27.720006227493286, "step": 120}
{"train_info/time_between_train_steps": 0.00573277473449707, "step": 120}
{"info/global_step": 121, "train_info/time_within_train_step": 27.75653839111328, "step": 121}
{"train_info/time_between_train_steps": 0.006563425064086914, "step": 121}
{"info/global_step": 122, "train_info/time_within_train_step": 27.860503673553467, "step": 122}
{"train_info/time_between_train_steps": 0.006151676177978516, "step": 122}
{"info/global_step": 123, "train_info/time_within_train_step": 27.915786504745483, "step": 123}
{"train_info/time_between_train_steps": 0.006303548812866211, "step": 123}
{"info/global_step": 124, "train_info/time_within_train_step": 27.774923086166382, "step": 124}
{"train_info/time_between_train_steps": 0.006476879119873047, "step": 124}
{"info/global_step": 125, "train_info/time_within_train_step": 27.770323276519775, "step": 125}
{"train_info/time_between_train_steps": 0.006311178207397461, "step": 125}
{"info/global_step": 126, "train_info/time_within_train_step": 27.759220123291016, "step": 126}
{"train_info/time_between_train_steps": 0.011489152908325195, "step": 126}
{"info/global_step": 127, "train_info/time_within_train_step": 27.742541313171387, "step": 127}
{"train_info/time_between_train_steps": 0.006157875061035156, "step": 127}
{"info/global_step": 128, "train_info/time_within_train_step": 27.749855041503906, "step": 128}
{"train_info/time_between_train_steps": 0.011115312576293945, "step": 128}
{"info/global_step": 129, "train_info/time_within_train_step": 27.781652688980103, "step": 129}
{"train_info/time_between_train_steps": 0.006207704544067383, "step": 129}
{"info/global_step": 130, "train_info/time_within_train_step": 27.744268655776978, "step": 130}
{"train_info/time_between_train_steps": 0.011104583740234375, "step": 130}
{"info/global_step": 131, "train_info/time_within_train_step": 27.742699146270752, "step": 131}
{"train_info/time_between_train_steps": 0.006204843521118164, "step": 131}
{"info/global_step": 132, "train_info/time_within_train_step": 27.73805809020996, "step": 132}
{"train_info/time_between_train_steps": 0.005957365036010742, "step": 132}
{"info/global_step": 133, "train_info/time_within_train_step": 27.74616503715515, "step": 133}
{"train_info/time_between_train_steps": 0.006145000457763672, "step": 133}
{"info/global_step": 134, "train_info/time_within_train_step": 27.747852087020874, "step": 134}
{"train_info/time_between_train_steps": 0.006326198577880859, "step": 134}
{"info/global_step": 135, "train_info/time_within_train_step": 27.76485538482666, "step": 135}
{"train_info/time_between_train_steps": 0.011858463287353516, "step": 135}
{"train_info/time_between_train_steps": 30.023730516433716, "step": 135}
{"info/global_step": 136, "train_info/time_within_train_step": 27.80540156364441, "step": 136}
{"train_info/time_between_train_steps": 0.005544424057006836, "step": 136}
{"info/global_step": 137, "train_info/time_within_train_step": 27.887460470199585, "step": 137}
{"train_info/time_between_train_steps": 0.010448694229125977, "step": 137}
{"info/global_step": 138, "train_info/time_within_train_step": 27.706188678741455, "step": 138}
{"train_info/time_between_train_steps": 0.008067607879638672, "step": 138}
{"info/global_step": 139, "train_info/time_within_train_step": 27.814921617507935, "step": 139}
{"train_info/time_between_train_steps": 0.005296945571899414, "step": 139}
{"info/global_step": 140, "train_info/time_within_train_step": 27.697428464889526, "step": 140}
{"train_info/time_between_train_steps": 0.010326385498046875, "step": 140}
{"info/global_step": 141, "train_info/time_within_train_step": 27.820491790771484, "step": 141}
{"train_info/time_between_train_steps": 0.010231256484985352, "step": 141}
{"info/global_step": 142, "train_info/time_within_train_step": 27.685983419418335, "step": 142}
{"train_info/time_between_train_steps": 0.0052149295806884766, "step": 142}
{"info/global_step": 143, "train_info/time_within_train_step": 27.77022075653076, "step": 143}
{"train_info/time_between_train_steps": 0.005195140838623047, "step": 143}
{"info/global_step": 144, "train_info/time_within_train_step": 27.701437950134277, "step": 144}
{"train_info/time_between_train_steps": 0.0050733089447021484, "step": 144}
{"info/global_step": 145, "train_info/time_within_train_step": 27.675015449523926, "step": 145}
{"train_info/time_between_train_steps": 0.0049974918365478516, "step": 145}
{"info/global_step": 146, "train_info/time_within_train_step": 27.73888850212097, "step": 146}
{"train_info/time_between_train_steps": 0.005048036575317383, "step": 146}
{"info/global_step": 147, "train_info/time_within_train_step": 27.68892240524292, "step": 147}
{"train_info/time_between_train_steps": 0.005126953125, "step": 147}
{"info/global_step": 148, "train_info/time_within_train_step": 27.738964796066284, "step": 148}
{"train_info/time_between_train_steps": 0.005072593688964844, "step": 148}
{"info/global_step": 149, "train_info/time_within_train_step": 27.82083797454834, "step": 149}
{"train_info/time_between_train_steps": 0.00516510009765625, "step": 149}
{"info/global_step": 150, "train_info/time_within_train_step": 27.738208055496216, "step": 150}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740828465, "_runtime": 4414}, "step": 150}
{"logs": {"train/loss": 5.17, "train/learning_rate": 0.0005833333333333333, "train/epoch": 5.01, "_timestamp": 1740828465, "_runtime": 4414}, "step": 150}
{"train_info/time_between_train_steps": 0.02614760398864746, "step": 150}
{"info/global_step": 151, "train_info/time_within_train_step": 27.68132209777832, "step": 151}
{"train_info/time_between_train_steps": 0.005135536193847656, "step": 151}
{"info/global_step": 152, "train_info/time_within_train_step": 27.818657398223877, "step": 152}
{"train_info/time_between_train_steps": 0.010589122772216797, "step": 152}
{"info/global_step": 153, "train_info/time_within_train_step": 27.722400188446045, "step": 153}
{"train_info/time_between_train_steps": 0.0053479671478271484, "step": 153}
{"info/global_step": 154, "train_info/time_within_train_step": 27.69991970062256, "step": 154}
{"train_info/time_between_train_steps": 0.005299091339111328, "step": 154}
{"info/global_step": 155, "train_info/time_within_train_step": 27.694236040115356, "step": 155}
{"train_info/time_between_train_steps": 0.005053997039794922, "step": 155}
{"info/global_step": 156, "train_info/time_within_train_step": 27.691053867340088, "step": 156}
{"train_info/time_between_train_steps": 0.005323886871337891, "step": 156}
{"info/global_step": 157, "train_info/time_within_train_step": 27.72681498527527, "step": 157}
{"train_info/time_between_train_steps": 0.005190610885620117, "step": 157}
{"info/global_step": 158, "train_info/time_within_train_step": 27.73736310005188, "step": 158}
{"train_info/time_between_train_steps": 0.005418539047241211, "step": 158}
{"info/global_step": 159, "train_info/time_within_train_step": 28.796908617019653, "step": 159}
{"train_info/time_between_train_steps": 0.005344867706298828, "step": 159}
{"info/global_step": 160, "train_info/time_within_train_step": 27.70088291168213, "step": 160}
{"train_info/time_between_train_steps": 0.00513148307800293, "step": 160}
{"info/global_step": 161, "train_info/time_within_train_step": 27.737423419952393, "step": 161}
{"train_info/time_between_train_steps": 0.005547046661376953, "step": 161}
{"info/global_step": 162, "train_info/time_within_train_step": 27.718035221099854, "step": 162}
{"train_info/time_between_train_steps": 0.0066585540771484375, "step": 162}
{"train_info/time_between_train_steps": 30.146008014678955, "step": 162}
{"info/global_step": 163, "train_info/time_within_train_step": 27.691269636154175, "step": 163}
{"train_info/time_between_train_steps": 0.009775161743164062, "step": 163}
{"info/global_step": 164, "train_info/time_within_train_step": 27.79708456993103, "step": 164}
{"train_info/time_between_train_steps": 0.00982809066772461, "step": 164}
{"info/global_step": 165, "train_info/time_within_train_step": 27.7124981880188, "step": 165}
{"train_info/time_between_train_steps": 0.010118961334228516, "step": 165}
{"info/global_step": 166, "train_info/time_within_train_step": 27.86442995071411, "step": 166}
{"train_info/time_between_train_steps": 0.005469083786010742, "step": 166}
{"info/global_step": 167, "train_info/time_within_train_step": 27.796879529953003, "step": 167}
{"train_info/time_between_train_steps": 0.005290031433105469, "step": 167}
{"info/global_step": 168, "train_info/time_within_train_step": 27.87415337562561, "step": 168}
{"train_info/time_between_train_steps": 0.005539417266845703, "step": 168}
{"info/global_step": 169, "train_info/time_within_train_step": 27.772125720977783, "step": 169}
{"train_info/time_between_train_steps": 0.005262613296508789, "step": 169}
{"info/global_step": 170, "train_info/time_within_train_step": 27.792458534240723, "step": 170}
{"train_info/time_between_train_steps": 0.0053174495697021484, "step": 170}
{"info/global_step": 171, "train_info/time_within_train_step": 27.729955434799194, "step": 171}
{"train_info/time_between_train_steps": 0.005135297775268555, "step": 171}
{"info/global_step": 172, "train_info/time_within_train_step": 27.682992458343506, "step": 172}
{"train_info/time_between_train_steps": 0.005150794982910156, "step": 172}
{"info/global_step": 173, "train_info/time_within_train_step": 27.70274257659912, "step": 173}
{"train_info/time_between_train_steps": 0.005312442779541016, "step": 173}
{"info/global_step": 174, "train_info/time_within_train_step": 27.6839861869812, "step": 174}
{"train_info/time_between_train_steps": 0.004984617233276367, "step": 174}
{"info/global_step": 175, "train_info/time_within_train_step": 27.68492579460144, "step": 175}
{"train_info/time_between_train_steps": 0.005352497100830078, "step": 175}
{"info/global_step": 176, "train_info/time_within_train_step": 27.682879209518433, "step": 176}
{"train_info/time_between_train_steps": 0.0051381587982177734, "step": 176}
{"info/global_step": 177, "train_info/time_within_train_step": 27.690643072128296, "step": 177}
{"train_info/time_between_train_steps": 0.005058765411376953, "step": 177}
{"info/global_step": 178, "train_info/time_within_train_step": 27.70091676712036, "step": 178}
{"train_info/time_between_train_steps": 0.005292654037475586, "step": 178}
{"info/global_step": 179, "train_info/time_within_train_step": 27.700216054916382, "step": 179}
{"train_info/time_between_train_steps": 0.005173444747924805, "step": 179}
{"info/global_step": 180, "train_info/time_within_train_step": 27.686551332473755, "step": 180}
{"train_info/time_between_train_steps": 0.005277156829833984, "step": 180}
{"info/global_step": 181, "train_info/time_within_train_step": 27.723023414611816, "step": 181}
{"train_info/time_between_train_steps": 0.0051898956298828125, "step": 181}
{"info/global_step": 182, "train_info/time_within_train_step": 27.78919553756714, "step": 182}
{"train_info/time_between_train_steps": 0.005093812942504883, "step": 182}
{"info/global_step": 183, "train_info/time_within_train_step": 27.707981824874878, "step": 183}
{"train_info/time_between_train_steps": 0.0053501129150390625, "step": 183}
{"info/global_step": 184, "train_info/time_within_train_step": 27.712560176849365, "step": 184}
{"train_info/time_between_train_steps": 0.009626150131225586, "step": 184}
{"info/global_step": 185, "train_info/time_within_train_step": 27.69282865524292, "step": 185}
{"train_info/time_between_train_steps": 0.010521888732910156, "step": 185}
{"info/global_step": 186, "train_info/time_within_train_step": 27.744566679000854, "step": 186}
{"train_info/time_between_train_steps": 0.010106325149536133, "step": 186}
{"info/global_step": 187, "train_info/time_within_train_step": 27.683058977127075, "step": 187}
{"train_info/time_between_train_steps": 0.010000467300415039, "step": 187}
{"info/global_step": 188, "train_info/time_within_train_step": 27.705600023269653, "step": 188}
{"train_info/time_between_train_steps": 0.010479211807250977, "step": 188}
{"info/global_step": 189, "train_info/time_within_train_step": 27.70455288887024, "step": 189}
{"train_info/time_between_train_steps": 0.005850791931152344, "step": 189}
{"train_info/time_between_train_steps": 29.765056610107422, "step": 189}
{"info/global_step": 190, "train_info/time_within_train_step": 27.69384789466858, "step": 190}
{"train_info/time_between_train_steps": 0.005122661590576172, "step": 190}
{"info/global_step": 191, "train_info/time_within_train_step": 27.852377891540527, "step": 191}
{"train_info/time_between_train_steps": 0.006392002105712891, "step": 191}
{"info/global_step": 192, "train_info/time_within_train_step": 27.702239274978638, "step": 192}
{"train_info/time_between_train_steps": 0.0054666996002197266, "step": 192}
{"info/global_step": 193, "train_info/time_within_train_step": 27.823495149612427, "step": 193}
{"train_info/time_between_train_steps": 0.005356788635253906, "step": 193}
{"info/global_step": 194, "train_info/time_within_train_step": 27.693451404571533, "step": 194}
{"train_info/time_between_train_steps": 0.005388498306274414, "step": 194}
{"info/global_step": 195, "train_info/time_within_train_step": 27.867023229599, "step": 195}
{"train_info/time_between_train_steps": 0.005517721176147461, "step": 195}
{"info/global_step": 196, "train_info/time_within_train_step": 27.70014214515686, "step": 196}
{"train_info/time_between_train_steps": 0.005280971527099609, "step": 196}
{"info/global_step": 197, "train_info/time_within_train_step": 27.886200666427612, "step": 197}
{"train_info/time_between_train_steps": 0.006073951721191406, "step": 197}
{"info/global_step": 198, "train_info/time_within_train_step": 27.691112518310547, "step": 198}
{"train_info/time_between_train_steps": 0.004974365234375, "step": 198}
{"info/global_step": 199, "train_info/time_within_train_step": 27.677524089813232, "step": 199}
{"train_info/time_between_train_steps": 0.0051081180572509766, "step": 199}
{"info/global_step": 200, "train_info/time_within_train_step": 27.685187816619873, "step": 200}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740829914, "_runtime": 5863}, "step": 200}
{"logs": {"train/loss": 4.9158, "train/learning_rate": 0.0005555555555555556, "train/epoch": 7.01, "_timestamp": 1740829914, "_runtime": 5863}, "step": 200}
{"train_info/time_between_train_steps": 68.65972971916199, "step": 200}
{"info/global_step": 201, "train_info/time_within_train_step": 27.690451860427856, "step": 201}
{"train_info/time_between_train_steps": 0.005060434341430664, "step": 201}
{"info/global_step": 202, "train_info/time_within_train_step": 27.70335078239441, "step": 202}
{"train_info/time_between_train_steps": 0.005304813385009766, "step": 202}
{"info/global_step": 203, "train_info/time_within_train_step": 27.68970012664795, "step": 203}
{"train_info/time_between_train_steps": 0.00506901741027832, "step": 203}
{"info/global_step": 204, "train_info/time_within_train_step": 27.706671237945557, "step": 204}
{"train_info/time_between_train_steps": 0.005129337310791016, "step": 204}
{"info/global_step": 205, "train_info/time_within_train_step": 27.731332063674927, "step": 205}
{"train_info/time_between_train_steps": 0.00535893440246582, "step": 205}
{"info/global_step": 206, "train_info/time_within_train_step": 27.77019691467285, "step": 206}
{"train_info/time_between_train_steps": 0.00987100601196289, "step": 206}
{"info/global_step": 207, "train_info/time_within_train_step": 27.700847148895264, "step": 207}
{"train_info/time_between_train_steps": 0.0052220821380615234, "step": 207}
{"info/global_step": 208, "train_info/time_within_train_step": 27.733834266662598, "step": 208}
{"train_info/time_between_train_steps": 0.0052220821380615234, "step": 208}
{"info/global_step": 209, "train_info/time_within_train_step": 27.68312120437622, "step": 209}
{"train_info/time_between_train_steps": 0.005187273025512695, "step": 209}
{"info/global_step": 210, "train_info/time_within_train_step": 27.69752073287964, "step": 210}
{"train_info/time_between_train_steps": 0.005288600921630859, "step": 210}
{"info/global_step": 211, "train_info/time_within_train_step": 27.694874048233032, "step": 211}
{"train_info/time_between_train_steps": 0.005369901657104492, "step": 211}
{"info/global_step": 212, "train_info/time_within_train_step": 27.697333335876465, "step": 212}
{"train_info/time_between_train_steps": 0.005258321762084961, "step": 212}
{"info/global_step": 213, "train_info/time_within_train_step": 27.79727029800415, "step": 213}
{"train_info/time_between_train_steps": 0.00532841682434082, "step": 213}
{"info/global_step": 214, "train_info/time_within_train_step": 27.6985981464386, "step": 214}
{"train_info/time_between_train_steps": 0.005286693572998047, "step": 214}
{"info/global_step": 215, "train_info/time_within_train_step": 27.710121631622314, "step": 215}
{"train_info/time_between_train_steps": 0.005738496780395508, "step": 215}
{"info/global_step": 216, "train_info/time_within_train_step": 27.706376552581787, "step": 216}
{"train_info/time_between_train_steps": 0.005585432052612305, "step": 216}
{"train_info/time_between_train_steps": 29.84687614440918, "step": 216}
{"info/global_step": 217, "train_info/time_within_train_step": 27.700008153915405, "step": 217}
{"train_info/time_between_train_steps": 0.004994869232177734, "step": 217}
{"info/global_step": 218, "train_info/time_within_train_step": 27.80018639564514, "step": 218}
{"train_info/time_between_train_steps": 0.004944562911987305, "step": 218}
{"info/global_step": 219, "train_info/time_within_train_step": 27.687668085098267, "step": 219}
{"train_info/time_between_train_steps": 0.009992361068725586, "step": 219}
{"info/global_step": 220, "train_info/time_within_train_step": 27.837613582611084, "step": 220}
{"train_info/time_between_train_steps": 0.010288476943969727, "step": 220}
{"info/global_step": 221, "train_info/time_within_train_step": 27.731398105621338, "step": 221}
{"train_info/time_between_train_steps": 0.009811162948608398, "step": 221}
{"info/global_step": 222, "train_info/time_within_train_step": 27.889615297317505, "step": 222}
{"train_info/time_between_train_steps": 0.005448341369628906, "step": 222}
{"info/global_step": 223, "train_info/time_within_train_step": 27.70195746421814, "step": 223}
{"train_info/time_between_train_steps": 0.0052547454833984375, "step": 223}
{"info/global_step": 224, "train_info/time_within_train_step": 27.830727338790894, "step": 224}
{"train_info/time_between_train_steps": 0.005397319793701172, "step": 224}
{"info/global_step": 225, "train_info/time_within_train_step": 27.706448078155518, "step": 225}
{"train_info/time_between_train_steps": 0.0050852298736572266, "step": 225}
{"info/global_step": 226, "train_info/time_within_train_step": 27.680111169815063, "step": 226}
{"train_info/time_between_train_steps": 0.004983663558959961, "step": 226}
{"info/global_step": 227, "train_info/time_within_train_step": 27.792027711868286, "step": 227}
{"train_info/time_between_train_steps": 0.00510096549987793, "step": 227}
{"info/global_step": 228, "train_info/time_within_train_step": 27.681824445724487, "step": 228}
{"train_info/time_between_train_steps": 0.009984493255615234, "step": 228}
{"info/global_step": 229, "train_info/time_within_train_step": 27.690601348876953, "step": 229}
{"train_info/time_between_train_steps": 0.00533604621887207, "step": 229}
{"info/global_step": 230, "train_info/time_within_train_step": 27.680262327194214, "step": 230}
{"train_info/time_between_train_steps": 0.005041599273681641, "step": 230}
{"info/global_step": 231, "train_info/time_within_train_step": 27.689854621887207, "step": 231}
{"train_info/time_between_train_steps": 0.005084514617919922, "step": 231}
{"info/global_step": 232, "train_info/time_within_train_step": 27.695849418640137, "step": 232}
{"train_info/time_between_train_steps": 0.005303144454956055, "step": 232}
{"info/global_step": 233, "train_info/time_within_train_step": 27.747002124786377, "step": 233}
{"train_info/time_between_train_steps": 0.0051021575927734375, "step": 233}
{"info/global_step": 234, "train_info/time_within_train_step": 27.70759344100952, "step": 234}
{"train_info/time_between_train_steps": 0.005190372467041016, "step": 234}
{"info/global_step": 235, "train_info/time_within_train_step": 27.739644050598145, "step": 235}
{"train_info/time_between_train_steps": 0.00521397590637207, "step": 235}
{"info/global_step": 236, "train_info/time_within_train_step": 27.684016704559326, "step": 236}
{"train_info/time_between_train_steps": 0.005043506622314453, "step": 236}
{"info/global_step": 237, "train_info/time_within_train_step": 27.690277099609375, "step": 237}
{"train_info/time_between_train_steps": 0.01017141342163086, "step": 237}
{"info/global_step": 238, "train_info/time_within_train_step": 27.69309973716736, "step": 238}
{"train_info/time_between_train_steps": 0.005242347717285156, "step": 238}
{"info/global_step": 239, "train_info/time_within_train_step": 27.695059299468994, "step": 239}
{"train_info/time_between_train_steps": 0.00515294075012207, "step": 239}
{"info/global_step": 240, "train_info/time_within_train_step": 27.707957983016968, "step": 240}
{"train_info/time_between_train_steps": 0.005288839340209961, "step": 240}
{"info/global_step": 241, "train_info/time_within_train_step": 27.69513201713562, "step": 241}
{"train_info/time_between_train_steps": 0.005203723907470703, "step": 241}
{"info/global_step": 242, "train_info/time_within_train_step": 27.752567291259766, "step": 242}
{"train_info/time_between_train_steps": 0.0053021907806396484, "step": 242}
{"info/global_step": 243, "train_info/time_within_train_step": 27.82372260093689, "step": 243}
{"train_info/time_between_train_steps": 0.005800724029541016, "step": 243}
{"train_info/time_between_train_steps": 30.004590272903442, "step": 243}
{"info/global_step": 244, "train_info/time_within_train_step": 27.690030097961426, "step": 244}
{"train_info/time_between_train_steps": 0.009923219680786133, "step": 244}
{"info/global_step": 245, "train_info/time_within_train_step": 27.835737466812134, "step": 245}
{"train_info/time_between_train_steps": 0.010064125061035156, "step": 245}
{"info/global_step": 246, "train_info/time_within_train_step": 27.697606563568115, "step": 246}
{"train_info/time_between_train_steps": 0.010331869125366211, "step": 246}
{"info/global_step": 247, "train_info/time_within_train_step": 27.81367039680481, "step": 247}
{"train_info/time_between_train_steps": 0.005342960357666016, "step": 247}
{"info/global_step": 248, "train_info/time_within_train_step": 27.70019817352295, "step": 248}
{"train_info/time_between_train_steps": 0.005235910415649414, "step": 248}
{"info/global_step": 249, "train_info/time_within_train_step": 27.88652467727661, "step": 249}
{"train_info/time_between_train_steps": 0.005324840545654297, "step": 249}
{"info/global_step": 250, "train_info/time_within_train_step": 27.71311044692993, "step": 250}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740831430, "_runtime": 7379}, "step": 250}
{"logs": {"train/loss": 4.7809, "train/learning_rate": 0.0005277777777777777, "train/epoch": 9.01, "_timestamp": 1740831430, "_runtime": 7379}, "step": 250}
{"train_info/time_between_train_steps": 0.02584981918334961, "step": 250}
{"info/global_step": 251, "train_info/time_within_train_step": 27.768550872802734, "step": 251}
{"train_info/time_between_train_steps": 0.005216121673583984, "step": 251}
{"info/global_step": 252, "train_info/time_within_train_step": 27.718239545822144, "step": 252}
{"train_info/time_between_train_steps": 0.005140542984008789, "step": 252}
{"info/global_step": 253, "train_info/time_within_train_step": 27.957794189453125, "step": 253}
{"train_info/time_between_train_steps": 0.0055997371673583984, "step": 253}
{"info/global_step": 254, "train_info/time_within_train_step": 29.324788808822632, "step": 254}
{"train_info/time_between_train_steps": 0.009539365768432617, "step": 254}
{"info/global_step": 255, "train_info/time_within_train_step": 27.686142444610596, "step": 255}
{"train_info/time_between_train_steps": 0.009871959686279297, "step": 255}
{"info/global_step": 256, "train_info/time_within_train_step": 27.707345724105835, "step": 256}
{"train_info/time_between_train_steps": 0.0101318359375, "step": 256}
{"info/global_step": 257, "train_info/time_within_train_step": 27.684229612350464, "step": 257}
{"train_info/time_between_train_steps": 0.004990339279174805, "step": 257}
{"info/global_step": 258, "train_info/time_within_train_step": 27.822718381881714, "step": 258}
{"train_info/time_between_train_steps": 0.005110263824462891, "step": 258}
{"info/global_step": 259, "train_info/time_within_train_step": 27.706258296966553, "step": 259}
{"train_info/time_between_train_steps": 0.008712291717529297, "step": 259}
{"info/global_step": 260, "train_info/time_within_train_step": 27.748253107070923, "step": 260}
{"train_info/time_between_train_steps": 0.005133390426635742, "step": 260}
{"info/global_step": 261, "train_info/time_within_train_step": 27.686441898345947, "step": 261}
{"train_info/time_between_train_steps": 0.0050580501556396484, "step": 261}
{"info/global_step": 262, "train_info/time_within_train_step": 27.73181176185608, "step": 262}
{"train_info/time_between_train_steps": 0.005734920501708984, "step": 262}
{"info/global_step": 263, "train_info/time_within_train_step": 27.6821072101593, "step": 263}
{"train_info/time_between_train_steps": 0.005005359649658203, "step": 263}
{"info/global_step": 264, "train_info/time_within_train_step": 27.725099325180054, "step": 264}
{"train_info/time_between_train_steps": 0.005166292190551758, "step": 264}
{"info/global_step": 265, "train_info/time_within_train_step": 27.691503286361694, "step": 265}
{"train_info/time_between_train_steps": 0.0052411556243896484, "step": 265}
{"info/global_step": 266, "train_info/time_within_train_step": 27.688347339630127, "step": 266}
{"train_info/time_between_train_steps": 0.005199432373046875, "step": 266}
{"info/global_step": 267, "train_info/time_within_train_step": 27.68877124786377, "step": 267}
{"train_info/time_between_train_steps": 0.005328655242919922, "step": 267}
{"info/global_step": 268, "train_info/time_within_train_step": 27.701383352279663, "step": 268}
{"train_info/time_between_train_steps": 0.005228281021118164, "step": 268}
{"info/global_step": 269, "train_info/time_within_train_step": 27.719315767288208, "step": 269}
{"train_info/time_between_train_steps": 0.005315542221069336, "step": 269}
{"info/global_step": 270, "train_info/time_within_train_step": 27.72285032272339, "step": 270}
{"train_info/time_between_train_steps": 0.0058612823486328125, "step": 270}
{"train_info/time_between_train_steps": 29.74225878715515, "step": 270}
{"info/global_step": 271, "train_info/time_within_train_step": 27.699797868728638, "step": 271}
{"train_info/time_between_train_steps": 0.004974842071533203, "step": 271}
{"info/global_step": 272, "train_info/time_within_train_step": 27.974323987960815, "step": 272}
{"train_info/time_between_train_steps": 0.005283832550048828, "step": 272}
{"info/global_step": 273, "train_info/time_within_train_step": 27.71097707748413, "step": 273}
{"train_info/time_between_train_steps": 0.005384206771850586, "step": 273}
{"info/global_step": 274, "train_info/time_within_train_step": 27.852763891220093, "step": 274}
{"train_info/time_between_train_steps": 0.005238056182861328, "step": 274}
{"info/global_step": 275, "train_info/time_within_train_step": 27.69466280937195, "step": 275}
{"train_info/time_between_train_steps": 0.005295515060424805, "step": 275}
{"info/global_step": 276, "train_info/time_within_train_step": 27.86263680458069, "step": 276}
{"train_info/time_between_train_steps": 0.0054552555084228516, "step": 276}
{"info/global_step": 277, "train_info/time_within_train_step": 27.71383500099182, "step": 277}
{"train_info/time_between_train_steps": 0.005296230316162109, "step": 277}
{"info/global_step": 278, "train_info/time_within_train_step": 27.773378610610962, "step": 278}
{"train_info/time_between_train_steps": 0.005466938018798828, "step": 278}
{"info/global_step": 279, "train_info/time_within_train_step": 27.720260620117188, "step": 279}
{"train_info/time_between_train_steps": 0.0051517486572265625, "step": 279}
{"info/global_step": 280, "train_info/time_within_train_step": 27.68303108215332, "step": 280}
{"train_info/time_between_train_steps": 0.005066633224487305, "step": 280}
{"info/global_step": 281, "train_info/time_within_train_step": 27.699601650238037, "step": 281}
{"train_info/time_between_train_steps": 0.005049228668212891, "step": 281}
{"info/global_step": 282, "train_info/time_within_train_step": 27.687711477279663, "step": 282}
{"train_info/time_between_train_steps": 0.005125999450683594, "step": 282}
{"info/global_step": 283, "train_info/time_within_train_step": 27.739423513412476, "step": 283}
{"train_info/time_between_train_steps": 0.005048274993896484, "step": 283}
{"info/global_step": 284, "train_info/time_within_train_step": 27.696190118789673, "step": 284}
{"train_info/time_between_train_steps": 0.005054473876953125, "step": 284}
{"info/global_step": 285, "train_info/time_within_train_step": 27.7551748752594, "step": 285}
{"train_info/time_between_train_steps": 0.004928112030029297, "step": 285}
{"info/global_step": 286, "train_info/time_within_train_step": 27.709315061569214, "step": 286}
{"train_info/time_between_train_steps": 0.0049762725830078125, "step": 286}
{"info/global_step": 287, "train_info/time_within_train_step": 27.74649953842163, "step": 287}
{"train_info/time_between_train_steps": 0.005185127258300781, "step": 287}
{"info/global_step": 288, "train_info/time_within_train_step": 27.7759530544281, "step": 288}
{"train_info/time_between_train_steps": 0.004976987838745117, "step": 288}
{"info/global_step": 289, "train_info/time_within_train_step": 27.77699589729309, "step": 289}
{"train_info/time_between_train_steps": 0.0052242279052734375, "step": 289}
{"info/global_step": 290, "train_info/time_within_train_step": 27.66975450515747, "step": 290}
{"train_info/time_between_train_steps": 0.004957675933837891, "step": 290}
{"info/global_step": 291, "train_info/time_within_train_step": 27.696810007095337, "step": 291}
{"train_info/time_between_train_steps": 0.0049936771392822266, "step": 291}
{"info/global_step": 292, "train_info/time_within_train_step": 27.689391613006592, "step": 292}
{"train_info/time_between_train_steps": 0.00511479377746582, "step": 292}
{"info/global_step": 293, "train_info/time_within_train_step": 27.68093466758728, "step": 293}
{"train_info/time_between_train_steps": 0.005021572113037109, "step": 293}
{"info/global_step": 294, "train_info/time_within_train_step": 27.686478853225708, "step": 294}
{"train_info/time_between_train_steps": 0.0057065486907958984, "step": 294}
{"info/global_step": 295, "train_info/time_within_train_step": 27.676884412765503, "step": 295}
{"train_info/time_between_train_steps": 0.004882335662841797, "step": 295}
{"info/global_step": 296, "train_info/time_within_train_step": 27.744085550308228, "step": 296}
{"train_info/time_between_train_steps": 0.005126953125, "step": 296}
{"info/global_step": 297, "train_info/time_within_train_step": 27.702570915222168, "step": 297}
{"train_info/time_between_train_steps": 0.00536036491394043, "step": 297}
{"train_info/time_between_train_steps": 29.789317846298218, "step": 297}
{"info/global_step": 298, "train_info/time_within_train_step": 27.684459924697876, "step": 298}
{"train_info/time_between_train_steps": 0.0048944950103759766, "step": 298}
{"info/global_step": 299, "train_info/time_within_train_step": 27.833518505096436, "step": 299}
{"train_info/time_between_train_steps": 0.0049974918365478516, "step": 299}
{"info/global_step": 300, "train_info/time_within_train_step": 27.6945378780365, "step": 300}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740832880, "_runtime": 8829}, "step": 300}
{"logs": {"train/loss": 4.6208, "train/learning_rate": 0.0005, "train/epoch": 11.0, "_timestamp": 1740832880, "_runtime": 8829}, "step": 300}
{"train_info/time_between_train_steps": 65.89691710472107, "step": 300}
{"info/global_step": 301, "train_info/time_within_train_step": 28.31470823287964, "step": 301}
{"train_info/time_between_train_steps": 0.010166645050048828, "step": 301}
{"info/global_step": 302, "train_info/time_within_train_step": 27.703016757965088, "step": 302}
{"train_info/time_between_train_steps": 0.005416393280029297, "step": 302}
{"info/global_step": 303, "train_info/time_within_train_step": 27.96810746192932, "step": 303}
{"train_info/time_between_train_steps": 0.005486488342285156, "step": 303}
{"info/global_step": 304, "train_info/time_within_train_step": 27.700064182281494, "step": 304}
{"train_info/time_between_train_steps": 0.0052280426025390625, "step": 304}
{"info/global_step": 305, "train_info/time_within_train_step": 27.81597661972046, "step": 305}
{"train_info/time_between_train_steps": 0.00540614128112793, "step": 305}
{"info/global_step": 306, "train_info/time_within_train_step": 27.68986177444458, "step": 306}
{"train_info/time_between_train_steps": 0.004990577697753906, "step": 306}
{"info/global_step": 307, "train_info/time_within_train_step": 27.671053409576416, "step": 307}
{"train_info/time_between_train_steps": 0.004998922348022461, "step": 307}
{"info/global_step": 308, "train_info/time_within_train_step": 27.699034214019775, "step": 308}
{"train_info/time_between_train_steps": 0.005150794982910156, "step": 308}
{"info/global_step": 309, "train_info/time_within_train_step": 27.68761134147644, "step": 309}
{"train_info/time_between_train_steps": 0.0050122737884521484, "step": 309}
{"info/global_step": 310, "train_info/time_within_train_step": 27.728851318359375, "step": 310}
{"train_info/time_between_train_steps": 0.005139827728271484, "step": 310}
{"info/global_step": 311, "train_info/time_within_train_step": 27.689040422439575, "step": 311}
{"train_info/time_between_train_steps": 0.005077838897705078, "step": 311}
{"info/global_step": 312, "train_info/time_within_train_step": 27.74622416496277, "step": 312}
{"train_info/time_between_train_steps": 0.004988908767700195, "step": 312}
{"info/global_step": 313, "train_info/time_within_train_step": 27.69682765007019, "step": 313}
{"train_info/time_between_train_steps": 0.005201101303100586, "step": 313}
{"info/global_step": 314, "train_info/time_within_train_step": 27.77381134033203, "step": 314}
{"train_info/time_between_train_steps": 0.0049626827239990234, "step": 314}
{"info/global_step": 315, "train_info/time_within_train_step": 27.68382692337036, "step": 315}
{"train_info/time_between_train_steps": 0.010013341903686523, "step": 315}
{"info/global_step": 316, "train_info/time_within_train_step": 28.080734729766846, "step": 316}
{"train_info/time_between_train_steps": 0.014333486557006836, "step": 316}
{"info/global_step": 317, "train_info/time_within_train_step": 27.81632661819458, "step": 317}
{"train_info/time_between_train_steps": 0.005003929138183594, "step": 317}
{"info/global_step": 318, "train_info/time_within_train_step": 27.82829475402832, "step": 318}
{"train_info/time_between_train_steps": 0.014801025390625, "step": 318}
{"info/global_step": 319, "train_info/time_within_train_step": 27.73217535018921, "step": 319}
{"train_info/time_between_train_steps": 0.009831905364990234, "step": 319}
{"info/global_step": 320, "train_info/time_within_train_step": 27.795313596725464, "step": 320}
{"train_info/time_between_train_steps": 0.010039806365966797, "step": 320}
{"info/global_step": 321, "train_info/time_within_train_step": 27.756673097610474, "step": 321}
{"train_info/time_between_train_steps": 0.005138874053955078, "step": 321}
{"info/global_step": 322, "train_info/time_within_train_step": 27.68706202507019, "step": 322}
{"train_info/time_between_train_steps": 0.005056142807006836, "step": 322}
{"info/global_step": 323, "train_info/time_within_train_step": 27.746856212615967, "step": 323}
{"train_info/time_between_train_steps": 0.005658626556396484, "step": 323}
{"info/global_step": 324, "train_info/time_within_train_step": 27.71417546272278, "step": 324}
{"train_info/time_between_train_steps": 0.005705356597900391, "step": 324}
{"train_info/time_between_train_steps": 29.95971655845642, "step": 324}
{"info/global_step": 325, "train_info/time_within_train_step": 27.683840036392212, "step": 325}
{"train_info/time_between_train_steps": 0.004889249801635742, "step": 325}
{"info/global_step": 326, "train_info/time_within_train_step": 27.82358717918396, "step": 326}
{"train_info/time_between_train_steps": 0.005277156829833984, "step": 326}
{"info/global_step": 327, "train_info/time_within_train_step": 27.729092359542847, "step": 327}
{"train_info/time_between_train_steps": 0.0061452388763427734, "step": 327}
{"info/global_step": 328, "train_info/time_within_train_step": 27.825883626937866, "step": 328}
{"train_info/time_between_train_steps": 0.0052947998046875, "step": 328}
{"info/global_step": 329, "train_info/time_within_train_step": 27.68842363357544, "step": 329}
{"train_info/time_between_train_steps": 0.005503654479980469, "step": 329}
{"info/global_step": 330, "train_info/time_within_train_step": 27.88675880432129, "step": 330}
{"train_info/time_between_train_steps": 0.005421161651611328, "step": 330}
{"info/global_step": 331, "train_info/time_within_train_step": 27.687194108963013, "step": 331}
{"train_info/time_between_train_steps": 0.00525975227355957, "step": 331}
{"info/global_step": 332, "train_info/time_within_train_step": 27.814470529556274, "step": 332}
{"train_info/time_between_train_steps": 0.005290031433105469, "step": 332}
{"info/global_step": 333, "train_info/time_within_train_step": 27.794780015945435, "step": 333}
{"train_info/time_between_train_steps": 0.005058765411376953, "step": 333}
{"info/global_step": 334, "train_info/time_within_train_step": 27.686293363571167, "step": 334}
{"train_info/time_between_train_steps": 0.0050656795501708984, "step": 334}
{"info/global_step": 335, "train_info/time_within_train_step": 27.739587783813477, "step": 335}
{"train_info/time_between_train_steps": 0.005070686340332031, "step": 335}
{"info/global_step": 336, "train_info/time_within_train_step": 27.68271493911743, "step": 336}
{"train_info/time_between_train_steps": 0.005087137222290039, "step": 336}
{"info/global_step": 337, "train_info/time_within_train_step": 27.72687554359436, "step": 337}
{"train_info/time_between_train_steps": 0.005151987075805664, "step": 337}
{"info/global_step": 338, "train_info/time_within_train_step": 27.696459531784058, "step": 338}
{"train_info/time_between_train_steps": 0.005015850067138672, "step": 338}
{"info/global_step": 339, "train_info/time_within_train_step": 27.739161491394043, "step": 339}
{"train_info/time_between_train_steps": 0.005136966705322266, "step": 339}
{"info/global_step": 340, "train_info/time_within_train_step": 27.698787450790405, "step": 340}
{"train_info/time_between_train_steps": 0.005093097686767578, "step": 340}
{"info/global_step": 341, "train_info/time_within_train_step": 27.721898317337036, "step": 341}
{"train_info/time_between_train_steps": 0.0051343441009521484, "step": 341}
{"info/global_step": 342, "train_info/time_within_train_step": 27.677818775177002, "step": 342}
{"train_info/time_between_train_steps": 0.005182981491088867, "step": 342}
{"info/global_step": 343, "train_info/time_within_train_step": 27.718980312347412, "step": 343}
{"train_info/time_between_train_steps": 0.005194187164306641, "step": 343}
{"info/global_step": 344, "train_info/time_within_train_step": 27.698964834213257, "step": 344}
{"train_info/time_between_train_steps": 0.005169391632080078, "step": 344}
{"info/global_step": 345, "train_info/time_within_train_step": 27.683090925216675, "step": 345}
{"train_info/time_between_train_steps": 0.005137205123901367, "step": 345}
{"info/global_step": 346, "train_info/time_within_train_step": 27.682157039642334, "step": 346}
{"train_info/time_between_train_steps": 0.005159616470336914, "step": 346}
{"info/global_step": 347, "train_info/time_within_train_step": 27.68567419052124, "step": 347}
{"train_info/time_between_train_steps": 0.005208492279052734, "step": 347}
{"info/global_step": 348, "train_info/time_within_train_step": 27.780143976211548, "step": 348}
{"train_info/time_between_train_steps": 0.010355472564697266, "step": 348}
{"info/global_step": 349, "train_info/time_within_train_step": 27.722211122512817, "step": 349}
{"train_info/time_between_train_steps": 0.0056040287017822266, "step": 349}
{"info/global_step": 350, "train_info/time_within_train_step": 29.383646726608276, "step": 350}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740834368, "_runtime": 10317}, "step": 350}
{"logs": {"train/loss": 4.3481, "train/learning_rate": 0.00047222222222222224, "train/epoch": 12.02, "_timestamp": 1740834368, "_runtime": 10317}, "step": 350}
{"train_info/time_between_train_steps": 0.7293825149536133, "step": 350}
{"info/global_step": 351, "train_info/time_within_train_step": 27.71374201774597, "step": 351}
{"train_info/time_between_train_steps": 0.005836963653564453, "step": 351}
{"train_info/time_between_train_steps": 30.10848879814148, "step": 351}
{"info/global_step": 352, "train_info/time_within_train_step": 27.692814111709595, "step": 352}
{"train_info/time_between_train_steps": 0.0050792694091796875, "step": 352}
{"info/global_step": 353, "train_info/time_within_train_step": 27.843517780303955, "step": 353}
{"train_info/time_between_train_steps": 0.0052645206451416016, "step": 353}
{"info/global_step": 354, "train_info/time_within_train_step": 27.688941717147827, "step": 354}
{"train_info/time_between_train_steps": 0.00531458854675293, "step": 354}
{"info/global_step": 355, "train_info/time_within_train_step": 27.858290672302246, "step": 355}
{"train_info/time_between_train_steps": 0.0052776336669921875, "step": 355}
{"info/global_step": 356, "train_info/time_within_train_step": 27.70293617248535, "step": 356}
{"train_info/time_between_train_steps": 0.005409955978393555, "step": 356}
{"info/global_step": 357, "train_info/time_within_train_step": 27.815258741378784, "step": 357}
{"train_info/time_between_train_steps": 0.005219459533691406, "step": 357}
{"info/global_step": 358, "train_info/time_within_train_step": 27.68798303604126, "step": 358}
{"train_info/time_between_train_steps": 0.005445718765258789, "step": 358}
{"info/global_step": 359, "train_info/time_within_train_step": 27.771528720855713, "step": 359}
{"train_info/time_between_train_steps": 0.005360603332519531, "step": 359}
{"info/global_step": 360, "train_info/time_within_train_step": 27.696993112564087, "step": 360}
{"train_info/time_between_train_steps": 0.0050313472747802734, "step": 360}
{"info/global_step": 361, "train_info/time_within_train_step": 27.67265224456787, "step": 361}
{"train_info/time_between_train_steps": 0.0050811767578125, "step": 361}
{"info/global_step": 362, "train_info/time_within_train_step": 27.71242332458496, "step": 362}
{"train_info/time_between_train_steps": 0.004982948303222656, "step": 362}
{"info/global_step": 363, "train_info/time_within_train_step": 27.78746271133423, "step": 363}
{"train_info/time_between_train_steps": 0.005163431167602539, "step": 363}
{"info/global_step": 364, "train_info/time_within_train_step": 27.685216426849365, "step": 364}
{"train_info/time_between_train_steps": 0.0049974918365478516, "step": 364}
{"info/global_step": 365, "train_info/time_within_train_step": 27.699547052383423, "step": 365}
{"train_info/time_between_train_steps": 0.005105257034301758, "step": 365}
{"info/global_step": 366, "train_info/time_within_train_step": 27.679184913635254, "step": 366}
{"train_info/time_between_train_steps": 0.005199909210205078, "step": 366}
{"info/global_step": 367, "train_info/time_within_train_step": 27.686453342437744, "step": 367}
{"train_info/time_between_train_steps": 0.005114078521728516, "step": 367}
{"info/global_step": 368, "train_info/time_within_train_step": 27.691442489624023, "step": 368}
{"train_info/time_between_train_steps": 0.005526304244995117, "step": 368}
{"info/global_step": 369, "train_info/time_within_train_step": 27.687214136123657, "step": 369}
{"train_info/time_between_train_steps": 0.005266427993774414, "step": 369}
{"info/global_step": 370, "train_info/time_within_train_step": 27.733667135238647, "step": 370}
{"train_info/time_between_train_steps": 0.005341053009033203, "step": 370}
{"info/global_step": 371, "train_info/time_within_train_step": 27.71192479133606, "step": 371}
{"train_info/time_between_train_steps": 0.005162715911865234, "step": 371}
{"info/global_step": 372, "train_info/time_within_train_step": 27.678988218307495, "step": 372}
{"train_info/time_between_train_steps": 0.005349874496459961, "step": 372}
{"info/global_step": 373, "train_info/time_within_train_step": 27.689069509506226, "step": 373}
{"train_info/time_between_train_steps": 0.005288124084472656, "step": 373}
{"info/global_step": 374, "train_info/time_within_train_step": 27.694862365722656, "step": 374}
{"train_info/time_between_train_steps": 0.005211830139160156, "step": 374}
{"info/global_step": 375, "train_info/time_within_train_step": 27.749579429626465, "step": 375}
{"train_info/time_between_train_steps": 0.005239248275756836, "step": 375}
{"info/global_step": 376, "train_info/time_within_train_step": 27.689353942871094, "step": 376}
{"train_info/time_between_train_steps": 0.005298614501953125, "step": 376}
{"info/global_step": 377, "train_info/time_within_train_step": 27.692123651504517, "step": 377}
{"train_info/time_between_train_steps": 0.006635904312133789, "step": 377}
{"info/global_step": 378, "train_info/time_within_train_step": 27.70120668411255, "step": 378}
{"train_info/time_between_train_steps": 0.005726814270019531, "step": 378}
{"train_info/time_between_train_steps": 29.77442169189453, "step": 378}
{"info/global_step": 379, "train_info/time_within_train_step": 27.694073915481567, "step": 379}
{"train_info/time_between_train_steps": 0.005371570587158203, "step": 379}
{"info/global_step": 380, "train_info/time_within_train_step": 27.83268141746521, "step": 380}
{"train_info/time_between_train_steps": 0.005142927169799805, "step": 380}
{"info/global_step": 381, "train_info/time_within_train_step": 27.689643383026123, "step": 381}
{"train_info/time_between_train_steps": 0.006165027618408203, "step": 381}
{"info/global_step": 382, "train_info/time_within_train_step": 27.888978242874146, "step": 382}
{"train_info/time_between_train_steps": 0.005408048629760742, "step": 382}
{"info/global_step": 383, "train_info/time_within_train_step": 27.694881200790405, "step": 383}
{"train_info/time_between_train_steps": 0.005347490310668945, "step": 383}
{"info/global_step": 384, "train_info/time_within_train_step": 28.00465154647827, "step": 384}
{"train_info/time_between_train_steps": 0.005627632141113281, "step": 384}
{"info/global_step": 385, "train_info/time_within_train_step": 27.708280324935913, "step": 385}
{"train_info/time_between_train_steps": 0.005397319793701172, "step": 385}
{"info/global_step": 386, "train_info/time_within_train_step": 27.77204155921936, "step": 386}
{"train_info/time_between_train_steps": 0.005115985870361328, "step": 386}
{"info/global_step": 387, "train_info/time_within_train_step": 27.733999252319336, "step": 387}
{"train_info/time_between_train_steps": 0.009888410568237305, "step": 387}
{"info/global_step": 388, "train_info/time_within_train_step": 27.67678475379944, "step": 388}
{"train_info/time_between_train_steps": 0.004895687103271484, "step": 388}
{"info/global_step": 389, "train_info/time_within_train_step": 27.685023069381714, "step": 389}
{"train_info/time_between_train_steps": 0.004931449890136719, "step": 389}
{"info/global_step": 390, "train_info/time_within_train_step": 27.67155885696411, "step": 390}
{"train_info/time_between_train_steps": 0.005100727081298828, "step": 390}
{"info/global_step": 391, "train_info/time_within_train_step": 27.738587141036987, "step": 391}
{"train_info/time_between_train_steps": 0.004996776580810547, "step": 391}
{"info/global_step": 392, "train_info/time_within_train_step": 27.688738107681274, "step": 392}
{"train_info/time_between_train_steps": 0.005154132843017578, "step": 392}
{"info/global_step": 393, "train_info/time_within_train_step": 27.81110382080078, "step": 393}
{"train_info/time_between_train_steps": 0.004900455474853516, "step": 393}
{"info/global_step": 394, "train_info/time_within_train_step": 27.670275449752808, "step": 394}
{"train_info/time_between_train_steps": 0.005010843276977539, "step": 394}
{"info/global_step": 395, "train_info/time_within_train_step": 27.731797218322754, "step": 395}
{"train_info/time_between_train_steps": 0.005105257034301758, "step": 395}
{"info/global_step": 396, "train_info/time_within_train_step": 27.68563485145569, "step": 396}
{"train_info/time_between_train_steps": 0.004901409149169922, "step": 396}
{"info/global_step": 397, "train_info/time_within_train_step": 27.736372232437134, "step": 397}
{"train_info/time_between_train_steps": 0.005099058151245117, "step": 397}
{"info/global_step": 398, "train_info/time_within_train_step": 27.685951948165894, "step": 398}
{"train_info/time_between_train_steps": 0.004903554916381836, "step": 398}
{"info/global_step": 399, "train_info/time_within_train_step": 27.67534303665161, "step": 399}
{"train_info/time_between_train_steps": 0.005183219909667969, "step": 399}
{"info/global_step": 400, "train_info/time_within_train_step": 27.673490047454834, "step": 400}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740835816, "_runtime": 11765}, "step": 400}
{"logs": {"train/loss": 4.2378, "train/learning_rate": 0.00044444444444444436, "train/epoch": 14.02, "_timestamp": 1740835816, "_runtime": 11765}, "step": 400}
{"train_info/time_between_train_steps": 64.01022624969482, "step": 400}
{"info/global_step": 401, "train_info/time_within_train_step": 27.715702295303345, "step": 401}
{"train_info/time_between_train_steps": 0.005244731903076172, "step": 401}
{"info/global_step": 402, "train_info/time_within_train_step": 27.691340923309326, "step": 402}
{"train_info/time_between_train_steps": 0.004961967468261719, "step": 402}
{"info/global_step": 403, "train_info/time_within_train_step": 27.705077409744263, "step": 403}
{"train_info/time_between_train_steps": 0.005106210708618164, "step": 403}
{"info/global_step": 404, "train_info/time_within_train_step": 27.694612741470337, "step": 404}
{"train_info/time_between_train_steps": 0.005345344543457031, "step": 404}
{"info/global_step": 405, "train_info/time_within_train_step": 27.696762561798096, "step": 405}
{"train_info/time_between_train_steps": 0.005524158477783203, "step": 405}
{"train_info/time_between_train_steps": 29.747445106506348, "step": 405}
{"info/global_step": 406, "train_info/time_within_train_step": 27.695367097854614, "step": 406}
{"train_info/time_between_train_steps": 0.004847288131713867, "step": 406}
{"info/global_step": 407, "train_info/time_within_train_step": 27.857388734817505, "step": 407}
{"train_info/time_between_train_steps": 0.005078315734863281, "step": 407}
{"info/global_step": 408, "train_info/time_within_train_step": 27.793639659881592, "step": 408}
{"train_info/time_between_train_steps": 0.005339622497558594, "step": 408}
{"info/global_step": 409, "train_info/time_within_train_step": 27.83681297302246, "step": 409}
{"train_info/time_between_train_steps": 0.005090951919555664, "step": 409}
{"info/global_step": 410, "train_info/time_within_train_step": 27.721065998077393, "step": 410}
{"train_info/time_between_train_steps": 0.005240917205810547, "step": 410}
{"info/global_step": 411, "train_info/time_within_train_step": 27.846831560134888, "step": 411}
{"train_info/time_between_train_steps": 0.005246400833129883, "step": 411}
{"info/global_step": 412, "train_info/time_within_train_step": 27.68318271636963, "step": 412}
{"train_info/time_between_train_steps": 0.004983186721801758, "step": 412}
{"info/global_step": 413, "train_info/time_within_train_step": 27.79054307937622, "step": 413}
{"train_info/time_between_train_steps": 0.010418891906738281, "step": 413}
{"info/global_step": 414, "train_info/time_within_train_step": 27.710638523101807, "step": 414}
{"train_info/time_between_train_steps": 0.004860877990722656, "step": 414}
{"info/global_step": 415, "train_info/time_within_train_step": 27.735029935836792, "step": 415}
{"train_info/time_between_train_steps": 0.009807348251342773, "step": 415}
{"info/global_step": 416, "train_info/time_within_train_step": 27.702127933502197, "step": 416}
{"train_info/time_between_train_steps": 0.004975080490112305, "step": 416}
{"info/global_step": 417, "train_info/time_within_train_step": 27.669419288635254, "step": 417}
{"train_info/time_between_train_steps": 0.004876852035522461, "step": 417}
{"info/global_step": 418, "train_info/time_within_train_step": 27.723541498184204, "step": 418}
{"train_info/time_between_train_steps": 0.009755611419677734, "step": 418}
{"info/global_step": 419, "train_info/time_within_train_step": 27.684327602386475, "step": 419}
{"train_info/time_between_train_steps": 0.004923105239868164, "step": 419}
{"info/global_step": 420, "train_info/time_within_train_step": 27.727847576141357, "step": 420}
{"train_info/time_between_train_steps": 0.004906654357910156, "step": 420}
{"info/global_step": 421, "train_info/time_within_train_step": 27.688854217529297, "step": 421}
{"train_info/time_between_train_steps": 0.00513911247253418, "step": 421}
{"info/global_step": 422, "train_info/time_within_train_step": 27.6735999584198, "step": 422}
{"train_info/time_between_train_steps": 0.009706497192382812, "step": 422}
{"info/global_step": 423, "train_info/time_within_train_step": 27.669618368148804, "step": 423}
{"train_info/time_between_train_steps": 0.00496673583984375, "step": 423}
{"info/global_step": 424, "train_info/time_within_train_step": 27.767581701278687, "step": 424}
{"train_info/time_between_train_steps": 0.010165929794311523, "step": 424}
{"info/global_step": 425, "train_info/time_within_train_step": 27.670666694641113, "step": 425}
{"train_info/time_between_train_steps": 0.009455680847167969, "step": 425}
{"info/global_step": 426, "train_info/time_within_train_step": 27.67463207244873, "step": 426}
{"train_info/time_between_train_steps": 0.005069732666015625, "step": 426}
{"info/global_step": 427, "train_info/time_within_train_step": 27.675658464431763, "step": 427}
{"train_info/time_between_train_steps": 0.005036115646362305, "step": 427}
{"info/global_step": 428, "train_info/time_within_train_step": 27.673872709274292, "step": 428}
{"train_info/time_between_train_steps": 0.005051612854003906, "step": 428}
{"info/global_step": 429, "train_info/time_within_train_step": 27.67629361152649, "step": 429}
{"train_info/time_between_train_steps": 0.00524592399597168, "step": 429}
{"info/global_step": 430, "train_info/time_within_train_step": 27.681583881378174, "step": 430}
{"train_info/time_between_train_steps": 0.005123615264892578, "step": 430}
{"info/global_step": 431, "train_info/time_within_train_step": 27.693169593811035, "step": 431}
{"train_info/time_between_train_steps": 0.005305051803588867, "step": 431}
{"info/global_step": 432, "train_info/time_within_train_step": 27.69833278656006, "step": 432}
{"train_info/time_between_train_steps": 0.010790348052978516, "step": 432}
{"train_info/time_between_train_steps": 29.937363624572754, "step": 432}
{"info/global_step": 433, "train_info/time_within_train_step": 27.687923908233643, "step": 433}
{"train_info/time_between_train_steps": 0.00988459587097168, "step": 433}
{"info/global_step": 434, "train_info/time_within_train_step": 27.857445001602173, "step": 434}
{"train_info/time_between_train_steps": 0.009891510009765625, "step": 434}
{"info/global_step": 435, "train_info/time_within_train_step": 27.67554807662964, "step": 435}
{"train_info/time_between_train_steps": 0.009940624237060547, "step": 435}
{"info/global_step": 436, "train_info/time_within_train_step": 27.79150629043579, "step": 436}
{"train_info/time_between_train_steps": 0.009677648544311523, "step": 436}
{"info/global_step": 437, "train_info/time_within_train_step": 27.675451517105103, "step": 437}
{"train_info/time_between_train_steps": 0.005045413970947266, "step": 437}
{"info/global_step": 438, "train_info/time_within_train_step": 27.98516273498535, "step": 438}
{"train_info/time_between_train_steps": 0.0052640438079833984, "step": 438}
{"info/global_step": 439, "train_info/time_within_train_step": 27.677082538604736, "step": 439}
{"train_info/time_between_train_steps": 0.005086421966552734, "step": 439}
{"info/global_step": 440, "train_info/time_within_train_step": 27.727195978164673, "step": 440}
{"train_info/time_between_train_steps": 0.005097627639770508, "step": 440}
{"info/global_step": 441, "train_info/time_within_train_step": 27.68182063102722, "step": 441}
{"train_info/time_between_train_steps": 0.0049326419830322266, "step": 441}
{"info/global_step": 442, "train_info/time_within_train_step": 27.665661096572876, "step": 442}
{"train_info/time_between_train_steps": 0.004942655563354492, "step": 442}
{"info/global_step": 443, "train_info/time_within_train_step": 27.67825198173523, "step": 443}
{"train_info/time_between_train_steps": 0.004904270172119141, "step": 443}
{"info/global_step": 444, "train_info/time_within_train_step": 27.681687116622925, "step": 444}
{"train_info/time_between_train_steps": 0.004858255386352539, "step": 444}
{"info/global_step": 445, "train_info/time_within_train_step": 29.499985456466675, "step": 445}
{"train_info/time_between_train_steps": 0.005654811859130859, "step": 445}
{"info/global_step": 446, "train_info/time_within_train_step": 27.797162532806396, "step": 446}
{"train_info/time_between_train_steps": 0.00486445426940918, "step": 446}
{"info/global_step": 447, "train_info/time_within_train_step": 27.720513582229614, "step": 447}
{"train_info/time_between_train_steps": 0.004870891571044922, "step": 447}
{"info/global_step": 448, "train_info/time_within_train_step": 27.697356700897217, "step": 448}
{"train_info/time_between_train_steps": 0.005402088165283203, "step": 448}
{"info/global_step": 449, "train_info/time_within_train_step": 27.726869106292725, "step": 449}
{"train_info/time_between_train_steps": 0.00550532341003418, "step": 449}
{"info/global_step": 450, "train_info/time_within_train_step": 27.684000253677368, "step": 450}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740837330, "_runtime": 13279}, "step": 450}
{"logs": {"train/loss": 4.0729, "train/learning_rate": 0.00041666666666666664, "train/epoch": 16.02, "_timestamp": 1740837330, "_runtime": 13279}, "step": 450}
{"train_info/time_between_train_steps": 0.025930166244506836, "step": 450}
{"info/global_step": 451, "train_info/time_within_train_step": 27.73427438735962, "step": 451}
{"train_info/time_between_train_steps": 0.005078315734863281, "step": 451}
{"info/global_step": 452, "train_info/time_within_train_step": 27.684383153915405, "step": 452}
{"train_info/time_between_train_steps": 0.004854440689086914, "step": 452}
{"info/global_step": 453, "train_info/time_within_train_step": 27.677574396133423, "step": 453}
{"train_info/time_between_train_steps": 0.004899740219116211, "step": 453}
{"info/global_step": 454, "train_info/time_within_train_step": 27.80413317680359, "step": 454}
{"train_info/time_between_train_steps": 0.005186796188354492, "step": 454}
{"info/global_step": 455, "train_info/time_within_train_step": 27.690826177597046, "step": 455}
{"train_info/time_between_train_steps": 0.004988193511962891, "step": 455}
{"info/global_step": 456, "train_info/time_within_train_step": 27.71909523010254, "step": 456}
{"train_info/time_between_train_steps": 0.004974842071533203, "step": 456}
{"info/global_step": 457, "train_info/time_within_train_step": 27.686352729797363, "step": 457}
{"train_info/time_between_train_steps": 0.005320072174072266, "step": 457}
{"info/global_step": 458, "train_info/time_within_train_step": 27.71625781059265, "step": 458}
{"train_info/time_between_train_steps": 0.005297660827636719, "step": 458}
{"info/global_step": 459, "train_info/time_within_train_step": 27.711673498153687, "step": 459}
{"train_info/time_between_train_steps": 0.005975008010864258, "step": 459}
{"train_info/time_between_train_steps": 29.592323303222656, "step": 459}
{"info/global_step": 460, "train_info/time_within_train_step": 27.677295684814453, "step": 460}
{"train_info/time_between_train_steps": 0.004805803298950195, "step": 460}
{"info/global_step": 461, "train_info/time_within_train_step": 27.846956729888916, "step": 461}
{"train_info/time_between_train_steps": 0.005087375640869141, "step": 461}
{"info/global_step": 462, "train_info/time_within_train_step": 27.69061017036438, "step": 462}
{"train_info/time_between_train_steps": 0.0051424503326416016, "step": 462}
{"info/global_step": 463, "train_info/time_within_train_step": 27.812079191207886, "step": 463}
{"train_info/time_between_train_steps": 0.005174398422241211, "step": 463}
{"info/global_step": 464, "train_info/time_within_train_step": 27.69693946838379, "step": 464}
{"train_info/time_between_train_steps": 0.0055429935455322266, "step": 464}
{"info/global_step": 465, "train_info/time_within_train_step": 27.84162712097168, "step": 465}
{"train_info/time_between_train_steps": 0.0051915645599365234, "step": 465}
{"info/global_step": 466, "train_info/time_within_train_step": 27.686394929885864, "step": 466}
{"train_info/time_between_train_steps": 0.0054302215576171875, "step": 466}
{"info/global_step": 467, "train_info/time_within_train_step": 27.76968502998352, "step": 467}
{"train_info/time_between_train_steps": 0.005197763442993164, "step": 467}
{"info/global_step": 468, "train_info/time_within_train_step": 27.7227725982666, "step": 468}
{"train_info/time_between_train_steps": 0.0049970149993896484, "step": 468}
{"info/global_step": 469, "train_info/time_within_train_step": 27.77405023574829, "step": 469}
{"train_info/time_between_train_steps": 0.005004405975341797, "step": 469}
{"info/global_step": 470, "train_info/time_within_train_step": 27.722710609436035, "step": 470}
{"train_info/time_between_train_steps": 0.005176544189453125, "step": 470}
{"info/global_step": 471, "train_info/time_within_train_step": 27.690796375274658, "step": 471}
{"train_info/time_between_train_steps": 0.005308389663696289, "step": 471}
{"info/global_step": 472, "train_info/time_within_train_step": 27.737648010253906, "step": 472}
{"train_info/time_between_train_steps": 0.0050678253173828125, "step": 472}
{"info/global_step": 473, "train_info/time_within_train_step": 27.690638780593872, "step": 473}
{"train_info/time_between_train_steps": 0.004964113235473633, "step": 473}
{"info/global_step": 474, "train_info/time_within_train_step": 27.7276713848114, "step": 474}
{"train_info/time_between_train_steps": 0.005186796188354492, "step": 474}
{"info/global_step": 475, "train_info/time_within_train_step": 27.677839994430542, "step": 475}
{"train_info/time_between_train_steps": 0.00987553596496582, "step": 475}
{"info/global_step": 476, "train_info/time_within_train_step": 27.776566982269287, "step": 476}
{"train_info/time_between_train_steps": 0.005464076995849609, "step": 476}
{"info/global_step": 477, "train_info/time_within_train_step": 27.699624061584473, "step": 477}
{"train_info/time_between_train_steps": 0.005422830581665039, "step": 477}
{"info/global_step": 478, "train_info/time_within_train_step": 27.673069715499878, "step": 478}
{"train_info/time_between_train_steps": 0.005317211151123047, "step": 478}
{"info/global_step": 479, "train_info/time_within_train_step": 27.68050718307495, "step": 479}
{"train_info/time_between_train_steps": 0.00502777099609375, "step": 479}
{"info/global_step": 480, "train_info/time_within_train_step": 27.67504906654358, "step": 480}
{"train_info/time_between_train_steps": 0.005350828170776367, "step": 480}
{"info/global_step": 481, "train_info/time_within_train_step": 27.692520141601562, "step": 481}
{"train_info/time_between_train_steps": 0.0065155029296875, "step": 481}
{"info/global_step": 482, "train_info/time_within_train_step": 27.818052291870117, "step": 482}
{"train_info/time_between_train_steps": 0.014669179916381836, "step": 482}
{"info/global_step": 483, "train_info/time_within_train_step": 27.7994704246521, "step": 483}
{"train_info/time_between_train_steps": 0.0051119327545166016, "step": 483}
{"info/global_step": 484, "train_info/time_within_train_step": 27.80413031578064, "step": 484}
{"train_info/time_between_train_steps": 0.0051326751708984375, "step": 484}
{"info/global_step": 485, "train_info/time_within_train_step": 27.73630380630493, "step": 485}
{"train_info/time_between_train_steps": 0.005503654479980469, "step": 485}
{"info/global_step": 486, "train_info/time_within_train_step": 27.70350408554077, "step": 486}
{"train_info/time_between_train_steps": 0.01563715934753418, "step": 486}
{"train_info/time_between_train_steps": 29.821906566619873, "step": 486}
{"info/global_step": 487, "train_info/time_within_train_step": 27.707539081573486, "step": 487}
{"train_info/time_between_train_steps": 0.005282163619995117, "step": 487}
{"info/global_step": 488, "train_info/time_within_train_step": 27.866729974746704, "step": 488}
{"train_info/time_between_train_steps": 0.0051441192626953125, "step": 488}
{"info/global_step": 489, "train_info/time_within_train_step": 27.67479157447815, "step": 489}
{"train_info/time_between_train_steps": 0.0051004886627197266, "step": 489}
{"info/global_step": 490, "train_info/time_within_train_step": 27.8334903717041, "step": 490}
{"train_info/time_between_train_steps": 0.005152463912963867, "step": 490}
{"info/global_step": 491, "train_info/time_within_train_step": 27.793882131576538, "step": 491}
{"train_info/time_between_train_steps": 0.005084991455078125, "step": 491}
{"info/global_step": 492, "train_info/time_within_train_step": 27.805104732513428, "step": 492}
{"train_info/time_between_train_steps": 0.00496673583984375, "step": 492}
{"info/global_step": 493, "train_info/time_within_train_step": 27.720075845718384, "step": 493}
{"train_info/time_between_train_steps": 0.007458686828613281, "step": 493}
{"info/global_step": 494, "train_info/time_within_train_step": 27.76487708091736, "step": 494}
{"train_info/time_between_train_steps": 0.0051152706146240234, "step": 494}
{"info/global_step": 495, "train_info/time_within_train_step": 27.687869548797607, "step": 495}
{"train_info/time_between_train_steps": 0.009567737579345703, "step": 495}
{"info/global_step": 496, "train_info/time_within_train_step": 27.677684783935547, "step": 496}
{"train_info/time_between_train_steps": 0.008967399597167969, "step": 496}
{"info/global_step": 497, "train_info/time_within_train_step": 27.76382803916931, "step": 497}
{"train_info/time_between_train_steps": 0.0049207210540771484, "step": 497}
{"info/global_step": 498, "train_info/time_within_train_step": 27.669023275375366, "step": 498}
{"train_info/time_between_train_steps": 0.005078315734863281, "step": 498}
{"info/global_step": 499, "train_info/time_within_train_step": 27.763712882995605, "step": 499}
{"train_info/time_between_train_steps": 0.004914760589599609, "step": 499}
{"info/global_step": 500, "train_info/time_within_train_step": 27.672534942626953, "step": 500}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740838777, "_runtime": 14726}, "step": 500}
{"logs": {"train/loss": 3.941, "train/learning_rate": 0.00038888888888888887, "train/epoch": 18.01, "_timestamp": 1740838777, "_runtime": 14726}, "step": 500}
{"train_info/time_between_train_steps": 61.851787090301514, "step": 500}
{"info/global_step": 501, "train_info/time_within_train_step": 28.538471460342407, "step": 501}
{"train_info/time_between_train_steps": 0.004990816116333008, "step": 501}
{"info/global_step": 502, "train_info/time_within_train_step": 27.690359354019165, "step": 502}
{"train_info/time_between_train_steps": 0.0049610137939453125, "step": 502}
{"info/global_step": 503, "train_info/time_within_train_step": 27.679474353790283, "step": 503}
{"train_info/time_between_train_steps": 0.010022878646850586, "step": 503}
{"info/global_step": 504, "train_info/time_within_train_step": 27.675956964492798, "step": 504}
{"train_info/time_between_train_steps": 0.004946708679199219, "step": 504}
{"info/global_step": 505, "train_info/time_within_train_step": 27.671958684921265, "step": 505}
{"train_info/time_between_train_steps": 0.004989147186279297, "step": 505}
{"info/global_step": 506, "train_info/time_within_train_step": 27.67660617828369, "step": 506}
{"train_info/time_between_train_steps": 0.004991054534912109, "step": 506}
{"info/global_step": 507, "train_info/time_within_train_step": 27.67815065383911, "step": 507}
{"train_info/time_between_train_steps": 0.006908893585205078, "step": 507}
{"info/global_step": 508, "train_info/time_within_train_step": 27.69458818435669, "step": 508}
{"train_info/time_between_train_steps": 0.007827520370483398, "step": 508}
{"info/global_step": 509, "train_info/time_within_train_step": 27.685293912887573, "step": 509}
{"train_info/time_between_train_steps": 0.005198240280151367, "step": 509}
{"info/global_step": 510, "train_info/time_within_train_step": 27.671449661254883, "step": 510}
{"train_info/time_between_train_steps": 0.008224964141845703, "step": 510}
{"info/global_step": 511, "train_info/time_within_train_step": 27.68022847175598, "step": 511}
{"train_info/time_between_train_steps": 0.0051076412200927734, "step": 511}
{"info/global_step": 512, "train_info/time_within_train_step": 27.683968544006348, "step": 512}
{"train_info/time_between_train_steps": 0.005418539047241211, "step": 512}
{"info/global_step": 513, "train_info/time_within_train_step": 27.695680379867554, "step": 513}
{"train_info/time_between_train_steps": 0.005377531051635742, "step": 513}
{"train_info/time_between_train_steps": 29.939750909805298, "step": 513}
{"info/global_step": 514, "train_info/time_within_train_step": 27.774749040603638, "step": 514}
{"train_info/time_between_train_steps": 0.009954452514648438, "step": 514}
{"info/global_step": 515, "train_info/time_within_train_step": 27.82589077949524, "step": 515}
{"train_info/time_between_train_steps": 0.00507044792175293, "step": 515}
{"info/global_step": 516, "train_info/time_within_train_step": 27.692161798477173, "step": 516}
{"train_info/time_between_train_steps": 0.005224466323852539, "step": 516}
{"info/global_step": 517, "train_info/time_within_train_step": 27.851133823394775, "step": 517}
{"train_info/time_between_train_steps": 0.005154848098754883, "step": 517}
{"info/global_step": 518, "train_info/time_within_train_step": 27.709155559539795, "step": 518}
{"train_info/time_between_train_steps": 0.005364418029785156, "step": 518}
{"info/global_step": 519, "train_info/time_within_train_step": 27.838502407073975, "step": 519}
{"train_info/time_between_train_steps": 0.0062253475189208984, "step": 519}
{"info/global_step": 520, "train_info/time_within_train_step": 27.6978440284729, "step": 520}
{"train_info/time_between_train_steps": 0.005019426345825195, "step": 520}
{"info/global_step": 521, "train_info/time_within_train_step": 27.766270399093628, "step": 521}
{"train_info/time_between_train_steps": 0.005234718322753906, "step": 521}
{"info/global_step": 522, "train_info/time_within_train_step": 27.721823930740356, "step": 522}
{"train_info/time_between_train_steps": 0.004953145980834961, "step": 522}
{"info/global_step": 523, "train_info/time_within_train_step": 27.66607689857483, "step": 523}
{"train_info/time_between_train_steps": 0.004929542541503906, "step": 523}
{"info/global_step": 524, "train_info/time_within_train_step": 27.670429944992065, "step": 524}
{"train_info/time_between_train_steps": 0.004975318908691406, "step": 524}
{"info/global_step": 525, "train_info/time_within_train_step": 27.68411612510681, "step": 525}
{"train_info/time_between_train_steps": 0.004883766174316406, "step": 525}
{"info/global_step": 526, "train_info/time_within_train_step": 27.74719214439392, "step": 526}
{"train_info/time_between_train_steps": 0.005048036575317383, "step": 526}
{"info/global_step": 527, "train_info/time_within_train_step": 27.733570098876953, "step": 527}
{"train_info/time_between_train_steps": 0.00487208366394043, "step": 527}
{"info/global_step": 528, "train_info/time_within_train_step": 27.760092735290527, "step": 528}
{"train_info/time_between_train_steps": 0.0050013065338134766, "step": 528}
{"info/global_step": 529, "train_info/time_within_train_step": 27.797242164611816, "step": 529}
{"train_info/time_between_train_steps": 0.0054492950439453125, "step": 529}
{"info/global_step": 530, "train_info/time_within_train_step": 27.667036294937134, "step": 530}
{"train_info/time_between_train_steps": 0.004889011383056641, "step": 530}
{"info/global_step": 531, "train_info/time_within_train_step": 27.669853925704956, "step": 531}
{"train_info/time_between_train_steps": 0.005079984664916992, "step": 531}
{"info/global_step": 532, "train_info/time_within_train_step": 27.67752194404602, "step": 532}
{"train_info/time_between_train_steps": 0.006651878356933594, "step": 532}
{"info/global_step": 533, "train_info/time_within_train_step": 27.71123194694519, "step": 533}
{"train_info/time_between_train_steps": 0.004915952682495117, "step": 533}
{"info/global_step": 534, "train_info/time_within_train_step": 27.678771257400513, "step": 534}
{"train_info/time_between_train_steps": 0.005084037780761719, "step": 534}
{"info/global_step": 535, "train_info/time_within_train_step": 27.67933440208435, "step": 535}
{"train_info/time_between_train_steps": 0.009957551956176758, "step": 535}
{"info/global_step": 536, "train_info/time_within_train_step": 27.698485136032104, "step": 536}
{"train_info/time_between_train_steps": 0.0051653385162353516, "step": 536}
{"info/global_step": 537, "train_info/time_within_train_step": 27.695810317993164, "step": 537}
{"train_info/time_between_train_steps": 0.008214950561523438, "step": 537}
{"info/global_step": 538, "train_info/time_within_train_step": 27.695643186569214, "step": 538}
{"train_info/time_between_train_steps": 0.005135297775268555, "step": 538}
{"info/global_step": 539, "train_info/time_within_train_step": 27.757988452911377, "step": 539}
{"train_info/time_between_train_steps": 0.005369663238525391, "step": 539}
{"info/global_step": 540, "train_info/time_within_train_step": 27.717520475387573, "step": 540}
{"train_info/time_between_train_steps": 0.010320186614990234, "step": 540}
{"train_info/time_between_train_steps": 37.21029734611511, "step": 540}
{"info/global_step": 541, "train_info/time_within_train_step": 28.03437066078186, "step": 541}
{"train_info/time_between_train_steps": 0.005332469940185547, "step": 541}
{"info/global_step": 542, "train_info/time_within_train_step": 31.623679637908936, "step": 542}
{"train_info/time_between_train_steps": 0.005580425262451172, "step": 542}
{"info/global_step": 543, "train_info/time_within_train_step": 28.279159784317017, "step": 543}
{"train_info/time_between_train_steps": 0.010154485702514648, "step": 543}
{"info/global_step": 544, "train_info/time_within_train_step": 27.9926176071167, "step": 544}
{"train_info/time_between_train_steps": 0.005124092102050781, "step": 544}
{"info/global_step": 545, "train_info/time_within_train_step": 27.67764401435852, "step": 545}
{"train_info/time_between_train_steps": 0.005307674407958984, "step": 545}
{"info/global_step": 546, "train_info/time_within_train_step": 27.866935968399048, "step": 546}
{"train_info/time_between_train_steps": 0.005261898040771484, "step": 546}
{"info/global_step": 547, "train_info/time_within_train_step": 27.680941104888916, "step": 547}
{"train_info/time_between_train_steps": 0.005048990249633789, "step": 547}
{"info/global_step": 548, "train_info/time_within_train_step": 27.812732219696045, "step": 548}
{"train_info/time_between_train_steps": 0.0051500797271728516, "step": 548}
{"info/global_step": 549, "train_info/time_within_train_step": 27.68227219581604, "step": 549}
{"train_info/time_between_train_steps": 0.004887580871582031, "step": 549}
{"info/global_step": 550, "train_info/time_within_train_step": 27.70200252532959, "step": 550}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740840303, "_runtime": 16252}, "step": 550}
{"logs": {"train/loss": 3.826, "train/learning_rate": 0.0003611111111111111, "train/epoch": 20.01, "_timestamp": 1740840303, "_runtime": 16252}, "step": 550}
{"train_info/time_between_train_steps": 0.0297696590423584, "step": 550}
{"info/global_step": 551, "train_info/time_within_train_step": 27.68769860267639, "step": 551}
{"train_info/time_between_train_steps": 0.0049915313720703125, "step": 551}
{"info/global_step": 552, "train_info/time_within_train_step": 27.68511652946472, "step": 552}
{"train_info/time_between_train_steps": 0.004961967468261719, "step": 552}
{"info/global_step": 553, "train_info/time_within_train_step": 27.735146522521973, "step": 553}
{"train_info/time_between_train_steps": 0.005128145217895508, "step": 553}
{"info/global_step": 554, "train_info/time_within_train_step": 27.677552700042725, "step": 554}
{"train_info/time_between_train_steps": 0.004854917526245117, "step": 554}
{"info/global_step": 555, "train_info/time_within_train_step": 27.718973398208618, "step": 555}
{"train_info/time_between_train_steps": 0.005406379699707031, "step": 555}
{"info/global_step": 556, "train_info/time_within_train_step": 27.689841270446777, "step": 556}
{"train_info/time_between_train_steps": 0.0051691532135009766, "step": 556}
{"info/global_step": 557, "train_info/time_within_train_step": 27.731921434402466, "step": 557}
{"train_info/time_between_train_steps": 0.005002260208129883, "step": 557}
{"info/global_step": 558, "train_info/time_within_train_step": 27.695067644119263, "step": 558}
{"train_info/time_between_train_steps": 0.00508427619934082, "step": 558}
{"info/global_step": 559, "train_info/time_within_train_step": 27.748209238052368, "step": 559}
{"train_info/time_between_train_steps": 0.004982471466064453, "step": 559}
{"info/global_step": 560, "train_info/time_within_train_step": 27.767049312591553, "step": 560}
{"train_info/time_between_train_steps": 0.005130767822265625, "step": 560}
{"info/global_step": 561, "train_info/time_within_train_step": 27.674967765808105, "step": 561}
{"train_info/time_between_train_steps": 0.005042552947998047, "step": 561}
{"info/global_step": 562, "train_info/time_within_train_step": 27.689786911010742, "step": 562}
{"train_info/time_between_train_steps": 0.0051746368408203125, "step": 562}
{"info/global_step": 563, "train_info/time_within_train_step": 27.697322845458984, "step": 563}
{"train_info/time_between_train_steps": 0.005582571029663086, "step": 563}
{"info/global_step": 564, "train_info/time_within_train_step": 27.712852001190186, "step": 564}
{"train_info/time_between_train_steps": 0.0050432682037353516, "step": 564}
{"info/global_step": 565, "train_info/time_within_train_step": 27.697511911392212, "step": 565}
{"train_info/time_between_train_steps": 0.0052607059478759766, "step": 565}
{"info/global_step": 566, "train_info/time_within_train_step": 27.689690113067627, "step": 566}
{"train_info/time_between_train_steps": 0.0052487850189208984, "step": 566}
{"info/global_step": 567, "train_info/time_within_train_step": 27.697678089141846, "step": 567}
{"train_info/time_between_train_steps": 0.005914211273193359, "step": 567}
{"train_info/time_between_train_steps": 29.885384798049927, "step": 567}
{"info/global_step": 568, "train_info/time_within_train_step": 27.664153575897217, "step": 568}
{"train_info/time_between_train_steps": 0.009563446044921875, "step": 568}
{"info/global_step": 569, "train_info/time_within_train_step": 27.828189849853516, "step": 569}
{"train_info/time_between_train_steps": 0.005131721496582031, "step": 569}
{"info/global_step": 570, "train_info/time_within_train_step": 27.694371223449707, "step": 570}
{"train_info/time_between_train_steps": 0.005155801773071289, "step": 570}
{"info/global_step": 571, "train_info/time_within_train_step": 27.818868160247803, "step": 571}
{"train_info/time_between_train_steps": 0.005113840103149414, "step": 571}
{"info/global_step": 572, "train_info/time_within_train_step": 27.68872094154358, "step": 572}
{"train_info/time_between_train_steps": 0.005194425582885742, "step": 572}
{"info/global_step": 573, "train_info/time_within_train_step": 27.789438247680664, "step": 573}
{"train_info/time_between_train_steps": 0.005086660385131836, "step": 573}
{"info/global_step": 574, "train_info/time_within_train_step": 27.773414134979248, "step": 574}
{"train_info/time_between_train_steps": 0.005383968353271484, "step": 574}
{"info/global_step": 575, "train_info/time_within_train_step": 27.775232553482056, "step": 575}
{"train_info/time_between_train_steps": 0.005170583724975586, "step": 575}
{"info/global_step": 576, "train_info/time_within_train_step": 27.695175170898438, "step": 576}
{"train_info/time_between_train_steps": 0.004993438720703125, "step": 576}
{"info/global_step": 577, "train_info/time_within_train_step": 27.665024995803833, "step": 577}
{"train_info/time_between_train_steps": 0.004942178726196289, "step": 577}
{"info/global_step": 578, "train_info/time_within_train_step": 27.71666145324707, "step": 578}
{"train_info/time_between_train_steps": 0.009944915771484375, "step": 578}
{"info/global_step": 579, "train_info/time_within_train_step": 27.67567729949951, "step": 579}
{"train_info/time_between_train_steps": 0.004936933517456055, "step": 579}
{"info/global_step": 580, "train_info/time_within_train_step": 27.706153631210327, "step": 580}
{"train_info/time_between_train_steps": 0.005031585693359375, "step": 580}
{"info/global_step": 581, "train_info/time_within_train_step": 27.674498319625854, "step": 581}
{"train_info/time_between_train_steps": 0.004955768585205078, "step": 581}
{"info/global_step": 582, "train_info/time_within_train_step": 27.683513164520264, "step": 582}
{"train_info/time_between_train_steps": 0.005001544952392578, "step": 582}
{"info/global_step": 583, "train_info/time_within_train_step": 27.67023468017578, "step": 583}
{"train_info/time_between_train_steps": 0.005039691925048828, "step": 583}
{"info/global_step": 584, "train_info/time_within_train_step": 27.689181804656982, "step": 584}
{"train_info/time_between_train_steps": 0.004988908767700195, "step": 584}
{"info/global_step": 585, "train_info/time_within_train_step": 27.685707092285156, "step": 585}
{"train_info/time_between_train_steps": 0.0050334930419921875, "step": 585}
{"info/global_step": 586, "train_info/time_within_train_step": 27.761868238449097, "step": 586}
{"train_info/time_between_train_steps": 0.0049474239349365234, "step": 586}
{"info/global_step": 587, "train_info/time_within_train_step": 27.67378544807434, "step": 587}
{"train_info/time_between_train_steps": 0.0050318241119384766, "step": 587}
{"info/global_step": 588, "train_info/time_within_train_step": 27.671586513519287, "step": 588}
{"train_info/time_between_train_steps": 0.004948854446411133, "step": 588}
{"info/global_step": 589, "train_info/time_within_train_step": 27.667776584625244, "step": 589}
{"train_info/time_between_train_steps": 0.0050051212310791016, "step": 589}
{"info/global_step": 590, "train_info/time_within_train_step": 27.782241582870483, "step": 590}
{"train_info/time_between_train_steps": 0.0052356719970703125, "step": 590}
{"info/global_step": 591, "train_info/time_within_train_step": 27.716526746749878, "step": 591}
{"train_info/time_between_train_steps": 0.005022764205932617, "step": 591}
{"info/global_step": 592, "train_info/time_within_train_step": 27.67828631401062, "step": 592}
{"train_info/time_between_train_steps": 0.005151033401489258, "step": 592}
{"info/global_step": 593, "train_info/time_within_train_step": 27.684534311294556, "step": 593}
{"train_info/time_between_train_steps": 0.005425691604614258, "step": 593}
{"info/global_step": 594, "train_info/time_within_train_step": 27.729870796203613, "step": 594}
{"train_info/time_between_train_steps": 0.0054607391357421875, "step": 594}
{"train_info/time_between_train_steps": 30.103595495224, "step": 594}
{"info/global_step": 595, "train_info/time_within_train_step": 27.685643196105957, "step": 595}
{"train_info/time_between_train_steps": 0.004884004592895508, "step": 595}
{"info/global_step": 596, "train_info/time_within_train_step": 27.81301736831665, "step": 596}
{"train_info/time_between_train_steps": 0.005746603012084961, "step": 596}
{"info/global_step": 597, "train_info/time_within_train_step": 27.696244478225708, "step": 597}
{"train_info/time_between_train_steps": 0.005352973937988281, "step": 597}
{"info/global_step": 598, "train_info/time_within_train_step": 27.853381633758545, "step": 598}
{"train_info/time_between_train_steps": 0.0050814151763916016, "step": 598}
{"info/global_step": 599, "train_info/time_within_train_step": 27.68786597251892, "step": 599}
{"train_info/time_between_train_steps": 0.005131959915161133, "step": 599}
{"info/global_step": 600, "train_info/time_within_train_step": 27.846378564834595, "step": 600}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740841750, "_runtime": 17699}, "step": 600}
{"logs": {"train/loss": 3.7276, "train/learning_rate": 0.0003333333333333333, "train/epoch": 22.0, "_timestamp": 1740841750, "_runtime": 17699}, "step": 600}
{"train_info/time_between_train_steps": 57.27272868156433, "step": 600}
{"info/global_step": 601, "train_info/time_within_train_step": 28.26378345489502, "step": 601}
{"train_info/time_between_train_steps": 0.015015602111816406, "step": 601}
{"info/global_step": 602, "train_info/time_within_train_step": 28.025111436843872, "step": 602}
{"train_info/time_between_train_steps": 0.005140781402587891, "step": 602}
{"info/global_step": 603, "train_info/time_within_train_step": 27.702581644058228, "step": 603}
{"train_info/time_between_train_steps": 0.004887104034423828, "step": 603}
{"info/global_step": 604, "train_info/time_within_train_step": 27.670287132263184, "step": 604}
{"train_info/time_between_train_steps": 0.004877805709838867, "step": 604}
{"info/global_step": 605, "train_info/time_within_train_step": 27.784454822540283, "step": 605}
{"train_info/time_between_train_steps": 0.0052032470703125, "step": 605}
{"info/global_step": 606, "train_info/time_within_train_step": 27.664655208587646, "step": 606}
{"train_info/time_between_train_steps": 0.009766101837158203, "step": 606}
{"info/global_step": 607, "train_info/time_within_train_step": 27.734017848968506, "step": 607}
{"train_info/time_between_train_steps": 0.005088329315185547, "step": 607}
{"info/global_step": 608, "train_info/time_within_train_step": 27.68215036392212, "step": 608}
{"train_info/time_between_train_steps": 0.004853963851928711, "step": 608}
{"info/global_step": 609, "train_info/time_within_train_step": 27.725008249282837, "step": 609}
{"train_info/time_between_train_steps": 0.005091190338134766, "step": 609}
{"info/global_step": 610, "train_info/time_within_train_step": 27.675264358520508, "step": 610}
{"train_info/time_between_train_steps": 0.005095243453979492, "step": 610}
{"info/global_step": 611, "train_info/time_within_train_step": 27.73589515686035, "step": 611}
{"train_info/time_between_train_steps": 0.004917144775390625, "step": 611}
{"info/global_step": 612, "train_info/time_within_train_step": 27.689215898513794, "step": 612}
{"train_info/time_between_train_steps": 0.005128383636474609, "step": 612}
{"info/global_step": 613, "train_info/time_within_train_step": 27.716068029403687, "step": 613}
{"train_info/time_between_train_steps": 0.004960775375366211, "step": 613}
{"info/global_step": 614, "train_info/time_within_train_step": 27.689669847488403, "step": 614}
{"train_info/time_between_train_steps": 0.004925727844238281, "step": 614}
{"info/global_step": 615, "train_info/time_within_train_step": 27.67919421195984, "step": 615}
{"train_info/time_between_train_steps": 0.0050737857818603516, "step": 615}
{"info/global_step": 616, "train_info/time_within_train_step": 27.668785333633423, "step": 616}
{"train_info/time_between_train_steps": 0.005002260208129883, "step": 616}
{"info/global_step": 617, "train_info/time_within_train_step": 27.691757440567017, "step": 617}
{"train_info/time_between_train_steps": 0.005064249038696289, "step": 617}
{"info/global_step": 618, "train_info/time_within_train_step": 27.677024364471436, "step": 618}
{"train_info/time_between_train_steps": 0.005033254623413086, "step": 618}
{"info/global_step": 619, "train_info/time_within_train_step": 27.684285163879395, "step": 619}
{"train_info/time_between_train_steps": 0.005181074142456055, "step": 619}
{"info/global_step": 620, "train_info/time_within_train_step": 28.08976101875305, "step": 620}
{"train_info/time_between_train_steps": 0.010335206985473633, "step": 620}
{"info/global_step": 621, "train_info/time_within_train_step": 27.692357063293457, "step": 621}
{"train_info/time_between_train_steps": 0.005265712738037109, "step": 621}
{"train_info/time_between_train_steps": 29.709611654281616, "step": 621}
{"info/global_step": 622, "train_info/time_within_train_step": 27.78045415878296, "step": 622}
{"train_info/time_between_train_steps": 0.006834745407104492, "step": 622}
{"info/global_step": 623, "train_info/time_within_train_step": 27.885828971862793, "step": 623}
{"train_info/time_between_train_steps": 0.005908966064453125, "step": 623}
{"info/global_step": 624, "train_info/time_within_train_step": 27.710910081863403, "step": 624}
{"train_info/time_between_train_steps": 0.005643606185913086, "step": 624}
{"info/global_step": 625, "train_info/time_within_train_step": 27.92944598197937, "step": 625}
{"train_info/time_between_train_steps": 0.005697727203369141, "step": 625}
{"info/global_step": 626, "train_info/time_within_train_step": 27.84441876411438, "step": 626}
{"train_info/time_between_train_steps": 0.005472421646118164, "step": 626}
{"info/global_step": 627, "train_info/time_within_train_step": 27.876531839370728, "step": 627}
{"train_info/time_between_train_steps": 0.005527973175048828, "step": 627}
{"info/global_step": 628, "train_info/time_within_train_step": 27.73575735092163, "step": 628}
{"train_info/time_between_train_steps": 0.0057964324951171875, "step": 628}
{"info/global_step": 629, "train_info/time_within_train_step": 27.7913076877594, "step": 629}
{"train_info/time_between_train_steps": 0.005209445953369141, "step": 629}
{"info/global_step": 630, "train_info/time_within_train_step": 27.705824613571167, "step": 630}
{"train_info/time_between_train_steps": 0.00518488883972168, "step": 630}
{"info/global_step": 631, "train_info/time_within_train_step": 27.687830924987793, "step": 631}
{"train_info/time_between_train_steps": 0.005135059356689453, "step": 631}
{"info/global_step": 632, "train_info/time_within_train_step": 27.727758407592773, "step": 632}
{"train_info/time_between_train_steps": 0.010061264038085938, "step": 632}
{"info/global_step": 633, "train_info/time_within_train_step": 27.69417929649353, "step": 633}
{"train_info/time_between_train_steps": 0.004924297332763672, "step": 633}
{"info/global_step": 634, "train_info/time_within_train_step": 27.676318645477295, "step": 634}
{"train_info/time_between_train_steps": 0.00527644157409668, "step": 634}
{"info/global_step": 635, "train_info/time_within_train_step": 27.769784212112427, "step": 635}
{"train_info/time_between_train_steps": 0.005064725875854492, "step": 635}
{"info/global_step": 636, "train_info/time_within_train_step": 27.722774744033813, "step": 636}
{"train_info/time_between_train_steps": 0.005045652389526367, "step": 636}
{"info/global_step": 637, "train_info/time_within_train_step": 27.686607360839844, "step": 637}
{"train_info/time_between_train_steps": 0.005286455154418945, "step": 637}
{"info/global_step": 638, "train_info/time_within_train_step": 27.671982049942017, "step": 638}
{"train_info/time_between_train_steps": 0.005297183990478516, "step": 638}
{"info/global_step": 639, "train_info/time_within_train_step": 27.909485578536987, "step": 639}
{"train_info/time_between_train_steps": 0.005059242248535156, "step": 639}
{"info/global_step": 640, "train_info/time_within_train_step": 27.862473249435425, "step": 640}
{"train_info/time_between_train_steps": 0.005169868469238281, "step": 640}
{"info/global_step": 641, "train_info/time_within_train_step": 27.673311710357666, "step": 641}
{"train_info/time_between_train_steps": 0.005018949508666992, "step": 641}
{"info/global_step": 642, "train_info/time_within_train_step": 27.68473792076111, "step": 642}
{"train_info/time_between_train_steps": 0.005134105682373047, "step": 642}
{"info/global_step": 643, "train_info/time_within_train_step": 27.678916215896606, "step": 643}
{"train_info/time_between_train_steps": 0.005121469497680664, "step": 643}
{"info/global_step": 644, "train_info/time_within_train_step": 27.680357217788696, "step": 644}
{"train_info/time_between_train_steps": 0.00513768196105957, "step": 644}
{"info/global_step": 645, "train_info/time_within_train_step": 27.68493127822876, "step": 645}
{"train_info/time_between_train_steps": 0.0050656795501708984, "step": 645}
{"info/global_step": 646, "train_info/time_within_train_step": 27.70220136642456, "step": 646}
{"train_info/time_between_train_steps": 0.00519108772277832, "step": 646}
{"info/global_step": 647, "train_info/time_within_train_step": 27.686874389648438, "step": 647}
{"train_info/time_between_train_steps": 0.005599021911621094, "step": 647}
{"info/global_step": 648, "train_info/time_within_train_step": 27.701208353042603, "step": 648}
{"train_info/time_between_train_steps": 0.00643157958984375, "step": 648}
{"train_info/time_between_train_steps": 29.752322912216187, "step": 648}
{"info/global_step": 649, "train_info/time_within_train_step": 27.783902168273926, "step": 649}
{"train_info/time_between_train_steps": 0.0048749446868896484, "step": 649}
{"info/global_step": 650, "train_info/time_within_train_step": 27.81309223175049, "step": 650}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740843257, "_runtime": 19206}, "step": 650}
{"logs": {"train/loss": 3.6415, "train/learning_rate": 0.00030555555555555555, "train/epoch": 24.0, "_timestamp": 1740843257, "_runtime": 19206}, "step": 650}
{"train_info/time_between_train_steps": 0.02568840980529785, "step": 650}
{"info/global_step": 651, "train_info/time_within_train_step": 27.699673414230347, "step": 651}
{"train_info/time_between_train_steps": 0.0052835941314697266, "step": 651}
{"info/global_step": 652, "train_info/time_within_train_step": 27.877374172210693, "step": 652}
{"train_info/time_between_train_steps": 0.005191802978515625, "step": 652}
{"info/global_step": 653, "train_info/time_within_train_step": 27.68099308013916, "step": 653}
{"train_info/time_between_train_steps": 0.005148887634277344, "step": 653}
{"info/global_step": 654, "train_info/time_within_train_step": 27.812268018722534, "step": 654}
{"train_info/time_between_train_steps": 0.005180835723876953, "step": 654}
{"info/global_step": 655, "train_info/time_within_train_step": 27.721638679504395, "step": 655}
{"train_info/time_between_train_steps": 0.005434989929199219, "step": 655}
{"info/global_step": 656, "train_info/time_within_train_step": 27.73462200164795, "step": 656}
{"train_info/time_between_train_steps": 0.0062596797943115234, "step": 656}
{"info/global_step": 657, "train_info/time_within_train_step": 27.692196130752563, "step": 657}
{"train_info/time_between_train_steps": 0.005011796951293945, "step": 657}
{"info/global_step": 658, "train_info/time_within_train_step": 27.66310429573059, "step": 658}
{"train_info/time_between_train_steps": 0.004877567291259766, "step": 658}
{"info/global_step": 659, "train_info/time_within_train_step": 27.666418075561523, "step": 659}
{"train_info/time_between_train_steps": 0.005001544952392578, "step": 659}
{"info/global_step": 660, "train_info/time_within_train_step": 27.677677869796753, "step": 660}
{"train_info/time_between_train_steps": 0.004837512969970703, "step": 660}
{"info/global_step": 661, "train_info/time_within_train_step": 27.741764783859253, "step": 661}
{"train_info/time_between_train_steps": 0.0049228668212890625, "step": 661}
{"info/global_step": 662, "train_info/time_within_train_step": 27.67442560195923, "step": 662}
{"train_info/time_between_train_steps": 0.005023479461669922, "step": 662}
{"info/global_step": 663, "train_info/time_within_train_step": 27.667781829833984, "step": 663}
{"train_info/time_between_train_steps": 0.0050351619720458984, "step": 663}
{"info/global_step": 664, "train_info/time_within_train_step": 27.668005228042603, "step": 664}
{"train_info/time_between_train_steps": 0.0049610137939453125, "step": 664}
{"info/global_step": 665, "train_info/time_within_train_step": 27.79037094116211, "step": 665}
{"train_info/time_between_train_steps": 0.0048980712890625, "step": 665}
{"info/global_step": 666, "train_info/time_within_train_step": 27.69136643409729, "step": 666}
{"train_info/time_between_train_steps": 0.0054547786712646484, "step": 666}
{"info/global_step": 667, "train_info/time_within_train_step": 27.680794954299927, "step": 667}
{"train_info/time_between_train_steps": 0.00494384765625, "step": 667}
{"info/global_step": 668, "train_info/time_within_train_step": 27.682769298553467, "step": 668}
{"train_info/time_between_train_steps": 0.005079030990600586, "step": 668}
{"info/global_step": 669, "train_info/time_within_train_step": 27.683570861816406, "step": 669}
{"train_info/time_between_train_steps": 0.005063772201538086, "step": 669}
{"info/global_step": 670, "train_info/time_within_train_step": 27.69808602333069, "step": 670}
{"train_info/time_between_train_steps": 0.005298137664794922, "step": 670}
{"info/global_step": 671, "train_info/time_within_train_step": 27.71128487586975, "step": 671}
{"train_info/time_between_train_steps": 0.0050067901611328125, "step": 671}
{"info/global_step": 672, "train_info/time_within_train_step": 27.68874764442444, "step": 672}
{"train_info/time_between_train_steps": 0.0051081180572509766, "step": 672}
{"info/global_step": 673, "train_info/time_within_train_step": 27.683480739593506, "step": 673}
{"train_info/time_between_train_steps": 0.005063772201538086, "step": 673}
{"info/global_step": 674, "train_info/time_within_train_step": 27.74240732192993, "step": 674}
{"train_info/time_between_train_steps": 0.005105018615722656, "step": 674}
{"info/global_step": 675, "train_info/time_within_train_step": 27.712934494018555, "step": 675}
{"train_info/time_between_train_steps": 0.005464315414428711, "step": 675}
{"train_info/time_between_train_steps": 29.910584211349487, "step": 675}
{"info/global_step": 676, "train_info/time_within_train_step": 27.698601007461548, "step": 676}
{"train_info/time_between_train_steps": 0.004916191101074219, "step": 676}
{"info/global_step": 677, "train_info/time_within_train_step": 27.857526302337646, "step": 677}
{"train_info/time_between_train_steps": 0.004795551300048828, "step": 677}
{"info/global_step": 678, "train_info/time_within_train_step": 27.68055295944214, "step": 678}
{"train_info/time_between_train_steps": 0.0048177242279052734, "step": 678}
{"info/global_step": 679, "train_info/time_within_train_step": 27.866209745407104, "step": 679}
{"train_info/time_between_train_steps": 0.005165815353393555, "step": 679}
{"info/global_step": 680, "train_info/time_within_train_step": 27.823453664779663, "step": 680}
{"train_info/time_between_train_steps": 0.005391120910644531, "step": 680}
{"info/global_step": 681, "train_info/time_within_train_step": 27.827982425689697, "step": 681}
{"train_info/time_between_train_steps": 0.005140066146850586, "step": 681}
{"info/global_step": 682, "train_info/time_within_train_step": 27.697964668273926, "step": 682}
{"train_info/time_between_train_steps": 0.005079030990600586, "step": 682}
{"info/global_step": 683, "train_info/time_within_train_step": 27.75378727912903, "step": 683}
{"train_info/time_between_train_steps": 0.00513458251953125, "step": 683}
{"info/global_step": 684, "train_info/time_within_train_step": 27.709417581558228, "step": 684}
{"train_info/time_between_train_steps": 0.005217552185058594, "step": 684}
{"info/global_step": 685, "train_info/time_within_train_step": 27.68973660469055, "step": 685}
{"train_info/time_between_train_steps": 0.005190134048461914, "step": 685}
{"info/global_step": 686, "train_info/time_within_train_step": 27.746852159500122, "step": 686}
{"train_info/time_between_train_steps": 0.015586614608764648, "step": 686}
{"info/global_step": 687, "train_info/time_within_train_step": 27.719690322875977, "step": 687}
{"train_info/time_between_train_steps": 0.00505828857421875, "step": 687}
{"info/global_step": 688, "train_info/time_within_train_step": 27.69042706489563, "step": 688}
{"train_info/time_between_train_steps": 0.005038261413574219, "step": 688}
{"info/global_step": 689, "train_info/time_within_train_step": 27.678998231887817, "step": 689}
{"train_info/time_between_train_steps": 0.0060541629791259766, "step": 689}
{"info/global_step": 690, "train_info/time_within_train_step": 27.75462532043457, "step": 690}
{"train_info/time_between_train_steps": 0.004940032958984375, "step": 690}
{"info/global_step": 691, "train_info/time_within_train_step": 27.70759153366089, "step": 691}
{"train_info/time_between_train_steps": 0.005103349685668945, "step": 691}
{"info/global_step": 692, "train_info/time_within_train_step": 27.72522258758545, "step": 692}
{"train_info/time_between_train_steps": 0.005373477935791016, "step": 692}
{"info/global_step": 693, "train_info/time_within_train_step": 27.6722252368927, "step": 693}
{"train_info/time_between_train_steps": 0.004964351654052734, "step": 693}
{"info/global_step": 694, "train_info/time_within_train_step": 27.697333097457886, "step": 694}
{"train_info/time_between_train_steps": 0.004899740219116211, "step": 694}
{"info/global_step": 695, "train_info/time_within_train_step": 27.803155660629272, "step": 695}
{"train_info/time_between_train_steps": 0.00487828254699707, "step": 695}
{"info/global_step": 696, "train_info/time_within_train_step": 27.68677592277527, "step": 696}
{"train_info/time_between_train_steps": 0.005341768264770508, "step": 696}
{"info/global_step": 697, "train_info/time_within_train_step": 27.683055639266968, "step": 697}
{"train_info/time_between_train_steps": 0.0053369998931884766, "step": 697}
{"info/global_step": 698, "train_info/time_within_train_step": 27.698196411132812, "step": 698}
{"train_info/time_between_train_steps": 0.004990816116333008, "step": 698}
{"info/global_step": 699, "train_info/time_within_train_step": 27.703386068344116, "step": 699}
{"train_info/time_between_train_steps": 0.00511622428894043, "step": 699}
{"info/global_step": 700, "train_info/time_within_train_step": 27.685921669006348, "step": 700}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740844675, "_runtime": 20624}, "step": 700}
{"logs": {"train/loss": 3.4952, "train/learning_rate": 0.0002777777777777778, "train/epoch": 25.02, "_timestamp": 1740844675, "_runtime": 20624}, "step": 700}
{"train_info/time_between_train_steps": 205.7708718776703, "step": 700}
{"info/global_step": 701, "train_info/time_within_train_step": 28.254541635513306, "step": 701}
{"train_info/time_between_train_steps": 0.00508427619934082, "step": 701}
{"info/global_step": 702, "train_info/time_within_train_step": 27.70797324180603, "step": 702}
{"train_info/time_between_train_steps": 0.0053348541259765625, "step": 702}
{"train_info/time_between_train_steps": 30.087986946105957, "step": 702}
{"info/global_step": 703, "train_info/time_within_train_step": 27.708192348480225, "step": 703}
{"train_info/time_between_train_steps": 0.005136728286743164, "step": 703}
{"info/global_step": 704, "train_info/time_within_train_step": 27.84008288383484, "step": 704}
{"train_info/time_between_train_steps": 0.005040407180786133, "step": 704}
{"info/global_step": 705, "train_info/time_within_train_step": 27.746328830718994, "step": 705}
{"train_info/time_between_train_steps": 0.00483250617980957, "step": 705}
{"info/global_step": 706, "train_info/time_within_train_step": 27.84048843383789, "step": 706}
{"train_info/time_between_train_steps": 0.005275249481201172, "step": 706}
{"info/global_step": 707, "train_info/time_within_train_step": 27.735986471176147, "step": 707}
{"train_info/time_between_train_steps": 0.0054204463958740234, "step": 707}
{"info/global_step": 708, "train_info/time_within_train_step": 27.886640310287476, "step": 708}
{"train_info/time_between_train_steps": 0.005254030227661133, "step": 708}
{"info/global_step": 709, "train_info/time_within_train_step": 27.687414407730103, "step": 709}
{"train_info/time_between_train_steps": 0.005116939544677734, "step": 709}
{"info/global_step": 710, "train_info/time_within_train_step": 27.858542442321777, "step": 710}
{"train_info/time_between_train_steps": 0.005039691925048828, "step": 710}
{"info/global_step": 711, "train_info/time_within_train_step": 27.702407121658325, "step": 711}
{"train_info/time_between_train_steps": 0.004914999008178711, "step": 711}
{"info/global_step": 712, "train_info/time_within_train_step": 27.722926139831543, "step": 712}
{"train_info/time_between_train_steps": 0.006056785583496094, "step": 712}
{"info/global_step": 713, "train_info/time_within_train_step": 27.683764457702637, "step": 713}
{"train_info/time_between_train_steps": 0.0052797794342041016, "step": 713}
{"info/global_step": 714, "train_info/time_within_train_step": 27.71592426300049, "step": 714}
{"train_info/time_between_train_steps": 0.004989147186279297, "step": 714}
{"info/global_step": 715, "train_info/time_within_train_step": 27.705907583236694, "step": 715}
{"train_info/time_between_train_steps": 0.0049211978912353516, "step": 715}
{"info/global_step": 716, "train_info/time_within_train_step": 27.700575590133667, "step": 716}
{"train_info/time_between_train_steps": 0.005867958068847656, "step": 716}
{"info/global_step": 717, "train_info/time_within_train_step": 27.699155807495117, "step": 717}
{"train_info/time_between_train_steps": 0.005313873291015625, "step": 717}
{"info/global_step": 718, "train_info/time_within_train_step": 27.73455286026001, "step": 718}
{"train_info/time_between_train_steps": 0.005024433135986328, "step": 718}
{"info/global_step": 719, "train_info/time_within_train_step": 27.68619132041931, "step": 719}
{"train_info/time_between_train_steps": 0.004867076873779297, "step": 719}
{"info/global_step": 720, "train_info/time_within_train_step": 27.702112674713135, "step": 720}
{"train_info/time_between_train_steps": 0.005155086517333984, "step": 720}
{"info/global_step": 721, "train_info/time_within_train_step": 27.748716831207275, "step": 721}
{"train_info/time_between_train_steps": 0.005070209503173828, "step": 721}
{"info/global_step": 722, "train_info/time_within_train_step": 27.686864852905273, "step": 722}
{"train_info/time_between_train_steps": 0.005057573318481445, "step": 722}
{"info/global_step": 723, "train_info/time_within_train_step": 27.681989908218384, "step": 723}
{"train_info/time_between_train_steps": 0.005129337310791016, "step": 723}
{"info/global_step": 724, "train_info/time_within_train_step": 27.71997308731079, "step": 724}
{"train_info/time_between_train_steps": 0.005264759063720703, "step": 724}
{"info/global_step": 725, "train_info/time_within_train_step": 27.709550142288208, "step": 725}
{"train_info/time_between_train_steps": 0.005185604095458984, "step": 725}
{"info/global_step": 726, "train_info/time_within_train_step": 27.773688316345215, "step": 726}
{"train_info/time_between_train_steps": 0.005421876907348633, "step": 726}
{"info/global_step": 727, "train_info/time_within_train_step": 27.723800897598267, "step": 727}
{"train_info/time_between_train_steps": 0.0050432682037353516, "step": 727}
{"info/global_step": 728, "train_info/time_within_train_step": 27.732863426208496, "step": 728}
{"train_info/time_between_train_steps": 0.0052280426025390625, "step": 728}
{"info/global_step": 729, "train_info/time_within_train_step": 27.782514333724976, "step": 729}
{"train_info/time_between_train_steps": 0.0053691864013671875, "step": 729}
{"train_info/time_between_train_steps": 29.764040231704712, "step": 729}
{"info/global_step": 730, "train_info/time_within_train_step": 31.10205841064453, "step": 730}
{"train_info/time_between_train_steps": 0.005063772201538086, "step": 730}
{"info/global_step": 731, "train_info/time_within_train_step": 28.25043773651123, "step": 731}
{"train_info/time_between_train_steps": 0.005301475524902344, "step": 731}
{"info/global_step": 732, "train_info/time_within_train_step": 30.852128505706787, "step": 732}
{"train_info/time_between_train_steps": 0.005167245864868164, "step": 732}
{"info/global_step": 733, "train_info/time_within_train_step": 28.004018783569336, "step": 733}
{"train_info/time_between_train_steps": 0.005093574523925781, "step": 733}
{"info/global_step": 734, "train_info/time_within_train_step": 27.715487718582153, "step": 734}
{"train_info/time_between_train_steps": 0.005473613739013672, "step": 734}
{"info/global_step": 735, "train_info/time_within_train_step": 27.825292348861694, "step": 735}
{"train_info/time_between_train_steps": 0.005259513854980469, "step": 735}
{"info/global_step": 736, "train_info/time_within_train_step": 27.698736667633057, "step": 736}
{"train_info/time_between_train_steps": 0.005049228668212891, "step": 736}
{"info/global_step": 737, "train_info/time_within_train_step": 27.772340059280396, "step": 737}
{"train_info/time_between_train_steps": 0.005064725875854492, "step": 737}
{"info/global_step": 738, "train_info/time_within_train_step": 27.728332042694092, "step": 738}
{"train_info/time_between_train_steps": 0.004832029342651367, "step": 738}
{"info/global_step": 739, "train_info/time_within_train_step": 27.731085777282715, "step": 739}
{"train_info/time_between_train_steps": 0.0048978328704833984, "step": 739}
{"info/global_step": 740, "train_info/time_within_train_step": 27.786435842514038, "step": 740}
{"train_info/time_between_train_steps": 0.00596928596496582, "step": 740}
{"info/global_step": 741, "train_info/time_within_train_step": 27.7187340259552, "step": 741}
{"train_info/time_between_train_steps": 0.0059778690338134766, "step": 741}
{"info/global_step": 742, "train_info/time_within_train_step": 27.711377382278442, "step": 742}
{"train_info/time_between_train_steps": 0.0050389766693115234, "step": 742}
{"info/global_step": 743, "train_info/time_within_train_step": 27.7295925617218, "step": 743}
{"train_info/time_between_train_steps": 0.004990816116333008, "step": 743}
{"info/global_step": 744, "train_info/time_within_train_step": 27.69840669631958, "step": 744}
{"train_info/time_between_train_steps": 0.0051081180572509766, "step": 744}
{"info/global_step": 745, "train_info/time_within_train_step": 27.721356868743896, "step": 745}
{"train_info/time_between_train_steps": 0.0051076412200927734, "step": 745}
{"info/global_step": 746, "train_info/time_within_train_step": 27.694146394729614, "step": 746}
{"train_info/time_between_train_steps": 0.0048677921295166016, "step": 746}
{"info/global_step": 747, "train_info/time_within_train_step": 27.70768404006958, "step": 747}
{"train_info/time_between_train_steps": 0.004968881607055664, "step": 747}
{"info/global_step": 748, "train_info/time_within_train_step": 27.684829711914062, "step": 748}
{"train_info/time_between_train_steps": 0.005113124847412109, "step": 748}
{"info/global_step": 749, "train_info/time_within_train_step": 27.681796550750732, "step": 749}
{"train_info/time_between_train_steps": 0.005017995834350586, "step": 749}
{"info/global_step": 750, "train_info/time_within_train_step": 27.711034774780273, "step": 750}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740846343, "_runtime": 22292}, "step": 750}
{"logs": {"train/loss": 3.4946, "train/learning_rate": 0.00025, "train/epoch": 27.02, "_timestamp": 1740846343, "_runtime": 22292}, "step": 750}
{"train_info/time_between_train_steps": 0.026391029357910156, "step": 750}
{"info/global_step": 751, "train_info/time_within_train_step": 27.68461775779724, "step": 751}
{"train_info/time_between_train_steps": 0.006167411804199219, "step": 751}
{"info/global_step": 752, "train_info/time_within_train_step": 27.696069717407227, "step": 752}
{"train_info/time_between_train_steps": 0.0051271915435791016, "step": 752}
{"info/global_step": 753, "train_info/time_within_train_step": 27.717214822769165, "step": 753}
{"train_info/time_between_train_steps": 0.005079984664916992, "step": 753}
{"info/global_step": 754, "train_info/time_within_train_step": 27.72770857810974, "step": 754}
{"train_info/time_between_train_steps": 0.005025148391723633, "step": 754}
{"info/global_step": 755, "train_info/time_within_train_step": 27.699385166168213, "step": 755}
{"train_info/time_between_train_steps": 0.005212545394897461, "step": 755}
{"info/global_step": 756, "train_info/time_within_train_step": 27.78471326828003, "step": 756}
{"train_info/time_between_train_steps": 0.0056688785552978516, "step": 756}
{"train_info/time_between_train_steps": 29.823610544204712, "step": 756}
{"info/global_step": 757, "train_info/time_within_train_step": 27.679866313934326, "step": 757}
{"train_info/time_between_train_steps": 0.00493621826171875, "step": 757}
{"info/global_step": 758, "train_info/time_within_train_step": 27.8112313747406, "step": 758}
{"train_info/time_between_train_steps": 0.005324363708496094, "step": 758}
{"info/global_step": 759, "train_info/time_within_train_step": 27.68957543373108, "step": 759}
{"train_info/time_between_train_steps": 0.0048601627349853516, "step": 759}
{"info/global_step": 760, "train_info/time_within_train_step": 27.849790811538696, "step": 760}
{"train_info/time_between_train_steps": 0.005031108856201172, "step": 760}
{"info/global_step": 761, "train_info/time_within_train_step": 27.72820258140564, "step": 761}
{"train_info/time_between_train_steps": 0.0052068233489990234, "step": 761}
{"info/global_step": 762, "train_info/time_within_train_step": 27.8509202003479, "step": 762}
{"train_info/time_between_train_steps": 0.0051119327545166016, "step": 762}
{"info/global_step": 763, "train_info/time_within_train_step": 27.72571110725403, "step": 763}
{"train_info/time_between_train_steps": 0.005269527435302734, "step": 763}
{"info/global_step": 764, "train_info/time_within_train_step": 27.78406834602356, "step": 764}
{"train_info/time_between_train_steps": 0.005171775817871094, "step": 764}
{"info/global_step": 765, "train_info/time_within_train_step": 27.699117183685303, "step": 765}
{"train_info/time_between_train_steps": 0.005185365676879883, "step": 765}
{"info/global_step": 766, "train_info/time_within_train_step": 27.700966835021973, "step": 766}
{"train_info/time_between_train_steps": 0.005179643630981445, "step": 766}
{"info/global_step": 767, "train_info/time_within_train_step": 27.686622858047485, "step": 767}
{"train_info/time_between_train_steps": 0.004982948303222656, "step": 767}
{"info/global_step": 768, "train_info/time_within_train_step": 27.74769377708435, "step": 768}
{"train_info/time_between_train_steps": 0.004995107650756836, "step": 768}
{"info/global_step": 769, "train_info/time_within_train_step": 27.724650859832764, "step": 769}
{"train_info/time_between_train_steps": 0.005130767822265625, "step": 769}
{"info/global_step": 770, "train_info/time_within_train_step": 27.760494470596313, "step": 770}
{"train_info/time_between_train_steps": 0.0060443878173828125, "step": 770}
{"info/global_step": 771, "train_info/time_within_train_step": 27.799352407455444, "step": 771}
{"train_info/time_between_train_steps": 0.004956483840942383, "step": 771}
{"info/global_step": 772, "train_info/time_within_train_step": 27.706594467163086, "step": 772}
{"train_info/time_between_train_steps": 0.006472110748291016, "step": 772}
{"info/global_step": 773, "train_info/time_within_train_step": 27.69157338142395, "step": 773}
{"train_info/time_between_train_steps": 0.0052106380462646484, "step": 773}
{"info/global_step": 774, "train_info/time_within_train_step": 27.708574771881104, "step": 774}
{"train_info/time_between_train_steps": 0.006930351257324219, "step": 774}
{"info/global_step": 775, "train_info/time_within_train_step": 27.69233775138855, "step": 775}
{"train_info/time_between_train_steps": 0.005071401596069336, "step": 775}
{"info/global_step": 776, "train_info/time_within_train_step": 27.68123173713684, "step": 776}
{"train_info/time_between_train_steps": 0.00507044792175293, "step": 776}
{"info/global_step": 777, "train_info/time_within_train_step": 27.720924615859985, "step": 777}
{"train_info/time_between_train_steps": 0.0062656402587890625, "step": 777}
{"info/global_step": 778, "train_info/time_within_train_step": 27.725847005844116, "step": 778}
{"train_info/time_between_train_steps": 0.004975318908691406, "step": 778}
{"info/global_step": 779, "train_info/time_within_train_step": 27.736603021621704, "step": 779}
{"train_info/time_between_train_steps": 0.006090641021728516, "step": 779}
{"info/global_step": 780, "train_info/time_within_train_step": 27.705061435699463, "step": 780}
{"train_info/time_between_train_steps": 0.005053520202636719, "step": 780}
{"info/global_step": 781, "train_info/time_within_train_step": 27.730817556381226, "step": 781}
{"train_info/time_between_train_steps": 0.005067348480224609, "step": 781}
{"info/global_step": 782, "train_info/time_within_train_step": 27.70754909515381, "step": 782}
{"train_info/time_between_train_steps": 0.00535893440246582, "step": 782}
{"info/global_step": 783, "train_info/time_within_train_step": 27.706660747528076, "step": 783}
{"train_info/time_between_train_steps": 0.0056362152099609375, "step": 783}
{"train_info/time_between_train_steps": 29.51830768585205, "step": 783}
{"info/global_step": 784, "train_info/time_within_train_step": 27.703696250915527, "step": 784}
{"train_info/time_between_train_steps": 0.0057141780853271484, "step": 784}
{"info/global_step": 785, "train_info/time_within_train_step": 27.95079803466797, "step": 785}
{"train_info/time_between_train_steps": 0.0051479339599609375, "step": 785}
{"info/global_step": 786, "train_info/time_within_train_step": 27.73789930343628, "step": 786}
{"train_info/time_between_train_steps": 0.00510406494140625, "step": 786}
{"info/global_step": 787, "train_info/time_within_train_step": 27.833077907562256, "step": 787}
{"train_info/time_between_train_steps": 0.005252361297607422, "step": 787}
{"info/global_step": 788, "train_info/time_within_train_step": 27.706275939941406, "step": 788}
{"train_info/time_between_train_steps": 0.005204677581787109, "step": 788}
{"info/global_step": 789, "train_info/time_within_train_step": 27.868988752365112, "step": 789}
{"train_info/time_between_train_steps": 0.005631685256958008, "step": 789}
{"info/global_step": 790, "train_info/time_within_train_step": 27.724032402038574, "step": 790}
{"train_info/time_between_train_steps": 0.011478900909423828, "step": 790}
{"info/global_step": 791, "train_info/time_within_train_step": 27.78103232383728, "step": 791}
{"train_info/time_between_train_steps": 0.005250692367553711, "step": 791}
{"info/global_step": 792, "train_info/time_within_train_step": 27.693026304244995, "step": 792}
{"train_info/time_between_train_steps": 0.005300998687744141, "step": 792}
{"info/global_step": 793, "train_info/time_within_train_step": 27.681272745132446, "step": 793}
{"train_info/time_between_train_steps": 0.005112171173095703, "step": 793}
{"info/global_step": 794, "train_info/time_within_train_step": 27.67368173599243, "step": 794}
{"train_info/time_between_train_steps": 0.0051059722900390625, "step": 794}
{"info/global_step": 795, "train_info/time_within_train_step": 27.68716335296631, "step": 795}
{"train_info/time_between_train_steps": 0.0049059391021728516, "step": 795}
{"info/global_step": 796, "train_info/time_within_train_step": 27.672405242919922, "step": 796}
{"train_info/time_between_train_steps": 0.005040168762207031, "step": 796}
{"info/global_step": 797, "train_info/time_within_train_step": 27.675934314727783, "step": 797}
{"train_info/time_between_train_steps": 0.004956722259521484, "step": 797}
{"info/global_step": 798, "train_info/time_within_train_step": 27.696499824523926, "step": 798}
{"train_info/time_between_train_steps": 0.005181550979614258, "step": 798}
{"info/global_step": 799, "train_info/time_within_train_step": 27.696920156478882, "step": 799}
{"train_info/time_between_train_steps": 0.0051593780517578125, "step": 799}
{"info/global_step": 800, "train_info/time_within_train_step": 27.68538737297058, "step": 800}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740847791, "_runtime": 23740}, "step": 800}
{"logs": {"train/loss": 3.4295, "train/learning_rate": 0.00022222222222222218, "train/epoch": 29.01, "_timestamp": 1740847791, "_runtime": 23740}, "step": 800}
{"train_info/time_between_train_steps": 45.34138894081116, "step": 800}
{"info/global_step": 801, "train_info/time_within_train_step": 28.04743719100952, "step": 801}
{"train_info/time_between_train_steps": 0.00522160530090332, "step": 801}
{"info/global_step": 802, "train_info/time_within_train_step": 27.984935522079468, "step": 802}
{"train_info/time_between_train_steps": 0.0052394866943359375, "step": 802}
{"info/global_step": 803, "train_info/time_within_train_step": 27.734066247940063, "step": 803}
{"train_info/time_between_train_steps": 0.005075931549072266, "step": 803}
{"info/global_step": 804, "train_info/time_within_train_step": 27.705271244049072, "step": 804}
{"train_info/time_between_train_steps": 0.005868196487426758, "step": 804}
{"info/global_step": 805, "train_info/time_within_train_step": 27.700191020965576, "step": 805}
{"train_info/time_between_train_steps": 0.005052804946899414, "step": 805}
{"info/global_step": 806, "train_info/time_within_train_step": 27.703271865844727, "step": 806}
{"train_info/time_between_train_steps": 0.005578279495239258, "step": 806}
{"info/global_step": 807, "train_info/time_within_train_step": 27.703209400177002, "step": 807}
{"train_info/time_between_train_steps": 0.005028963088989258, "step": 807}
{"info/global_step": 808, "train_info/time_within_train_step": 27.72884178161621, "step": 808}
{"train_info/time_between_train_steps": 0.0053598880767822266, "step": 808}
{"info/global_step": 809, "train_info/time_within_train_step": 27.72204566001892, "step": 809}
{"train_info/time_between_train_steps": 0.0055620670318603516, "step": 809}
{"info/global_step": 810, "train_info/time_within_train_step": 27.731279611587524, "step": 810}
{"train_info/time_between_train_steps": 0.006745100021362305, "step": 810}
{"train_info/time_between_train_steps": 29.725592851638794, "step": 810}
{"info/global_step": 811, "train_info/time_within_train_step": 27.714940547943115, "step": 811}
{"train_info/time_between_train_steps": 0.005440235137939453, "step": 811}
{"info/global_step": 812, "train_info/time_within_train_step": 27.8736469745636, "step": 812}
{"train_info/time_between_train_steps": 0.0052759647369384766, "step": 812}
{"info/global_step": 813, "train_info/time_within_train_step": 27.694947719573975, "step": 813}
{"train_info/time_between_train_steps": 0.005990028381347656, "step": 813}
{"info/global_step": 814, "train_info/time_within_train_step": 27.814206838607788, "step": 814}
{"train_info/time_between_train_steps": 0.005049943923950195, "step": 814}
{"info/global_step": 815, "train_info/time_within_train_step": 27.692090272903442, "step": 815}
{"train_info/time_between_train_steps": 0.005128622055053711, "step": 815}
{"info/global_step": 816, "train_info/time_within_train_step": 27.920867919921875, "step": 816}
{"train_info/time_between_train_steps": 0.005758762359619141, "step": 816}
{"info/global_step": 817, "train_info/time_within_train_step": 27.699326515197754, "step": 817}
{"train_info/time_between_train_steps": 0.005112886428833008, "step": 817}
{"info/global_step": 818, "train_info/time_within_train_step": 27.78337836265564, "step": 818}
{"train_info/time_between_train_steps": 0.005307674407958984, "step": 818}
{"info/global_step": 819, "train_info/time_within_train_step": 27.701679706573486, "step": 819}
{"train_info/time_between_train_steps": 0.004866838455200195, "step": 819}
{"info/global_step": 820, "train_info/time_within_train_step": 27.688483238220215, "step": 820}
{"train_info/time_between_train_steps": 0.004977703094482422, "step": 820}
{"info/global_step": 821, "train_info/time_within_train_step": 27.67960524559021, "step": 821}
{"train_info/time_between_train_steps": 0.0051631927490234375, "step": 821}
{"info/global_step": 822, "train_info/time_within_train_step": 27.67815113067627, "step": 822}
{"train_info/time_between_train_steps": 0.009550809860229492, "step": 822}
{"info/global_step": 823, "train_info/time_within_train_step": 27.675416231155396, "step": 823}
{"train_info/time_between_train_steps": 0.004899740219116211, "step": 823}
{"info/global_step": 824, "train_info/time_within_train_step": 27.677238702774048, "step": 824}
{"train_info/time_between_train_steps": 0.009716272354125977, "step": 824}
{"info/global_step": 825, "train_info/time_within_train_step": 27.677024841308594, "step": 825}
{"train_info/time_between_train_steps": 0.005070209503173828, "step": 825}
{"info/global_step": 826, "train_info/time_within_train_step": 27.691486120224, "step": 826}
{"train_info/time_between_train_steps": 0.0050432682037353516, "step": 826}
{"info/global_step": 827, "train_info/time_within_train_step": 27.742215394973755, "step": 827}
{"train_info/time_between_train_steps": 0.009226322174072266, "step": 827}
{"info/global_step": 828, "train_info/time_within_train_step": 27.676904678344727, "step": 828}
{"train_info/time_between_train_steps": 0.01007390022277832, "step": 828}
{"info/global_step": 829, "train_info/time_within_train_step": 29.15452742576599, "step": 829}
{"train_info/time_between_train_steps": 0.005240201950073242, "step": 829}
{"info/global_step": 830, "train_info/time_within_train_step": 27.972545385360718, "step": 830}
{"train_info/time_between_train_steps": 0.004892826080322266, "step": 830}
{"info/global_step": 831, "train_info/time_within_train_step": 27.798168420791626, "step": 831}
{"train_info/time_between_train_steps": 0.004880428314208984, "step": 831}
{"info/global_step": 832, "train_info/time_within_train_step": 27.68090796470642, "step": 832}
{"train_info/time_between_train_steps": 0.004984855651855469, "step": 832}
{"info/global_step": 833, "train_info/time_within_train_step": 27.693134546279907, "step": 833}
{"train_info/time_between_train_steps": 0.005284547805786133, "step": 833}
{"info/global_step": 834, "train_info/time_within_train_step": 27.680370330810547, "step": 834}
{"train_info/time_between_train_steps": 0.004912614822387695, "step": 834}
{"info/global_step": 835, "train_info/time_within_train_step": 27.69346523284912, "step": 835}
{"train_info/time_between_train_steps": 0.005159616470336914, "step": 835}
{"info/global_step": 836, "train_info/time_within_train_step": 27.69474506378174, "step": 836}
{"train_info/time_between_train_steps": 0.005087375640869141, "step": 836}
{"info/global_step": 837, "train_info/time_within_train_step": 27.715152502059937, "step": 837}
{"train_info/time_between_train_steps": 0.0056650638580322266, "step": 837}
{"train_info/time_between_train_steps": 29.846271276474, "step": 837}
{"info/global_step": 838, "train_info/time_within_train_step": 27.688467264175415, "step": 838}
{"train_info/time_between_train_steps": 0.004858255386352539, "step": 838}
{"info/global_step": 839, "train_info/time_within_train_step": 27.86183524131775, "step": 839}
{"train_info/time_between_train_steps": 0.005103349685668945, "step": 839}
{"info/global_step": 840, "train_info/time_within_train_step": 27.69709014892578, "step": 840}
{"train_info/time_between_train_steps": 0.0051958560943603516, "step": 840}
{"info/global_step": 841, "train_info/time_within_train_step": 27.81467866897583, "step": 841}
{"train_info/time_between_train_steps": 0.005251646041870117, "step": 841}
{"info/global_step": 842, "train_info/time_within_train_step": 27.6943678855896, "step": 842}
{"train_info/time_between_train_steps": 0.005115985870361328, "step": 842}
{"info/global_step": 843, "train_info/time_within_train_step": 27.794877290725708, "step": 843}
{"train_info/time_between_train_steps": 0.0050771236419677734, "step": 843}
{"info/global_step": 844, "train_info/time_within_train_step": 27.711644887924194, "step": 844}
{"train_info/time_between_train_steps": 0.005217313766479492, "step": 844}
{"info/global_step": 845, "train_info/time_within_train_step": 27.818432092666626, "step": 845}
{"train_info/time_between_train_steps": 0.005041837692260742, "step": 845}
{"info/global_step": 846, "train_info/time_within_train_step": 27.864030599594116, "step": 846}
{"train_info/time_between_train_steps": 0.004914760589599609, "step": 846}
{"info/global_step": 847, "train_info/time_within_train_step": 27.690366744995117, "step": 847}
{"train_info/time_between_train_steps": 0.004836559295654297, "step": 847}
{"info/global_step": 848, "train_info/time_within_train_step": 27.676128149032593, "step": 848}
{"train_info/time_between_train_steps": 0.005042552947998047, "step": 848}
{"info/global_step": 849, "train_info/time_within_train_step": 27.66452431678772, "step": 849}
{"train_info/time_between_train_steps": 0.004755258560180664, "step": 849}
{"info/global_step": 850, "train_info/time_within_train_step": 27.685068607330322, "step": 850}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740849287, "_runtime": 25236}, "step": 850}
{"logs": {"train/loss": 3.3698, "train/learning_rate": 0.00019444444444444443, "train/epoch": 31.01, "_timestamp": 1740849287, "_runtime": 25236}, "step": 850}
{"train_info/time_between_train_steps": 0.02595996856689453, "step": 850}
{"info/global_step": 851, "train_info/time_within_train_step": 27.68273949623108, "step": 851}
{"train_info/time_between_train_steps": 0.005045652389526367, "step": 851}
{"info/global_step": 852, "train_info/time_within_train_step": 27.74963641166687, "step": 852}
{"train_info/time_between_train_steps": 0.004904508590698242, "step": 852}
{"info/global_step": 853, "train_info/time_within_train_step": 27.67134380340576, "step": 853}
{"train_info/time_between_train_steps": 0.004901885986328125, "step": 853}
{"info/global_step": 854, "train_info/time_within_train_step": 27.672852993011475, "step": 854}
{"train_info/time_between_train_steps": 0.005174160003662109, "step": 854}
{"info/global_step": 855, "train_info/time_within_train_step": 27.678083419799805, "step": 855}
{"train_info/time_between_train_steps": 0.005341053009033203, "step": 855}
{"info/global_step": 856, "train_info/time_within_train_step": 27.68304181098938, "step": 856}
{"train_info/time_between_train_steps": 0.004997730255126953, "step": 856}
{"info/global_step": 857, "train_info/time_within_train_step": 27.696062803268433, "step": 857}
{"train_info/time_between_train_steps": 0.004931449890136719, "step": 857}
{"info/global_step": 858, "train_info/time_within_train_step": 27.744391441345215, "step": 858}
{"train_info/time_between_train_steps": 0.005387067794799805, "step": 858}
{"info/global_step": 859, "train_info/time_within_train_step": 27.710028409957886, "step": 859}
{"train_info/time_between_train_steps": 0.005006551742553711, "step": 859}
{"info/global_step": 860, "train_info/time_within_train_step": 27.673850774765015, "step": 860}
{"train_info/time_between_train_steps": 0.005009651184082031, "step": 860}
{"info/global_step": 861, "train_info/time_within_train_step": 27.67987632751465, "step": 861}
{"train_info/time_between_train_steps": 0.0057752132415771484, "step": 861}
{"info/global_step": 862, "train_info/time_within_train_step": 27.81851315498352, "step": 862}
{"train_info/time_between_train_steps": 0.0054683685302734375, "step": 862}
{"info/global_step": 863, "train_info/time_within_train_step": 27.84092140197754, "step": 863}
{"train_info/time_between_train_steps": 0.005193948745727539, "step": 863}
{"info/global_step": 864, "train_info/time_within_train_step": 27.70356583595276, "step": 864}
{"train_info/time_between_train_steps": 0.005689859390258789, "step": 864}
{"train_info/time_between_train_steps": 30.04367160797119, "step": 864}
{"info/global_step": 865, "train_info/time_within_train_step": 27.707815885543823, "step": 865}
{"train_info/time_between_train_steps": 0.0054378509521484375, "step": 865}
{"info/global_step": 866, "train_info/time_within_train_step": 27.82947301864624, "step": 866}
{"train_info/time_between_train_steps": 0.005258083343505859, "step": 866}
{"info/global_step": 867, "train_info/time_within_train_step": 27.70136857032776, "step": 867}
{"train_info/time_between_train_steps": 0.005247592926025391, "step": 867}
{"info/global_step": 868, "train_info/time_within_train_step": 27.836562395095825, "step": 868}
{"train_info/time_between_train_steps": 0.005228519439697266, "step": 868}
{"info/global_step": 869, "train_info/time_within_train_step": 27.72334861755371, "step": 869}
{"train_info/time_between_train_steps": 0.0050389766693115234, "step": 869}
{"info/global_step": 870, "train_info/time_within_train_step": 27.819096326828003, "step": 870}
{"train_info/time_between_train_steps": 0.005012035369873047, "step": 870}
{"info/global_step": 871, "train_info/time_within_train_step": 27.717029333114624, "step": 871}
{"train_info/time_between_train_steps": 0.005364894866943359, "step": 871}
{"info/global_step": 872, "train_info/time_within_train_step": 27.806649684906006, "step": 872}
{"train_info/time_between_train_steps": 0.0052394866943359375, "step": 872}
{"info/global_step": 873, "train_info/time_within_train_step": 27.697376251220703, "step": 873}
{"train_info/time_between_train_steps": 0.00490880012512207, "step": 873}
{"info/global_step": 874, "train_info/time_within_train_step": 27.691839456558228, "step": 874}
{"train_info/time_between_train_steps": 0.004852771759033203, "step": 874}
{"info/global_step": 875, "train_info/time_within_train_step": 27.731909036636353, "step": 875}
{"train_info/time_between_train_steps": 0.0049190521240234375, "step": 875}
{"info/global_step": 876, "train_info/time_within_train_step": 27.80907416343689, "step": 876}
{"train_info/time_between_train_steps": 0.005060434341430664, "step": 876}
{"info/global_step": 877, "train_info/time_within_train_step": 27.709391117095947, "step": 877}
{"train_info/time_between_train_steps": 0.005223989486694336, "step": 877}
{"info/global_step": 878, "train_info/time_within_train_step": 27.696322441101074, "step": 878}
{"train_info/time_between_train_steps": 0.004901409149169922, "step": 878}
{"info/global_step": 879, "train_info/time_within_train_step": 27.703620433807373, "step": 879}
{"train_info/time_between_train_steps": 0.005059242248535156, "step": 879}
{"info/global_step": 880, "train_info/time_within_train_step": 27.715310096740723, "step": 880}
{"train_info/time_between_train_steps": 0.005146980285644531, "step": 880}
{"info/global_step": 881, "train_info/time_within_train_step": 27.750930547714233, "step": 881}
{"train_info/time_between_train_steps": 0.005077362060546875, "step": 881}
{"info/global_step": 882, "train_info/time_within_train_step": 27.681193351745605, "step": 882}
{"train_info/time_between_train_steps": 0.004918575286865234, "step": 882}
{"info/global_step": 883, "train_info/time_within_train_step": 27.733229875564575, "step": 883}
{"train_info/time_between_train_steps": 0.009912490844726562, "step": 883}
{"info/global_step": 884, "train_info/time_within_train_step": 27.683032989501953, "step": 884}
{"train_info/time_between_train_steps": 0.005019187927246094, "step": 884}
{"info/global_step": 885, "train_info/time_within_train_step": 27.68564009666443, "step": 885}
{"train_info/time_between_train_steps": 0.005006074905395508, "step": 885}
{"info/global_step": 886, "train_info/time_within_train_step": 27.719985961914062, "step": 886}
{"train_info/time_between_train_steps": 0.004923582077026367, "step": 886}
{"info/global_step": 887, "train_info/time_within_train_step": 27.67688298225403, "step": 887}
{"train_info/time_between_train_steps": 0.005051612854003906, "step": 887}
{"info/global_step": 888, "train_info/time_within_train_step": 27.680904626846313, "step": 888}
{"train_info/time_between_train_steps": 0.005121469497680664, "step": 888}
{"info/global_step": 889, "train_info/time_within_train_step": 27.682843685150146, "step": 889}
{"train_info/time_between_train_steps": 0.005907297134399414, "step": 889}
{"info/global_step": 890, "train_info/time_within_train_step": 27.68255043029785, "step": 890}
{"train_info/time_between_train_steps": 0.00507044792175293, "step": 890}
{"info/global_step": 891, "train_info/time_within_train_step": 27.69603943824768, "step": 891}
{"train_info/time_between_train_steps": 0.005517721176147461, "step": 891}
{"train_info/time_between_train_steps": 29.60942840576172, "step": 891}
{"info/global_step": 892, "train_info/time_within_train_step": 27.69633412361145, "step": 892}
{"train_info/time_between_train_steps": 0.004930019378662109, "step": 892}
{"info/global_step": 893, "train_info/time_within_train_step": 27.82957124710083, "step": 893}
{"train_info/time_between_train_steps": 0.004895210266113281, "step": 893}
{"info/global_step": 894, "train_info/time_within_train_step": 27.702529191970825, "step": 894}
{"train_info/time_between_train_steps": 0.004828691482543945, "step": 894}
{"info/global_step": 895, "train_info/time_within_train_step": 27.80821132659912, "step": 895}
{"train_info/time_between_train_steps": 0.005245208740234375, "step": 895}
{"info/global_step": 896, "train_info/time_within_train_step": 27.69315457344055, "step": 896}
{"train_info/time_between_train_steps": 0.0051805973052978516, "step": 896}
{"info/global_step": 897, "train_info/time_within_train_step": 27.815571546554565, "step": 897}
{"train_info/time_between_train_steps": 0.005429744720458984, "step": 897}
{"info/global_step": 898, "train_info/time_within_train_step": 27.681856393814087, "step": 898}
{"train_info/time_between_train_steps": 0.005034923553466797, "step": 898}
{"info/global_step": 899, "train_info/time_within_train_step": 27.75200581550598, "step": 899}
{"train_info/time_between_train_steps": 0.005106449127197266, "step": 899}
{"info/global_step": 900, "train_info/time_within_train_step": 27.69036078453064, "step": 900}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740850734, "_runtime": 26683}, "step": 900}
{"logs": {"train/loss": 3.3143, "train/learning_rate": 0.00016666666666666666, "train/epoch": 33.01, "_timestamp": 1740850734, "_runtime": 26683}, "step": 900}
{"train_info/time_between_train_steps": 44.171876430511475, "step": 900}
{"info/global_step": 901, "train_info/time_within_train_step": 27.90126132965088, "step": 901}
{"train_info/time_between_train_steps": 0.005309581756591797, "step": 901}
{"info/global_step": 902, "train_info/time_within_train_step": 28.000173807144165, "step": 902}
{"train_info/time_between_train_steps": 0.005929231643676758, "step": 902}
{"info/global_step": 903, "train_info/time_within_train_step": 27.743350505828857, "step": 903}
{"train_info/time_between_train_steps": 0.006230592727661133, "step": 903}
{"info/global_step": 904, "train_info/time_within_train_step": 27.69213557243347, "step": 904}
{"train_info/time_between_train_steps": 0.005218982696533203, "step": 904}
{"info/global_step": 905, "train_info/time_within_train_step": 27.6908016204834, "step": 905}
{"train_info/time_between_train_steps": 0.005041837692260742, "step": 905}
{"info/global_step": 906, "train_info/time_within_train_step": 27.697402715682983, "step": 906}
{"train_info/time_between_train_steps": 0.005144834518432617, "step": 906}
{"info/global_step": 907, "train_info/time_within_train_step": 27.82841181755066, "step": 907}
{"train_info/time_between_train_steps": 0.005238056182861328, "step": 907}
{"info/global_step": 908, "train_info/time_within_train_step": 27.710054397583008, "step": 908}
{"train_info/time_between_train_steps": 0.005133152008056641, "step": 908}
{"info/global_step": 909, "train_info/time_within_train_step": 27.760668992996216, "step": 909}
{"train_info/time_between_train_steps": 0.0050885677337646484, "step": 909}
{"info/global_step": 910, "train_info/time_within_train_step": 27.720417022705078, "step": 910}
{"train_info/time_between_train_steps": 0.005059003829956055, "step": 910}
{"info/global_step": 911, "train_info/time_within_train_step": 27.68888807296753, "step": 911}
{"train_info/time_between_train_steps": 0.0051043033599853516, "step": 911}
{"info/global_step": 912, "train_info/time_within_train_step": 27.732280731201172, "step": 912}
{"train_info/time_between_train_steps": 0.006999492645263672, "step": 912}
{"info/global_step": 913, "train_info/time_within_train_step": 27.718446493148804, "step": 913}
{"train_info/time_between_train_steps": 0.004991054534912109, "step": 913}
{"info/global_step": 914, "train_info/time_within_train_step": 27.696208715438843, "step": 914}
{"train_info/time_between_train_steps": 0.0050618648529052734, "step": 914}
{"info/global_step": 915, "train_info/time_within_train_step": 27.70871615409851, "step": 915}
{"train_info/time_between_train_steps": 0.005080699920654297, "step": 915}
{"info/global_step": 916, "train_info/time_within_train_step": 27.746038913726807, "step": 916}
{"train_info/time_between_train_steps": 0.005143165588378906, "step": 916}
{"info/global_step": 917, "train_info/time_within_train_step": 27.689635038375854, "step": 917}
{"train_info/time_between_train_steps": 0.0054738521575927734, "step": 917}
{"info/global_step": 918, "train_info/time_within_train_step": 27.698549509048462, "step": 918}
{"train_info/time_between_train_steps": 0.005518913269042969, "step": 918}
{"train_info/time_between_train_steps": 29.767155408859253, "step": 918}
{"info/global_step": 919, "train_info/time_within_train_step": 27.719228267669678, "step": 919}
{"train_info/time_between_train_steps": 0.0048389434814453125, "step": 919}
{"info/global_step": 920, "train_info/time_within_train_step": 27.799683094024658, "step": 920}
{"train_info/time_between_train_steps": 0.0049591064453125, "step": 920}
{"info/global_step": 921, "train_info/time_within_train_step": 27.77600622177124, "step": 921}
{"train_info/time_between_train_steps": 0.00482940673828125, "step": 921}
{"info/global_step": 922, "train_info/time_within_train_step": 27.83393359184265, "step": 922}
{"train_info/time_between_train_steps": 0.005200862884521484, "step": 922}
{"info/global_step": 923, "train_info/time_within_train_step": 27.68931746482849, "step": 923}
{"train_info/time_between_train_steps": 0.0054569244384765625, "step": 923}
{"info/global_step": 924, "train_info/time_within_train_step": 27.79341435432434, "step": 924}
{"train_info/time_between_train_steps": 0.007645130157470703, "step": 924}
{"info/global_step": 925, "train_info/time_within_train_step": 29.26663827896118, "step": 925}
{"train_info/time_between_train_steps": 0.005210161209106445, "step": 925}
{"info/global_step": 926, "train_info/time_within_train_step": 27.76277184486389, "step": 926}
{"train_info/time_between_train_steps": 0.0075664520263671875, "step": 926}
{"info/global_step": 927, "train_info/time_within_train_step": 27.711672067642212, "step": 927}
{"train_info/time_between_train_steps": 0.005106449127197266, "step": 927}
{"info/global_step": 928, "train_info/time_within_train_step": 27.696779012680054, "step": 928}
{"train_info/time_between_train_steps": 0.004862070083618164, "step": 928}
{"info/global_step": 929, "train_info/time_within_train_step": 27.668912172317505, "step": 929}
{"train_info/time_between_train_steps": 0.00500035285949707, "step": 929}
{"info/global_step": 930, "train_info/time_within_train_step": 27.67416501045227, "step": 930}
{"train_info/time_between_train_steps": 0.0050923824310302734, "step": 930}
{"info/global_step": 931, "train_info/time_within_train_step": 27.712637662887573, "step": 931}
{"train_info/time_between_train_steps": 0.00502777099609375, "step": 931}
{"info/global_step": 932, "train_info/time_within_train_step": 27.692540884017944, "step": 932}
{"train_info/time_between_train_steps": 0.005145072937011719, "step": 932}
{"info/global_step": 933, "train_info/time_within_train_step": 27.68569779396057, "step": 933}
{"train_info/time_between_train_steps": 0.004904747009277344, "step": 933}
{"info/global_step": 934, "train_info/time_within_train_step": 27.679091930389404, "step": 934}
{"train_info/time_between_train_steps": 0.005093097686767578, "step": 934}
{"info/global_step": 935, "train_info/time_within_train_step": 27.677348136901855, "step": 935}
{"train_info/time_between_train_steps": 0.004998445510864258, "step": 935}
{"info/global_step": 936, "train_info/time_within_train_step": 27.688747882843018, "step": 936}
{"train_info/time_between_train_steps": 0.005153656005859375, "step": 936}
{"info/global_step": 937, "train_info/time_within_train_step": 27.796393871307373, "step": 937}
{"train_info/time_between_train_steps": 0.004910469055175781, "step": 937}
{"info/global_step": 938, "train_info/time_within_train_step": 27.731524229049683, "step": 938}
{"train_info/time_between_train_steps": 0.005928516387939453, "step": 938}
{"info/global_step": 939, "train_info/time_within_train_step": 27.67755937576294, "step": 939}
{"train_info/time_between_train_steps": 0.005316495895385742, "step": 939}
{"info/global_step": 940, "train_info/time_within_train_step": 27.686074256896973, "step": 940}
{"train_info/time_between_train_steps": 0.005161762237548828, "step": 940}
{"info/global_step": 941, "train_info/time_within_train_step": 27.701130390167236, "step": 941}
{"train_info/time_between_train_steps": 0.004944562911987305, "step": 941}
{"info/global_step": 942, "train_info/time_within_train_step": 27.72839379310608, "step": 942}
{"train_info/time_between_train_steps": 0.005320310592651367, "step": 942}
{"info/global_step": 943, "train_info/time_within_train_step": 27.738743543624878, "step": 943}
{"train_info/time_between_train_steps": 0.011515378952026367, "step": 943}
{"info/global_step": 944, "train_info/time_within_train_step": 27.698099851608276, "step": 944}
{"train_info/time_between_train_steps": 0.005238533020019531, "step": 944}
{"info/global_step": 945, "train_info/time_within_train_step": 27.722442626953125, "step": 945}
{"train_info/time_between_train_steps": 0.005635738372802734, "step": 945}
{"train_info/time_between_train_steps": 29.960261821746826, "step": 945}
{"info/global_step": 946, "train_info/time_within_train_step": 27.686065912246704, "step": 946}
{"train_info/time_between_train_steps": 0.004873991012573242, "step": 946}
{"info/global_step": 947, "train_info/time_within_train_step": 27.799901962280273, "step": 947}
{"train_info/time_between_train_steps": 0.00489044189453125, "step": 947}
{"info/global_step": 948, "train_info/time_within_train_step": 27.677647590637207, "step": 948}
{"train_info/time_between_train_steps": 0.0053136348724365234, "step": 948}
{"info/global_step": 949, "train_info/time_within_train_step": 27.84376072883606, "step": 949}
{"train_info/time_between_train_steps": 0.006299495697021484, "step": 949}
{"info/global_step": 950, "train_info/time_within_train_step": 27.759663581848145, "step": 950}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740852229, "_runtime": 28178}, "step": 950}
{"logs": {"train/loss": 3.2639, "train/learning_rate": 0.0001388888888888889, "train/epoch": 35.0, "_timestamp": 1740852229, "_runtime": 28178}, "step": 950}
{"train_info/time_between_train_steps": 0.025829076766967773, "step": 950}
{"info/global_step": 951, "train_info/time_within_train_step": 27.887420654296875, "step": 951}
{"train_info/time_between_train_steps": 0.011326313018798828, "step": 951}
{"info/global_step": 952, "train_info/time_within_train_step": 27.783405780792236, "step": 952}
{"train_info/time_between_train_steps": 0.005148649215698242, "step": 952}
{"info/global_step": 953, "train_info/time_within_train_step": 27.809897899627686, "step": 953}
{"train_info/time_between_train_steps": 0.011486053466796875, "step": 953}
{"info/global_step": 954, "train_info/time_within_train_step": 27.711515188217163, "step": 954}
{"train_info/time_between_train_steps": 0.0050127506256103516, "step": 954}
{"info/global_step": 955, "train_info/time_within_train_step": 27.697843551635742, "step": 955}
{"train_info/time_between_train_steps": 0.005132436752319336, "step": 955}
{"info/global_step": 956, "train_info/time_within_train_step": 27.754255056381226, "step": 956}
{"train_info/time_between_train_steps": 0.00507044792175293, "step": 956}
{"info/global_step": 957, "train_info/time_within_train_step": 27.7044677734375, "step": 957}
{"train_info/time_between_train_steps": 0.00531768798828125, "step": 957}
{"info/global_step": 958, "train_info/time_within_train_step": 27.72556233406067, "step": 958}
{"train_info/time_between_train_steps": 0.005191802978515625, "step": 958}
{"info/global_step": 959, "train_info/time_within_train_step": 27.699970960617065, "step": 959}
{"train_info/time_between_train_steps": 0.004980802536010742, "step": 959}
{"info/global_step": 960, "train_info/time_within_train_step": 27.704877138137817, "step": 960}
{"train_info/time_between_train_steps": 0.0061206817626953125, "step": 960}
{"info/global_step": 961, "train_info/time_within_train_step": 27.7079496383667, "step": 961}
{"train_info/time_between_train_steps": 0.006025075912475586, "step": 961}
{"info/global_step": 962, "train_info/time_within_train_step": 27.69909930229187, "step": 962}
{"train_info/time_between_train_steps": 0.005297660827636719, "step": 962}
{"info/global_step": 963, "train_info/time_within_train_step": 27.71964979171753, "step": 963}
{"train_info/time_between_train_steps": 0.005063295364379883, "step": 963}
{"info/global_step": 964, "train_info/time_within_train_step": 27.71163296699524, "step": 964}
{"train_info/time_between_train_steps": 0.0050885677337646484, "step": 964}
{"info/global_step": 965, "train_info/time_within_train_step": 27.719051599502563, "step": 965}
{"train_info/time_between_train_steps": 0.004924774169921875, "step": 965}
{"info/global_step": 966, "train_info/time_within_train_step": 27.702669143676758, "step": 966}
{"train_info/time_between_train_steps": 0.005282878875732422, "step": 966}
{"info/global_step": 967, "train_info/time_within_train_step": 27.768574953079224, "step": 967}
{"train_info/time_between_train_steps": 0.00501704216003418, "step": 967}
{"info/global_step": 968, "train_info/time_within_train_step": 27.69939923286438, "step": 968}
{"train_info/time_between_train_steps": 0.0049474239349365234, "step": 968}
{"info/global_step": 969, "train_info/time_within_train_step": 27.70941162109375, "step": 969}
{"train_info/time_between_train_steps": 0.005654096603393555, "step": 969}
{"info/global_step": 970, "train_info/time_within_train_step": 27.70650339126587, "step": 970}
{"train_info/time_between_train_steps": 0.005235433578491211, "step": 970}
{"info/global_step": 971, "train_info/time_within_train_step": 27.714507818222046, "step": 971}
{"train_info/time_between_train_steps": 0.007652997970581055, "step": 971}
{"info/global_step": 972, "train_info/time_within_train_step": 27.762444972991943, "step": 972}
{"train_info/time_between_train_steps": 0.00531005859375, "step": 972}
{"train_info/time_between_train_steps": 29.684876680374146, "step": 972}
{"info/global_step": 973, "train_info/time_within_train_step": 27.769051551818848, "step": 973}
{"train_info/time_between_train_steps": 0.005354642868041992, "step": 973}
{"info/global_step": 974, "train_info/time_within_train_step": 27.832839727401733, "step": 974}
{"train_info/time_between_train_steps": 0.005819082260131836, "step": 974}
{"info/global_step": 975, "train_info/time_within_train_step": 27.714015007019043, "step": 975}
{"train_info/time_between_train_steps": 0.005135774612426758, "step": 975}
{"info/global_step": 976, "train_info/time_within_train_step": 27.804633617401123, "step": 976}
{"train_info/time_between_train_steps": 0.005151271820068359, "step": 976}
{"info/global_step": 977, "train_info/time_within_train_step": 27.736013889312744, "step": 977}
{"train_info/time_between_train_steps": 0.006240129470825195, "step": 977}
{"info/global_step": 978, "train_info/time_within_train_step": 27.83270764350891, "step": 978}
{"train_info/time_between_train_steps": 0.0052607059478759766, "step": 978}
{"info/global_step": 979, "train_info/time_within_train_step": 27.715281009674072, "step": 979}
{"train_info/time_between_train_steps": 0.005099296569824219, "step": 979}
{"info/global_step": 980, "train_info/time_within_train_step": 27.756693840026855, "step": 980}
{"train_info/time_between_train_steps": 0.005257129669189453, "step": 980}
{"info/global_step": 981, "train_info/time_within_train_step": 27.740006923675537, "step": 981}
{"train_info/time_between_train_steps": 0.005687713623046875, "step": 981}
{"info/global_step": 982, "train_info/time_within_train_step": 27.797641038894653, "step": 982}
{"train_info/time_between_train_steps": 0.0050182342529296875, "step": 982}
{"info/global_step": 983, "train_info/time_within_train_step": 27.716996669769287, "step": 983}
{"train_info/time_between_train_steps": 0.0049076080322265625, "step": 983}
{"info/global_step": 984, "train_info/time_within_train_step": 27.695619821548462, "step": 984}
{"train_info/time_between_train_steps": 0.004867076873779297, "step": 984}
{"info/global_step": 985, "train_info/time_within_train_step": 27.722055196762085, "step": 985}
{"train_info/time_between_train_steps": 0.004982471466064453, "step": 985}
{"info/global_step": 986, "train_info/time_within_train_step": 27.721017837524414, "step": 986}
{"train_info/time_between_train_steps": 0.00493931770324707, "step": 986}
{"info/global_step": 987, "train_info/time_within_train_step": 27.699114322662354, "step": 987}
{"train_info/time_between_train_steps": 0.006012916564941406, "step": 987}
{"info/global_step": 988, "train_info/time_within_train_step": 27.74301791191101, "step": 988}
{"train_info/time_between_train_steps": 0.005124807357788086, "step": 988}
{"info/global_step": 989, "train_info/time_within_train_step": 27.71071743965149, "step": 989}
{"train_info/time_between_train_steps": 0.005101442337036133, "step": 989}
{"info/global_step": 990, "train_info/time_within_train_step": 27.737481355667114, "step": 990}
{"train_info/time_between_train_steps": 0.00513458251953125, "step": 990}
{"info/global_step": 991, "train_info/time_within_train_step": 27.729920148849487, "step": 991}
{"train_info/time_between_train_steps": 0.005026817321777344, "step": 991}
{"info/global_step": 992, "train_info/time_within_train_step": 27.68966317176819, "step": 992}
{"train_info/time_between_train_steps": 0.0060498714447021484, "step": 992}
{"info/global_step": 993, "train_info/time_within_train_step": 27.695364952087402, "step": 993}
{"train_info/time_between_train_steps": 0.005030393600463867, "step": 993}
{"info/global_step": 994, "train_info/time_within_train_step": 27.706636905670166, "step": 994}
{"train_info/time_between_train_steps": 0.006405353546142578, "step": 994}
{"info/global_step": 995, "train_info/time_within_train_step": 27.69776749610901, "step": 995}
{"train_info/time_between_train_steps": 0.009327173233032227, "step": 995}
{"info/global_step": 996, "train_info/time_within_train_step": 27.715208768844604, "step": 996}
{"train_info/time_between_train_steps": 0.004992008209228516, "step": 996}
{"info/global_step": 997, "train_info/time_within_train_step": 27.7818500995636, "step": 997}
{"train_info/time_between_train_steps": 0.0069026947021484375, "step": 997}
{"info/global_step": 998, "train_info/time_within_train_step": 27.731788635253906, "step": 998}
{"train_info/time_between_train_steps": 0.005379676818847656, "step": 998}
{"info/global_step": 999, "train_info/time_within_train_step": 27.74721884727478, "step": 999}
{"train_info/time_between_train_steps": 0.00545048713684082, "step": 999}
{"train_info/time_between_train_steps": 29.724198818206787, "step": 999}
{"info/global_step": 1000, "train_info/time_within_train_step": 27.688565254211426, "step": 1000}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740853676, "_runtime": 29625}, "step": 1000}
{"logs": {"train/loss": 3.2163, "train/learning_rate": 0.00011111111111111109, "train/epoch": 37.0, "_timestamp": 1740853676, "_runtime": 29625}, "step": 1000}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1740853680, "_runtime": 29629}, "step": 1000}
{"logs": {"eval/loss": 4.151810169219971, "eval/runtime": 4.074, "eval/samples_per_second": 49.828, "eval/steps_per_second": 3.191, "train/epoch": 37.0, "_timestamp": 1740853680, "_runtime": 29629}, "step": 1000}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1740853680, "_runtime": 29629}, "step": 1000}
{"logs": {"eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_loss": 4.151810169219971, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_ppl": 63.548930563193956, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_runtime": 4.074, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_samples_per_second": 49.828, "train/epoch": 37.0, "_timestamp": 1740853680, "_runtime": 29629}, "step": 1000}
{"train_info/time_between_train_steps": 43.36605477333069, "step": 1000}
{"info/global_step": 1001, "train_info/time_within_train_step": 28.000293493270874, "step": 1001}
{"train_info/time_between_train_steps": 0.005351066589355469, "step": 1001}
{"info/global_step": 1002, "train_info/time_within_train_step": 27.870596408843994, "step": 1002}
{"train_info/time_between_train_steps": 0.0053098201751708984, "step": 1002}
{"info/global_step": 1003, "train_info/time_within_train_step": 27.874591827392578, "step": 1003}
{"train_info/time_between_train_steps": 0.009335756301879883, "step": 1003}
{"info/global_step": 1004, "train_info/time_within_train_step": 27.702943086624146, "step": 1004}
{"train_info/time_between_train_steps": 0.005999088287353516, "step": 1004}
{"info/global_step": 1005, "train_info/time_within_train_step": 27.81688404083252, "step": 1005}
{"train_info/time_between_train_steps": 0.0051996707916259766, "step": 1005}
{"info/global_step": 1006, "train_info/time_within_train_step": 27.708719730377197, "step": 1006}
{"train_info/time_between_train_steps": 0.005308866500854492, "step": 1006}
{"info/global_step": 1007, "train_info/time_within_train_step": 27.78282356262207, "step": 1007}
{"train_info/time_between_train_steps": 0.005166292190551758, "step": 1007}
{"info/global_step": 1008, "train_info/time_within_train_step": 27.686821460723877, "step": 1008}
{"train_info/time_between_train_steps": 0.004780292510986328, "step": 1008}
{"info/global_step": 1009, "train_info/time_within_train_step": 27.703312635421753, "step": 1009}
{"train_info/time_between_train_steps": 0.004992961883544922, "step": 1009}
{"info/global_step": 1010, "train_info/time_within_train_step": 27.69071125984192, "step": 1010}
{"train_info/time_between_train_steps": 0.005003690719604492, "step": 1010}
{"info/global_step": 1011, "train_info/time_within_train_step": 27.71597695350647, "step": 1011}
{"train_info/time_between_train_steps": 0.005227804183959961, "step": 1011}
{"info/global_step": 1012, "train_info/time_within_train_step": 27.79442286491394, "step": 1012}
{"train_info/time_between_train_steps": 0.005912303924560547, "step": 1012}
{"info/global_step": 1013, "train_info/time_within_train_step": 27.686455965042114, "step": 1013}
{"train_info/time_between_train_steps": 0.004822969436645508, "step": 1013}
{"info/global_step": 1014, "train_info/time_within_train_step": 27.681681871414185, "step": 1014}
{"train_info/time_between_train_steps": 0.00495147705078125, "step": 1014}
{"info/global_step": 1015, "train_info/time_within_train_step": 27.703522443771362, "step": 1015}
{"train_info/time_between_train_steps": 0.005167484283447266, "step": 1015}
{"info/global_step": 1016, "train_info/time_within_train_step": 27.712687730789185, "step": 1016}
{"train_info/time_between_train_steps": 0.004875898361206055, "step": 1016}
{"info/global_step": 1017, "train_info/time_within_train_step": 27.671220064163208, "step": 1017}
{"train_info/time_between_train_steps": 0.0050661563873291016, "step": 1017}
{"info/global_step": 1018, "train_info/time_within_train_step": 27.696019649505615, "step": 1018}
{"train_info/time_between_train_steps": 0.005045175552368164, "step": 1018}
{"info/global_step": 1019, "train_info/time_within_train_step": 27.684862852096558, "step": 1019}
{"train_info/time_between_train_steps": 0.01546478271484375, "step": 1019}
{"info/global_step": 1020, "train_info/time_within_train_step": 27.67762017250061, "step": 1020}
{"train_info/time_between_train_steps": 0.004844188690185547, "step": 1020}
{"info/global_step": 1021, "train_info/time_within_train_step": 27.676417350769043, "step": 1021}
{"train_info/time_between_train_steps": 0.004984378814697266, "step": 1021}
{"info/global_step": 1022, "train_info/time_within_train_step": 27.695767879486084, "step": 1022}
{"train_info/time_between_train_steps": 0.005397319793701172, "step": 1022}
{"info/global_step": 1023, "train_info/time_within_train_step": 27.93650460243225, "step": 1023}
{"train_info/time_between_train_steps": 0.00986337661743164, "step": 1023}
{"info/global_step": 1024, "train_info/time_within_train_step": 27.712936878204346, "step": 1024}
{"train_info/time_between_train_steps": 0.004930257797241211, "step": 1024}
{"info/global_step": 1025, "train_info/time_within_train_step": 27.69081473350525, "step": 1025}
{"train_info/time_between_train_steps": 0.0051648616790771484, "step": 1025}
{"info/global_step": 1026, "train_info/time_within_train_step": 27.696756839752197, "step": 1026}
{"train_info/time_between_train_steps": 0.005416393280029297, "step": 1026}
{"train_info/time_between_train_steps": 29.801055431365967, "step": 1026}
{"info/global_step": 1027, "train_info/time_within_train_step": 27.76788592338562, "step": 1027}
{"train_info/time_between_train_steps": 0.005841255187988281, "step": 1027}
{"info/global_step": 1028, "train_info/time_within_train_step": 27.792548656463623, "step": 1028}
{"train_info/time_between_train_steps": 0.005135297775268555, "step": 1028}
{"info/global_step": 1029, "train_info/time_within_train_step": 27.68139624595642, "step": 1029}
{"train_info/time_between_train_steps": 0.004940986633300781, "step": 1029}
{"info/global_step": 1030, "train_info/time_within_train_step": 27.79544425010681, "step": 1030}
{"train_info/time_between_train_steps": 0.005193471908569336, "step": 1030}
{"info/global_step": 1031, "train_info/time_within_train_step": 27.697800874710083, "step": 1031}
{"train_info/time_between_train_steps": 0.005063295364379883, "step": 1031}
{"info/global_step": 1032, "train_info/time_within_train_step": 27.871296405792236, "step": 1032}
{"train_info/time_between_train_steps": 0.005288362503051758, "step": 1032}
{"info/global_step": 1033, "train_info/time_within_train_step": 27.69260001182556, "step": 1033}
{"train_info/time_between_train_steps": 0.005006074905395508, "step": 1033}
{"info/global_step": 1034, "train_info/time_within_train_step": 27.757064819335938, "step": 1034}
{"train_info/time_between_train_steps": 0.005165815353393555, "step": 1034}
{"info/global_step": 1035, "train_info/time_within_train_step": 27.699219703674316, "step": 1035}
{"train_info/time_between_train_steps": 0.004901885986328125, "step": 1035}
{"info/global_step": 1036, "train_info/time_within_train_step": 27.716142654418945, "step": 1036}
{"train_info/time_between_train_steps": 0.0048732757568359375, "step": 1036}
{"info/global_step": 1037, "train_info/time_within_train_step": 27.704490423202515, "step": 1037}
{"train_info/time_between_train_steps": 0.0050661563873291016, "step": 1037}
{"info/global_step": 1038, "train_info/time_within_train_step": 27.6817569732666, "step": 1038}
{"train_info/time_between_train_steps": 0.004983425140380859, "step": 1038}
{"info/global_step": 1039, "train_info/time_within_train_step": 27.70174527168274, "step": 1039}
{"train_info/time_between_train_steps": 0.005151033401489258, "step": 1039}
{"info/global_step": 1040, "train_info/time_within_train_step": 27.68877911567688, "step": 1040}
{"train_info/time_between_train_steps": 0.0049610137939453125, "step": 1040}
{"info/global_step": 1041, "train_info/time_within_train_step": 27.72638511657715, "step": 1041}
{"train_info/time_between_train_steps": 0.004918813705444336, "step": 1041}
{"info/global_step": 1042, "train_info/time_within_train_step": 27.801883459091187, "step": 1042}
{"train_info/time_between_train_steps": 0.0051496028900146484, "step": 1042}
{"info/global_step": 1043, "train_info/time_within_train_step": 27.683640480041504, "step": 1043}
{"train_info/time_between_train_steps": 0.004891872406005859, "step": 1043}
{"info/global_step": 1044, "train_info/time_within_train_step": 27.679919004440308, "step": 1044}
{"train_info/time_between_train_steps": 0.005937337875366211, "step": 1044}
{"info/global_step": 1045, "train_info/time_within_train_step": 27.736676692962646, "step": 1045}
{"train_info/time_between_train_steps": 0.005287647247314453, "step": 1045}
{"info/global_step": 1046, "train_info/time_within_train_step": 27.70685315132141, "step": 1046}
{"train_info/time_between_train_steps": 0.0052416324615478516, "step": 1046}
{"info/global_step": 1047, "train_info/time_within_train_step": 27.70112657546997, "step": 1047}
{"train_info/time_between_train_steps": 0.0051839351654052734, "step": 1047}
{"info/global_step": 1048, "train_info/time_within_train_step": 27.70680546760559, "step": 1048}
{"train_info/time_between_train_steps": 0.004974842071533203, "step": 1048}
{"info/global_step": 1049, "train_info/time_within_train_step": 27.696149349212646, "step": 1049}
{"train_info/time_between_train_steps": 0.005005836486816406, "step": 1049}
{"info/global_step": 1050, "train_info/time_within_train_step": 27.69243288040161, "step": 1050}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1740855138, "_runtime": 31087}, "step": 1050}
{"logs": {"train/loss": 3.1173, "train/learning_rate": 8.333333333333333e-05, "train/epoch": 38.02, "_timestamp": 1740855138, "_runtime": 31087}, "step": 1050}
{"train_info/time_between_train_steps": 0.025829792022705078, "step": 1050}
{"info/global_step": 1051, "train_info/time_within_train_step": 27.74435567855835, "step": 1051}
{"train_info/time_between_train_steps": 0.005174160003662109, "step": 1051}
{"info/global_step": 1052, "train_info/time_within_train_step": 27.74781060218811, "step": 1052}
{"train_info/time_between_train_steps": 0.005259513854980469, "step": 1052}
{"info/global_step": 1053, "train_info/time_within_train_step": 27.70914363861084, "step": 1053}
{"train_info/time_between_train_steps": 0.005623340606689453, "step": 1053}
{"train_info/time_between_train_steps": 29.710018396377563, "step": 1053}
{"info/global_step": 1054, "train_info/time_within_train_step": 27.71225118637085, "step": 1054}
{"train_info/time_between_train_steps": 0.0052947998046875, "step": 1054}
{"info/global_step": 1055, "train_info/time_within_train_step": 27.84862518310547, "step": 1055}
{"train_info/time_between_train_steps": 0.005180835723876953, "step": 1055}
{"info/global_step": 1056, "train_info/time_within_train_step": 27.730132341384888, "step": 1056}
{"train_info/time_between_train_steps": 0.005624055862426758, "step": 1056}
{"info/global_step": 1057, "train_info/time_within_train_step": 27.94749617576599, "step": 1057}
{"train_info/time_between_train_steps": 0.005332469940185547, "step": 1057}
{"info/global_step": 1058, "train_info/time_within_train_step": 27.698956727981567, "step": 1058}
{"train_info/time_between_train_steps": 0.005093812942504883, "step": 1058}
{"info/global_step": 1059, "train_info/time_within_train_step": 27.832836151123047, "step": 1059}
{"train_info/time_between_train_steps": 0.0049669742584228516, "step": 1059}
{"info/global_step": 1060, "train_info/time_within_train_step": 27.70452380180359, "step": 1060}
{"train_info/time_between_train_steps": 0.005288839340209961, "step": 1060}
{"info/global_step": 1061, "train_info/time_within_train_step": 27.786941051483154, "step": 1061}
{"train_info/time_between_train_steps": 0.0068171024322509766, "step": 1061}
{"info/global_step": 1062, "train_info/time_within_train_step": 27.69574999809265, "step": 1062}
{"train_info/time_between_train_steps": 0.005157470703125, "step": 1062}
{"info/global_step": 1063, "train_info/time_within_train_step": 27.67673635482788, "step": 1063}
{"train_info/time_between_train_steps": 0.0049746036529541016, "step": 1063}
{"info/global_step": 1064, "train_info/time_within_train_step": 27.685830116271973, "step": 1064}
{"train_info/time_between_train_steps": 0.004913806915283203, "step": 1064}
{"info/global_step": 1065, "train_info/time_within_train_step": 27.69575810432434, "step": 1065}
{"train_info/time_between_train_steps": 0.005175113677978516, "step": 1065}
{"info/global_step": 1066, "train_info/time_within_train_step": 27.695711851119995, "step": 1066}
{"train_info/time_between_train_steps": 0.004931211471557617, "step": 1066}
{"info/global_step": 1067, "train_info/time_within_train_step": 27.954797983169556, "step": 1067}
{"train_info/time_between_train_steps": 0.0048999786376953125, "step": 1067}
{"info/global_step": 1068, "train_info/time_within_train_step": 27.712567806243896, "step": 1068}
{"train_info/time_between_train_steps": 0.005145072937011719, "step": 1068}
{"info/global_step": 1069, "train_info/time_within_train_step": 27.703584671020508, "step": 1069}
{"train_info/time_between_train_steps": 0.005635499954223633, "step": 1069}
{"info/global_step": 1070, "train_info/time_within_train_step": 27.741321563720703, "step": 1070}
{"train_info/time_between_train_steps": 0.005042552947998047, "step": 1070}
{"info/global_step": 1071, "train_info/time_within_train_step": 27.694608449935913, "step": 1071}
{"train_info/time_between_train_steps": 0.005138874053955078, "step": 1071}
{"info/global_step": 1072, "train_info/time_within_train_step": 27.73574995994568, "step": 1072}
{"train_info/time_between_train_steps": 0.00514674186706543, "step": 1072}
{"info/global_step": 1073, "train_info/time_within_train_step": 27.812591314315796, "step": 1073}
{"train_info/time_between_train_steps": 0.004973649978637695, "step": 1073}
{"info/global_step": 1074, "train_info/time_within_train_step": 27.69587540626526, "step": 1074}
{"train_info/time_between_train_steps": 0.0050046443939208984, "step": 1074}
{"info/global_step": 1075, "train_info/time_within_train_step": 27.730485439300537, "step": 1075}
{"train_info/time_between_train_steps": 0.0048961639404296875, "step": 1075}
{"info/global_step": 1076, "train_info/time_within_train_step": 27.696619033813477, "step": 1076}
{"train_info/time_between_train_steps": 0.0049173831939697266, "step": 1076}
{"info/global_step": 1077, "train_info/time_within_train_step": 27.674572706222534, "step": 1077}
{"train_info/time_between_train_steps": 0.005046367645263672, "step": 1077}
{"info/global_step": 1078, "train_info/time_within_train_step": 27.7299907207489, "step": 1078}
{"train_info/time_between_train_steps": 0.005077838897705078, "step": 1078}
{"info/global_step": 1079, "train_info/time_within_train_step": 27.712668657302856, "step": 1079}
{"train_info/time_between_train_steps": 0.005385875701904297, "step": 1079}
{"info/global_step": 1080, "train_info/time_within_train_step": 27.72298789024353, "step": 1080}
{"train_info/time_between_train_steps": 0.005451202392578125, "step": 1080}
{"train_info/time_between_train_steps": 29.762459993362427, "step": 1080}
{"info/global_step": 1081, "train_info/time_within_train_step": 27.740341663360596, "step": 1081}
{"train_info/time_between_train_steps": 0.005019426345825195, "step": 1081}
{"info/global_step": 1082, "train_info/time_within_train_step": 27.85689353942871, "step": 1082}
{"train_info/time_between_train_steps": 0.004942417144775391, "step": 1082}
{"info/global_step": 1083, "train_info/time_within_train_step": 27.691681385040283, "step": 1083}
{"train_info/time_between_train_steps": 0.005137443542480469, "step": 1083}
{"info/global_step": 1084, "train_info/time_within_train_step": 27.83687734603882, "step": 1084}
{"train_info/time_between_train_steps": 0.005265951156616211, "step": 1084}
{"info/global_step": 1085, "train_info/time_within_train_step": 27.727338075637817, "step": 1085}
{"train_info/time_between_train_steps": 0.00560760498046875, "step": 1085}
{"info/global_step": 1086, "train_info/time_within_train_step": 27.904183626174927, "step": 1086}
{"train_info/time_between_train_steps": 0.005445718765258789, "step": 1086}
{"info/global_step": 1087, "train_info/time_within_train_step": 27.834667205810547, "step": 1087}
{"train_info/time_between_train_steps": 0.0051877498626708984, "step": 1087}
{"info/global_step": 1088, "train_info/time_within_train_step": 27.77045726776123, "step": 1088}
{"train_info/time_between_train_steps": 0.0052182674407958984, "step": 1088}
{"info/global_step": 1089, "train_info/time_within_train_step": 27.71987748146057, "step": 1089}
{"train_info/time_between_train_steps": 0.00492405891418457, "step": 1089}
{"info/global_step": 1090, "train_info/time_within_train_step": 27.695985794067383, "step": 1090}
{"train_info/time_between_train_steps": 0.005131721496582031, "step": 1090}
{"info/global_step": 1091, "train_info/time_within_train_step": 27.71149778366089, "step": 1091}
{"train_info/time_between_train_steps": 0.00494837760925293, "step": 1091}
{"info/global_step": 1092, "train_info/time_within_train_step": 27.738033294677734, "step": 1092}
{"train_info/time_between_train_steps": 0.0054056644439697266, "step": 1092}
{"info/global_step": 1093, "train_info/time_within_train_step": 27.685067892074585, "step": 1093}
{"train_info/time_between_train_steps": 0.005060911178588867, "step": 1093}
{"info/global_step": 1094, "train_info/time_within_train_step": 27.7299382686615, "step": 1094}
{"train_info/time_between_train_steps": 0.004908561706542969, "step": 1094}
{"info/global_step": 1095, "train_info/time_within_train_step": 27.68550181388855, "step": 1095}
{"train_info/time_between_train_steps": 0.00502467155456543, "step": 1095}
{"info/global_step": 1096, "train_info/time_within_train_step": 27.68264651298523, "step": 1096}
{"train_info/time_between_train_steps": 0.005059242248535156, "step": 1096}
{"info/global_step": 1097, "train_info/time_within_train_step": 27.719717979431152, "step": 1097}
{"train_info/time_between_train_steps": 0.0051422119140625, "step": 1097}
{"info/global_step": 1098, "train_info/time_within_train_step": 27.69098711013794, "step": 1098}
{"train_info/time_between_train_steps": 0.005074501037597656, "step": 1098}
{"info/global_step": 1099, "train_info/time_within_train_step": 27.68382740020752, "step": 1099}
{"train_info/time_between_train_steps": 0.004937410354614258, "step": 1099}
{"info/global_step": 1100, "train_info/time_within_train_step": 27.683674812316895, "step": 1100}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1740856586, "_runtime": 32535}, "step": 1100}
{"logs": {"train/loss": 3.142, "train/learning_rate": 5.5555555555555545e-05, "train/epoch": 40.02, "_timestamp": 1740856586, "_runtime": 32535}, "step": 1100}
{"train_info/time_between_train_steps": 41.02827215194702, "step": 1100}
{"info/global_step": 1101, "train_info/time_within_train_step": 27.998775243759155, "step": 1101}
{"train_info/time_between_train_steps": 0.0052111148834228516, "step": 1101}
{"info/global_step": 1102, "train_info/time_within_train_step": 28.6092848777771, "step": 1102}
{"train_info/time_between_train_steps": 0.005062580108642578, "step": 1102}
{"info/global_step": 1103, "train_info/time_within_train_step": 27.798083305358887, "step": 1103}
{"train_info/time_between_train_steps": 0.005140781402587891, "step": 1103}
{"info/global_step": 1104, "train_info/time_within_train_step": 27.723987579345703, "step": 1104}
{"train_info/time_between_train_steps": 0.005644559860229492, "step": 1104}
{"info/global_step": 1105, "train_info/time_within_train_step": 27.713963985443115, "step": 1105}
{"train_info/time_between_train_steps": 0.005319833755493164, "step": 1105}
{"info/global_step": 1106, "train_info/time_within_train_step": 27.74254536628723, "step": 1106}
{"train_info/time_between_train_steps": 0.005207538604736328, "step": 1106}
{"info/global_step": 1107, "train_info/time_within_train_step": 27.734828233718872, "step": 1107}
{"train_info/time_between_train_steps": 0.005782604217529297, "step": 1107}
{"train_info/time_between_train_steps": 30.005472898483276, "step": 1107}
{"info/global_step": 1108, "train_info/time_within_train_step": 27.70647621154785, "step": 1108}
{"train_info/time_between_train_steps": 0.004958391189575195, "step": 1108}
{"info/global_step": 1109, "train_info/time_within_train_step": 27.84903049468994, "step": 1109}
{"train_info/time_between_train_steps": 0.004988670349121094, "step": 1109}
{"info/global_step": 1110, "train_info/time_within_train_step": 27.687151432037354, "step": 1110}
{"train_info/time_between_train_steps": 0.004788398742675781, "step": 1110}
{"info/global_step": 1111, "train_info/time_within_train_step": 27.840144395828247, "step": 1111}
{"train_info/time_between_train_steps": 0.005113840103149414, "step": 1111}
{"info/global_step": 1112, "train_info/time_within_train_step": 27.70552897453308, "step": 1112}
{"train_info/time_between_train_steps": 0.005121946334838867, "step": 1112}
{"info/global_step": 1113, "train_info/time_within_train_step": 27.824426651000977, "step": 1113}
{"train_info/time_between_train_steps": 0.0052623748779296875, "step": 1113}
{"info/global_step": 1114, "train_info/time_within_train_step": 27.709877490997314, "step": 1114}
{"train_info/time_between_train_steps": 0.005372047424316406, "step": 1114}
{"info/global_step": 1115, "train_info/time_within_train_step": 27.772328853607178, "step": 1115}
{"train_info/time_between_train_steps": 0.0052165985107421875, "step": 1115}
{"info/global_step": 1116, "train_info/time_within_train_step": 27.696478843688965, "step": 1116}
{"train_info/time_between_train_steps": 0.005136966705322266, "step": 1116}
{"info/global_step": 1117, "train_info/time_within_train_step": 27.686715126037598, "step": 1117}
{"train_info/time_between_train_steps": 0.005037546157836914, "step": 1117}
{"info/global_step": 1118, "train_info/time_within_train_step": 27.836971521377563, "step": 1118}
{"train_info/time_between_train_steps": 0.005316734313964844, "step": 1118}
{"info/global_step": 1119, "train_info/time_within_train_step": 28.03602147102356, "step": 1119}
{"train_info/time_between_train_steps": 0.004899740219116211, "step": 1119}
{"info/global_step": 1120, "train_info/time_within_train_step": 28.90098738670349, "step": 1120}
{"train_info/time_between_train_steps": 0.005036354064941406, "step": 1120}
{"info/global_step": 1121, "train_info/time_within_train_step": 27.708167552947998, "step": 1121}
{"train_info/time_between_train_steps": 0.004911184310913086, "step": 1121}
{"info/global_step": 1122, "train_info/time_within_train_step": 27.735175848007202, "step": 1122}
{"train_info/time_between_train_steps": 0.005074501037597656, "step": 1122}
{"info/global_step": 1123, "train_info/time_within_train_step": 27.688118934631348, "step": 1123}
{"train_info/time_between_train_steps": 0.005179405212402344, "step": 1123}
{"info/global_step": 1124, "train_info/time_within_train_step": 27.746726989746094, "step": 1124}
{"train_info/time_between_train_steps": 0.0060520172119140625, "step": 1124}
{"info/global_step": 1125, "train_info/time_within_train_step": 27.70869493484497, "step": 1125}
{"train_info/time_between_train_steps": 0.004938364028930664, "step": 1125}
{"info/global_step": 1126, "train_info/time_within_train_step": 27.744354724884033, "step": 1126}
{"train_info/time_between_train_steps": 0.005226850509643555, "step": 1126}
{"info/global_step": 1127, "train_info/time_within_train_step": 27.699812173843384, "step": 1127}
{"train_info/time_between_train_steps": 0.005067110061645508, "step": 1127}
{"info/global_step": 1128, "train_info/time_within_train_step": 27.692742109298706, "step": 1128}
{"train_info/time_between_train_steps": 0.00508880615234375, "step": 1128}
{"info/global_step": 1129, "train_info/time_within_train_step": 27.738450288772583, "step": 1129}
{"train_info/time_between_train_steps": 0.0048291683197021484, "step": 1129}
{"info/global_step": 1130, "train_info/time_within_train_step": 27.684617042541504, "step": 1130}
{"train_info/time_between_train_steps": 0.005114078521728516, "step": 1130}
{"info/global_step": 1131, "train_info/time_within_train_step": 27.7275333404541, "step": 1131}
{"train_info/time_between_train_steps": 0.005097627639770508, "step": 1131}
{"info/global_step": 1132, "train_info/time_within_train_step": 27.714468479156494, "step": 1132}
{"train_info/time_between_train_steps": 0.005156040191650391, "step": 1132}
{"info/global_step": 1133, "train_info/time_within_train_step": 27.846184015274048, "step": 1133}
{"train_info/time_between_train_steps": 0.00514531135559082, "step": 1133}
{"info/global_step": 1134, "train_info/time_within_train_step": 27.755210876464844, "step": 1134}
{"train_info/time_between_train_steps": 0.005201578140258789, "step": 1134}
{"train_info/time_between_train_steps": 29.83916997909546, "step": 1134}
{"info/global_step": 1135, "train_info/time_within_train_step": 27.697821140289307, "step": 1135}
{"train_info/time_between_train_steps": 0.005738019943237305, "step": 1135}
{"info/global_step": 1136, "train_info/time_within_train_step": 27.847658395767212, "step": 1136}
{"train_info/time_between_train_steps": 0.00481104850769043, "step": 1136}
{"info/global_step": 1137, "train_info/time_within_train_step": 27.68674087524414, "step": 1137}
{"train_info/time_between_train_steps": 0.004817008972167969, "step": 1137}
{"info/global_step": 1138, "train_info/time_within_train_step": 27.867809534072876, "step": 1138}
{"train_info/time_between_train_steps": 0.0051021575927734375, "step": 1138}
{"info/global_step": 1139, "train_info/time_within_train_step": 27.762470483779907, "step": 1139}
{"train_info/time_between_train_steps": 0.005422830581665039, "step": 1139}
{"info/global_step": 1140, "train_info/time_within_train_step": 27.887553453445435, "step": 1140}
{"train_info/time_between_train_steps": 0.01693558692932129, "step": 1140}
{"info/global_step": 1141, "train_info/time_within_train_step": 27.73496985435486, "step": 1141}
{"train_info/time_between_train_steps": 0.005130767822265625, "step": 1141}
{"info/global_step": 1142, "train_info/time_within_train_step": 27.759283781051636, "step": 1142}
{"train_info/time_between_train_steps": 0.0051577091217041016, "step": 1142}
{"info/global_step": 1143, "train_info/time_within_train_step": 27.710222959518433, "step": 1143}
{"train_info/time_between_train_steps": 0.004961252212524414, "step": 1143}
{"info/global_step": 1144, "train_info/time_within_train_step": 27.687845945358276, "step": 1144}
{"train_info/time_between_train_steps": 0.0058765411376953125, "step": 1144}
{"info/global_step": 1145, "train_info/time_within_train_step": 27.707916736602783, "step": 1145}
{"train_info/time_between_train_steps": 0.004926919937133789, "step": 1145}
{"info/global_step": 1146, "train_info/time_within_train_step": 27.685908555984497, "step": 1146}
{"train_info/time_between_train_steps": 0.00485682487487793, "step": 1146}
{"info/global_step": 1147, "train_info/time_within_train_step": 27.72572922706604, "step": 1147}
{"train_info/time_between_train_steps": 0.004899263381958008, "step": 1147}
{"info/global_step": 1148, "train_info/time_within_train_step": 27.76492977142334, "step": 1148}
{"train_info/time_between_train_steps": 0.009741544723510742, "step": 1148}
{"info/global_step": 1149, "train_info/time_within_train_step": 27.723357439041138, "step": 1149}
{"train_info/time_between_train_steps": 0.004979610443115234, "step": 1149}
{"info/global_step": 1150, "train_info/time_within_train_step": 27.695191621780396, "step": 1150}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1740858080, "_runtime": 34029}, "step": 1150}
{"logs": {"train/loss": 3.1114, "train/learning_rate": 2.7777777777777772e-05, "train/epoch": 42.01, "_timestamp": 1740858080, "_runtime": 34029}, "step": 1150}
{"train_info/time_between_train_steps": 0.02635049819946289, "step": 1150}
{"info/global_step": 1151, "train_info/time_within_train_step": 27.67681336402893, "step": 1151}
{"train_info/time_between_train_steps": 0.004891157150268555, "step": 1151}
{"info/global_step": 1152, "train_info/time_within_train_step": 27.693902492523193, "step": 1152}
{"train_info/time_between_train_steps": 0.00596928596496582, "step": 1152}
{"info/global_step": 1153, "train_info/time_within_train_step": 27.69721508026123, "step": 1153}
{"train_info/time_between_train_steps": 0.00495457649230957, "step": 1153}
{"info/global_step": 1154, "train_info/time_within_train_step": 27.68316340446472, "step": 1154}
{"train_info/time_between_train_steps": 0.005010843276977539, "step": 1154}
{"info/global_step": 1155, "train_info/time_within_train_step": 27.68389368057251, "step": 1155}
{"train_info/time_between_train_steps": 0.005175352096557617, "step": 1155}
{"info/global_step": 1156, "train_info/time_within_train_step": 27.734208583831787, "step": 1156}
{"train_info/time_between_train_steps": 0.005148887634277344, "step": 1156}
{"info/global_step": 1157, "train_info/time_within_train_step": 27.703547716140747, "step": 1157}
{"train_info/time_between_train_steps": 0.005231618881225586, "step": 1157}
{"info/global_step": 1158, "train_info/time_within_train_step": 27.72550940513611, "step": 1158}
{"train_info/time_between_train_steps": 0.005006551742553711, "step": 1158}
{"info/global_step": 1159, "train_info/time_within_train_step": 27.690680503845215, "step": 1159}
{"train_info/time_between_train_steps": 0.0054171085357666016, "step": 1159}
{"info/global_step": 1160, "train_info/time_within_train_step": 27.73633646965027, "step": 1160}
{"train_info/time_between_train_steps": 0.0052683353424072266, "step": 1160}
{"info/global_step": 1161, "train_info/time_within_train_step": 27.72842502593994, "step": 1161}
{"train_info/time_between_train_steps": 0.005506992340087891, "step": 1161}
{"train_info/time_between_train_steps": 29.790043115615845, "step": 1161}
{"info/global_step": 1162, "train_info/time_within_train_step": 27.7026150226593, "step": 1162}
{"train_info/time_between_train_steps": 0.004858493804931641, "step": 1162}
{"info/global_step": 1163, "train_info/time_within_train_step": 27.970237731933594, "step": 1163}
{"train_info/time_between_train_steps": 0.00524449348449707, "step": 1163}
{"info/global_step": 1164, "train_info/time_within_train_step": 27.69316864013672, "step": 1164}
{"train_info/time_between_train_steps": 0.005135774612426758, "step": 1164}
{"info/global_step": 1165, "train_info/time_within_train_step": 27.819489002227783, "step": 1165}
{"train_info/time_between_train_steps": 0.0052144527435302734, "step": 1165}
{"info/global_step": 1166, "train_info/time_within_train_step": 27.705933332443237, "step": 1166}
{"train_info/time_between_train_steps": 0.004927158355712891, "step": 1166}
{"info/global_step": 1167, "train_info/time_within_train_step": 27.819119453430176, "step": 1167}
{"train_info/time_between_train_steps": 0.00518345832824707, "step": 1167}
{"info/global_step": 1168, "train_info/time_within_train_step": 27.758617877960205, "step": 1168}
{"train_info/time_between_train_steps": 0.00533294677734375, "step": 1168}
{"info/global_step": 1169, "train_info/time_within_train_step": 27.79144310951233, "step": 1169}
{"train_info/time_between_train_steps": 0.005267620086669922, "step": 1169}
{"info/global_step": 1170, "train_info/time_within_train_step": 27.737929582595825, "step": 1170}
{"train_info/time_between_train_steps": 0.0057294368743896484, "step": 1170}
{"info/global_step": 1171, "train_info/time_within_train_step": 27.70017671585083, "step": 1171}
{"train_info/time_between_train_steps": 0.0049936771392822266, "step": 1171}
{"info/global_step": 1172, "train_info/time_within_train_step": 27.740699291229248, "step": 1172}
{"train_info/time_between_train_steps": 0.004912614822387695, "step": 1172}
{"info/global_step": 1173, "train_info/time_within_train_step": 27.68489980697632, "step": 1173}
{"train_info/time_between_train_steps": 0.004923343658447266, "step": 1173}
{"info/global_step": 1174, "train_info/time_within_train_step": 27.72490406036377, "step": 1174}
{"train_info/time_between_train_steps": 0.005075931549072266, "step": 1174}
{"info/global_step": 1175, "train_info/time_within_train_step": 27.68814754486084, "step": 1175}
{"train_info/time_between_train_steps": 0.004799604415893555, "step": 1175}
{"info/global_step": 1176, "train_info/time_within_train_step": 27.722071409225464, "step": 1176}
{"train_info/time_between_train_steps": 0.0052225589752197266, "step": 1176}
{"info/global_step": 1177, "train_info/time_within_train_step": 27.688185453414917, "step": 1177}
{"train_info/time_between_train_steps": 0.0050847530364990234, "step": 1177}
{"info/global_step": 1178, "train_info/time_within_train_step": 27.769520044326782, "step": 1178}
{"train_info/time_between_train_steps": 0.0049211978912353516, "step": 1178}
{"info/global_step": 1179, "train_info/time_within_train_step": 27.696720123291016, "step": 1179}
{"train_info/time_between_train_steps": 0.0050046443939208984, "step": 1179}
{"info/global_step": 1180, "train_info/time_within_train_step": 27.69837260246277, "step": 1180}
{"train_info/time_between_train_steps": 0.005074024200439453, "step": 1180}
{"info/global_step": 1181, "train_info/time_within_train_step": 27.717630863189697, "step": 1181}
{"train_info/time_between_train_steps": 0.004993915557861328, "step": 1181}
{"info/global_step": 1182, "train_info/time_within_train_step": 27.69912576675415, "step": 1182}
{"train_info/time_between_train_steps": 0.005126476287841797, "step": 1182}
{"info/global_step": 1183, "train_info/time_within_train_step": 27.730365753173828, "step": 1183}
{"train_info/time_between_train_steps": 0.004946470260620117, "step": 1183}
{"info/global_step": 1184, "train_info/time_within_train_step": 27.701728343963623, "step": 1184}
{"train_info/time_between_train_steps": 0.004911899566650391, "step": 1184}
{"info/global_step": 1185, "train_info/time_within_train_step": 27.73612904548645, "step": 1185}
{"train_info/time_between_train_steps": 0.00519871711730957, "step": 1185}
{"info/global_step": 1186, "train_info/time_within_train_step": 27.694844245910645, "step": 1186}
{"train_info/time_between_train_steps": 0.005022287368774414, "step": 1186}
{"info/global_step": 1187, "train_info/time_within_train_step": 27.734578132629395, "step": 1187}
{"train_info/time_between_train_steps": 0.005408287048339844, "step": 1187}
{"info/global_step": 1188, "train_info/time_within_train_step": 27.711532592773438, "step": 1188}
{"train_info/time_between_train_steps": 0.0056231021881103516, "step": 1188}
{"train_info/time_between_train_steps": 29.976243495941162, "step": 1188}
{"info/global_step": 1189, "train_info/time_within_train_step": 27.691545724868774, "step": 1189}
{"train_info/time_between_train_steps": 0.005637168884277344, "step": 1189}
{"info/global_step": 1190, "train_info/time_within_train_step": 27.8354971408844, "step": 1190}
{"train_info/time_between_train_steps": 0.005497455596923828, "step": 1190}
{"info/global_step": 1191, "train_info/time_within_train_step": 27.717230081558228, "step": 1191}
{"train_info/time_between_train_steps": 0.005144596099853516, "step": 1191}
{"info/global_step": 1192, "train_info/time_within_train_step": 27.81442618370056, "step": 1192}
{"train_info/time_between_train_steps": 0.00510406494140625, "step": 1192}
{"info/global_step": 1193, "train_info/time_within_train_step": 27.837268829345703, "step": 1193}
{"train_info/time_between_train_steps": 0.005037784576416016, "step": 1193}
{"info/global_step": 1194, "train_info/time_within_train_step": 27.85683298110962, "step": 1194}
{"train_info/time_between_train_steps": 0.005466461181640625, "step": 1194}
{"info/global_step": 1195, "train_info/time_within_train_step": 27.75145387649536, "step": 1195}
{"train_info/time_between_train_steps": 0.00521087646484375, "step": 1195}
{"info/global_step": 1196, "train_info/time_within_train_step": 27.760989904403687, "step": 1196}
{"train_info/time_between_train_steps": 0.005158662796020508, "step": 1196}
{"info/global_step": 1197, "train_info/time_within_train_step": 27.6898353099823, "step": 1197}
{"train_info/time_between_train_steps": 0.004963874816894531, "step": 1197}
{"info/global_step": 1198, "train_info/time_within_train_step": 27.672107458114624, "step": 1198}
{"train_info/time_between_train_steps": 0.004807233810424805, "step": 1198}
{"info/global_step": 1199, "train_info/time_within_train_step": 27.719714641571045, "step": 1199}
{"train_info/time_between_train_steps": 0.00517582893371582, "step": 1199}
{"info/global_step": 1200, "train_info/time_within_train_step": 27.68014931678772, "step": 1200}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1740859528, "_runtime": 35477}, "step": 1200}
{"logs": {"train/loss": 3.0867, "train/learning_rate": 0.0, "train/epoch": 44.01, "_timestamp": 1740859528, "_runtime": 35477}, "step": 1200}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1740859569, "_runtime": 35518}, "step": 1200}
{"logs": {"train/train_runtime": 35519.5303, "train/train_samples_per_second": 17.298, "train/train_steps_per_second": 0.034, "train/total_flos": 3.32296573943808e+17, "train/train_loss": 4.049262095292409, "train/epoch": 44.01, "_timestamp": 1740859569, "_runtime": 35518}, "step": 1200}
{"train_info": {"train_info/memory_allocated": 1922.4453125, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1740859599, "_runtime": 35548}, "step": 1200}
{"logs": {"eval/loss": 4.187204837799072, "eval/runtime": 5.6239, "eval/samples_per_second": 36.096, "eval/steps_per_second": 2.312, "train/epoch": 44.01, "_timestamp": 1740859599, "_runtime": 35548}, "step": 1200}
{"train_info": {"train_info/memory_allocated": 1922.4453125, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1740859600, "_runtime": 35549}, "step": 1200}
{"logs": {"eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_loss": 4.187204837799072, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_ppl": 65.83850422635916, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_runtime": 5.6239, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_samples_per_second": 36.096, "train/epoch": 44.01, "_timestamp": 1740859600, "_runtime": 35549}, "step": 1200}