ZH_GPT2 / metrics.json
xiulinyang's picture
Adding model checkpoints and config files
ad3f244
{"num_parameters": 102068736, "trainable_parameters": 102068736, "step": 0}
{"train_info/time_between_train_steps": 3.325666904449463, "step": 0}
{"info/global_step": 1, "train_info/time_within_train_step": 25.406368255615234, "step": 1}
{"train_info": {"train_info/memory_allocated": 1581.5546875, "train_info/memory_max_allocated": 17273.5732421875, "train_info/memory_reserved": 18442.0, "train_info/memory_max_reserved": 18442.0, "_timestamp": 1734206971, "_runtime": 33}, "step": 1}
{"logs": {"train/loss": 10.1084, "train/learning_rate": 4.9999999999999996e-06, "train/epoch": 0.0, "_timestamp": 1734206971, "_runtime": 33}, "step": 1}
{"train_info/time_between_train_steps": 0.008052349090576172, "step": 1}
{"info/global_step": 2, "train_info/time_within_train_step": 25.160895586013794, "step": 2}
{"train_info/time_between_train_steps": 0.006456851959228516, "step": 2}
{"info/global_step": 3, "train_info/time_within_train_step": 24.865103721618652, "step": 3}
{"train_info/time_between_train_steps": 0.0057446956634521484, "step": 3}
{"info/global_step": 4, "train_info/time_within_train_step": 25.059681177139282, "step": 4}
{"train_info/time_between_train_steps": 0.005551576614379883, "step": 4}
{"info/global_step": 5, "train_info/time_within_train_step": 25.307673454284668, "step": 5}
{"train_info/time_between_train_steps": 0.007093906402587891, "step": 5}
{"info/global_step": 6, "train_info/time_within_train_step": 25.492204189300537, "step": 6}
{"train_info/time_between_train_steps": 0.00558781623840332, "step": 6}
{"info/global_step": 7, "train_info/time_within_train_step": 24.92021656036377, "step": 7}
{"train_info/time_between_train_steps": 0.005933284759521484, "step": 7}
{"info/global_step": 8, "train_info/time_within_train_step": 25.128674745559692, "step": 8}
{"train_info/time_between_train_steps": 0.005925893783569336, "step": 8}
{"info/global_step": 9, "train_info/time_within_train_step": 25.122132778167725, "step": 9}
{"train_info/time_between_train_steps": 0.0053446292877197266, "step": 9}
{"info/global_step": 10, "train_info/time_within_train_step": 25.140045642852783, "step": 10}
{"train_info/time_between_train_steps": 0.0060176849365234375, "step": 10}
{"info/global_step": 11, "train_info/time_within_train_step": 24.90731716156006, "step": 11}
{"train_info/time_between_train_steps": 0.006730794906616211, "step": 11}
{"info/global_step": 12, "train_info/time_within_train_step": 25.071826934814453, "step": 12}
{"train_info/time_between_train_steps": 0.005986452102661133, "step": 12}
{"info/global_step": 13, "train_info/time_within_train_step": 24.902277946472168, "step": 13}
{"train_info/time_between_train_steps": 0.005963325500488281, "step": 13}
{"info/global_step": 14, "train_info/time_within_train_step": 25.178427934646606, "step": 14}
{"train_info/time_between_train_steps": 0.00610041618347168, "step": 14}
{"info/global_step": 15, "train_info/time_within_train_step": 24.862053394317627, "step": 15}
{"train_info/time_between_train_steps": 0.005817890167236328, "step": 15}
{"info/global_step": 16, "train_info/time_within_train_step": 25.208113193511963, "step": 16}
{"train_info/time_between_train_steps": 0.010947942733764648, "step": 16}
{"info/global_step": 17, "train_info/time_within_train_step": 24.899478673934937, "step": 17}
{"train_info/time_between_train_steps": 0.005217552185058594, "step": 17}
{"info/global_step": 18, "train_info/time_within_train_step": 24.84860873222351, "step": 18}
{"train_info/time_between_train_steps": 0.007694244384765625, "step": 18}
{"info/global_step": 19, "train_info/time_within_train_step": 24.846209049224854, "step": 19}
{"train_info/time_between_train_steps": 0.00541996955871582, "step": 19}
{"info/global_step": 20, "train_info/time_within_train_step": 24.845118522644043, "step": 20}
{"train_info/time_between_train_steps": 0.00536036491394043, "step": 20}
{"info/global_step": 21, "train_info/time_within_train_step": 24.832807779312134, "step": 21}
{"train_info/time_between_train_steps": 0.005287647247314453, "step": 21}
{"info/global_step": 22, "train_info/time_within_train_step": 24.922903776168823, "step": 22}
{"train_info/time_between_train_steps": 0.005577564239501953, "step": 22}
{"info/global_step": 23, "train_info/time_within_train_step": 24.87640118598938, "step": 23}
{"train_info/time_between_train_steps": 0.011613130569458008, "step": 23}
{"info/global_step": 24, "train_info/time_within_train_step": 25.007306814193726, "step": 24}
{"train_info/time_between_train_steps": 0.005690336227416992, "step": 24}
{"info/global_step": 25, "train_info/time_within_train_step": 24.888710260391235, "step": 25}
{"train_info/time_between_train_steps": 0.0062487125396728516, "step": 25}
{"info/global_step": 26, "train_info/time_within_train_step": 25.036595582962036, "step": 26}
{"train_info/time_between_train_steps": 0.009528160095214844, "step": 26}
{"info/global_step": 27, "train_info/time_within_train_step": 24.911707162857056, "step": 27}
{"train_info/time_between_train_steps": 0.01253509521484375, "step": 27}
{"info/global_step": 28, "train_info/time_within_train_step": 24.92010498046875, "step": 28}
{"train_info/time_between_train_steps": 0.010548591613769531, "step": 28}
{"info/global_step": 29, "train_info/time_within_train_step": 24.87119960784912, "step": 29}
{"train_info/time_between_train_steps": 0.0054743289947509766, "step": 29}
{"info/global_step": 30, "train_info/time_within_train_step": 24.92220711708069, "step": 30}
{"train_info/time_between_train_steps": 0.005434513092041016, "step": 30}
{"info/global_step": 31, "train_info/time_within_train_step": 24.896255493164062, "step": 31}
{"train_info/time_between_train_steps": 0.0066487789154052734, "step": 31}
{"info/global_step": 32, "train_info/time_within_train_step": 24.940733432769775, "step": 32}
{"train_info/time_between_train_steps": 0.005598545074462891, "step": 32}
{"info/global_step": 33, "train_info/time_within_train_step": 24.979548454284668, "step": 33}
{"train_info/time_between_train_steps": 0.005549430847167969, "step": 33}
{"info/global_step": 34, "train_info/time_within_train_step": 24.91555118560791, "step": 34}
{"train_info/time_between_train_steps": 0.00542449951171875, "step": 34}
{"info/global_step": 35, "train_info/time_within_train_step": 24.9018714427948, "step": 35}
{"train_info/time_between_train_steps": 0.00621485710144043, "step": 35}
{"info/global_step": 36, "train_info/time_within_train_step": 25.000617742538452, "step": 36}
{"train_info/time_between_train_steps": 0.00643157958984375, "step": 36}
{"train_info/time_between_train_steps": 13.162453889846802, "step": 36}
{"info/global_step": 37, "train_info/time_within_train_step": 24.87821674346924, "step": 37}
{"train_info/time_between_train_steps": 0.005349636077880859, "step": 37}
{"info/global_step": 38, "train_info/time_within_train_step": 25.160878658294678, "step": 38}
{"train_info/time_between_train_steps": 0.010500669479370117, "step": 38}
{"info/global_step": 39, "train_info/time_within_train_step": 24.87971806526184, "step": 39}
{"train_info/time_between_train_steps": 0.005312681198120117, "step": 39}
{"info/global_step": 40, "train_info/time_within_train_step": 25.0943021774292, "step": 40}
{"train_info/time_between_train_steps": 0.005498647689819336, "step": 40}
{"info/global_step": 41, "train_info/time_within_train_step": 24.94641399383545, "step": 41}
{"train_info/time_between_train_steps": 0.006617546081542969, "step": 41}
{"info/global_step": 42, "train_info/time_within_train_step": 25.059454202651978, "step": 42}
{"train_info/time_between_train_steps": 0.0062334537506103516, "step": 42}
{"info/global_step": 43, "train_info/time_within_train_step": 24.94077491760254, "step": 43}
{"train_info/time_between_train_steps": 0.012566089630126953, "step": 43}
{"info/global_step": 44, "train_info/time_within_train_step": 25.056201696395874, "step": 44}
{"train_info/time_between_train_steps": 0.005408287048339844, "step": 44}
{"info/global_step": 45, "train_info/time_within_train_step": 24.928580284118652, "step": 45}
{"train_info/time_between_train_steps": 0.0058557987213134766, "step": 45}
{"info/global_step": 46, "train_info/time_within_train_step": 25.18645429611206, "step": 46}
{"train_info/time_between_train_steps": 0.011163949966430664, "step": 46}
{"info/global_step": 47, "train_info/time_within_train_step": 25.25889492034912, "step": 47}
{"train_info/time_between_train_steps": 0.011180639266967773, "step": 47}
{"info/global_step": 48, "train_info/time_within_train_step": 25.100855112075806, "step": 48}
{"train_info/time_between_train_steps": 0.011225461959838867, "step": 48}
{"info/global_step": 49, "train_info/time_within_train_step": 24.90419030189514, "step": 49}
{"train_info/time_between_train_steps": 0.005940675735473633, "step": 49}
{"info/global_step": 50, "train_info/time_within_train_step": 25.061166286468506, "step": 50}
{"train_info": {"train_info/memory_allocated": 1581.5546875, "train_info/memory_max_allocated": 18057.0224609375, "train_info/memory_reserved": 19104.0, "train_info/memory_max_reserved": 19104.0, "_timestamp": 1734208210, "_runtime": 1272}, "step": 50}
{"logs": {"train/loss": 6.9633, "train/learning_rate": 0.00025, "train/epoch": 1.01, "_timestamp": 1734208210, "_runtime": 1272}, "step": 50}
{"train_info/time_between_train_steps": 0.008846282958984375, "step": 50}
{"info/global_step": 51, "train_info/time_within_train_step": 24.914175987243652, "step": 51}
{"train_info/time_between_train_steps": 0.005938291549682617, "step": 51}
{"info/global_step": 52, "train_info/time_within_train_step": 24.992482900619507, "step": 52}
{"train_info/time_between_train_steps": 0.008324384689331055, "step": 52}
{"info/global_step": 53, "train_info/time_within_train_step": 24.906115531921387, "step": 53}
{"train_info/time_between_train_steps": 0.005383014678955078, "step": 53}
{"info/global_step": 54, "train_info/time_within_train_step": 24.82204270362854, "step": 54}
{"train_info/time_between_train_steps": 0.00536346435546875, "step": 54}
{"info/global_step": 55, "train_info/time_within_train_step": 24.914961099624634, "step": 55}
{"train_info/time_between_train_steps": 0.0054149627685546875, "step": 55}
{"info/global_step": 56, "train_info/time_within_train_step": 24.8582923412323, "step": 56}
{"train_info/time_between_train_steps": 0.005262136459350586, "step": 56}
{"info/global_step": 57, "train_info/time_within_train_step": 24.83730459213257, "step": 57}
{"train_info/time_between_train_steps": 0.006285905838012695, "step": 57}
{"info/global_step": 58, "train_info/time_within_train_step": 24.815717697143555, "step": 58}
{"train_info/time_between_train_steps": 0.005408525466918945, "step": 58}
{"info/global_step": 59, "train_info/time_within_train_step": 24.9020357131958, "step": 59}
{"train_info/time_between_train_steps": 0.011100053787231445, "step": 59}
{"info/global_step": 60, "train_info/time_within_train_step": 24.907873392105103, "step": 60}
{"train_info/time_between_train_steps": 0.0056378841400146484, "step": 60}
{"info/global_step": 61, "train_info/time_within_train_step": 24.900803565979004, "step": 61}
{"train_info/time_between_train_steps": 0.005426645278930664, "step": 61}
{"info/global_step": 62, "train_info/time_within_train_step": 24.841233491897583, "step": 62}
{"train_info/time_between_train_steps": 0.005470752716064453, "step": 62}
{"info/global_step": 63, "train_info/time_within_train_step": 24.95102071762085, "step": 63}
{"train_info/time_between_train_steps": 0.01322627067565918, "step": 63}
{"info/global_step": 64, "train_info/time_within_train_step": 24.8836669921875, "step": 64}
{"train_info/time_between_train_steps": 0.010794401168823242, "step": 64}
{"info/global_step": 65, "train_info/time_within_train_step": 24.850148916244507, "step": 65}
{"train_info/time_between_train_steps": 0.005468130111694336, "step": 65}
{"info/global_step": 66, "train_info/time_within_train_step": 24.910802841186523, "step": 66}
{"train_info/time_between_train_steps": 0.005391836166381836, "step": 66}
{"info/global_step": 67, "train_info/time_within_train_step": 24.91977572441101, "step": 67}
{"train_info/time_between_train_steps": 0.0054018497467041016, "step": 67}
{"info/global_step": 68, "train_info/time_within_train_step": 24.844653606414795, "step": 68}
{"train_info/time_between_train_steps": 0.0055675506591796875, "step": 68}
{"info/global_step": 69, "train_info/time_within_train_step": 24.96964931488037, "step": 69}
{"train_info/time_between_train_steps": 0.0056912899017333984, "step": 69}
{"info/global_step": 70, "train_info/time_within_train_step": 24.915760040283203, "step": 70}
{"train_info/time_between_train_steps": 0.010409116744995117, "step": 70}
{"info/global_step": 71, "train_info/time_within_train_step": 25.1025869846344, "step": 71}
{"train_info/time_between_train_steps": 0.006013393402099609, "step": 71}
{"info/global_step": 72, "train_info/time_within_train_step": 25.00511622428894, "step": 72}
{"train_info/time_between_train_steps": 0.006620168685913086, "step": 72}
{"train_info/time_between_train_steps": 13.340702772140503, "step": 72}
{"info/global_step": 73, "train_info/time_within_train_step": 24.849769592285156, "step": 73}
{"train_info/time_between_train_steps": 0.005877971649169922, "step": 73}
{"info/global_step": 74, "train_info/time_within_train_step": 25.08607316017151, "step": 74}
{"train_info/time_between_train_steps": 0.005627155303955078, "step": 74}
{"info/global_step": 75, "train_info/time_within_train_step": 24.855902194976807, "step": 75}
{"train_info/time_between_train_steps": 0.005429744720458984, "step": 75}
{"info/global_step": 76, "train_info/time_within_train_step": 25.11769199371338, "step": 76}
{"train_info/time_between_train_steps": 0.005606174468994141, "step": 76}
{"info/global_step": 77, "train_info/time_within_train_step": 24.893296480178833, "step": 77}
{"train_info/time_between_train_steps": 0.0055735111236572266, "step": 77}
{"info/global_step": 78, "train_info/time_within_train_step": 25.16429567337036, "step": 78}
{"train_info/time_between_train_steps": 0.007089138031005859, "step": 78}
{"info/global_step": 79, "train_info/time_within_train_step": 24.893405199050903, "step": 79}
{"train_info/time_between_train_steps": 0.005434513092041016, "step": 79}
{"info/global_step": 80, "train_info/time_within_train_step": 25.04255771636963, "step": 80}
{"train_info/time_between_train_steps": 0.012215852737426758, "step": 80}
{"info/global_step": 81, "train_info/time_within_train_step": 24.974236488342285, "step": 81}
{"train_info/time_between_train_steps": 0.01126551628112793, "step": 81}
{"info/global_step": 82, "train_info/time_within_train_step": 25.094693183898926, "step": 82}
{"train_info/time_between_train_steps": 0.006161212921142578, "step": 82}
{"info/global_step": 83, "train_info/time_within_train_step": 25.02604103088379, "step": 83}
{"train_info/time_between_train_steps": 0.005602359771728516, "step": 83}
{"info/global_step": 84, "train_info/time_within_train_step": 25.089378595352173, "step": 84}
{"train_info/time_between_train_steps": 0.00556635856628418, "step": 84}
{"info/global_step": 85, "train_info/time_within_train_step": 24.98328685760498, "step": 85}
{"train_info/time_between_train_steps": 0.0072634220123291016, "step": 85}
{"info/global_step": 86, "train_info/time_within_train_step": 25.138654232025146, "step": 86}
{"train_info/time_between_train_steps": 0.010809183120727539, "step": 86}
{"info/global_step": 87, "train_info/time_within_train_step": 24.96003246307373, "step": 87}
{"train_info/time_between_train_steps": 0.006005287170410156, "step": 87}
{"info/global_step": 88, "train_info/time_within_train_step": 25.081493854522705, "step": 88}
{"train_info/time_between_train_steps": 0.005613803863525391, "step": 88}
{"info/global_step": 89, "train_info/time_within_train_step": 24.903080701828003, "step": 89}
{"train_info/time_between_train_steps": 0.005251646041870117, "step": 89}
{"info/global_step": 90, "train_info/time_within_train_step": 24.86359691619873, "step": 90}
{"train_info/time_between_train_steps": 0.005402803421020508, "step": 90}
{"info/global_step": 91, "train_info/time_within_train_step": 24.849433660507202, "step": 91}
{"train_info/time_between_train_steps": 0.005277395248413086, "step": 91}
{"info/global_step": 92, "train_info/time_within_train_step": 24.825590133666992, "step": 92}
{"train_info/time_between_train_steps": 0.010381221771240234, "step": 92}
{"info/global_step": 93, "train_info/time_within_train_step": 25.070675134658813, "step": 93}
{"train_info/time_between_train_steps": 0.0063593387603759766, "step": 93}
{"info/global_step": 94, "train_info/time_within_train_step": 24.862594604492188, "step": 94}
{"train_info/time_between_train_steps": 0.005373239517211914, "step": 94}
{"info/global_step": 95, "train_info/time_within_train_step": 24.884901523590088, "step": 95}
{"train_info/time_between_train_steps": 0.006795167922973633, "step": 95}
{"info/global_step": 96, "train_info/time_within_train_step": 24.91721224784851, "step": 96}
{"train_info/time_between_train_steps": 0.00624537467956543, "step": 96}
{"info/global_step": 97, "train_info/time_within_train_step": 24.931349992752075, "step": 97}
{"train_info/time_between_train_steps": 0.006420135498046875, "step": 97}
{"info/global_step": 98, "train_info/time_within_train_step": 24.8648099899292, "step": 98}
{"train_info/time_between_train_steps": 0.005453348159790039, "step": 98}
{"info/global_step": 99, "train_info/time_within_train_step": 25.012843370437622, "step": 99}
{"train_info/time_between_train_steps": 0.00517582893371582, "step": 99}
{"info/global_step": 100, "train_info/time_within_train_step": 25.00153613090515, "step": 100}
{"train_info": {"train_info/memory_allocated": 1581.5546875, "train_info/memory_max_allocated": 18057.0224609375, "train_info/memory_reserved": 19104.0, "train_info/memory_max_reserved": 19104.0, "_timestamp": 1734209471, "_runtime": 2533}, "step": 100}
{"logs": {"train/loss": 4.9297, "train/learning_rate": 0.0005, "train/epoch": 2.02, "_timestamp": 1734209471, "_runtime": 2533}, "step": 100}
{"train_info/time_between_train_steps": 2.0369246006011963, "step": 100}
{"info/global_step": 101, "train_info/time_within_train_step": 24.916253328323364, "step": 101}
{"train_info/time_between_train_steps": 0.010499715805053711, "step": 101}
{"info/global_step": 102, "train_info/time_within_train_step": 24.95295262336731, "step": 102}
{"train_info/time_between_train_steps": 0.005132436752319336, "step": 102}
{"info/global_step": 103, "train_info/time_within_train_step": 24.89792537689209, "step": 103}
{"train_info/time_between_train_steps": 0.009358882904052734, "step": 103}
{"info/global_step": 104, "train_info/time_within_train_step": 24.984108924865723, "step": 104}
{"train_info/time_between_train_steps": 0.0053212642669677734, "step": 104}
{"info/global_step": 105, "train_info/time_within_train_step": 24.836453437805176, "step": 105}
{"train_info/time_between_train_steps": 0.005225181579589844, "step": 105}
{"info/global_step": 106, "train_info/time_within_train_step": 24.90648365020752, "step": 106}
{"train_info/time_between_train_steps": 0.005568504333496094, "step": 106}
{"info/global_step": 107, "train_info/time_within_train_step": 24.84886121749878, "step": 107}
{"train_info/time_between_train_steps": 0.0057451725006103516, "step": 107}
{"info/global_step": 108, "train_info/time_within_train_step": 24.922604084014893, "step": 108}
{"train_info/time_between_train_steps": 0.0072138309478759766, "step": 108}
{"train_info/time_between_train_steps": 13.406117916107178, "step": 108}
{"info/global_step": 109, "train_info/time_within_train_step": 25.02498745918274, "step": 109}
{"train_info/time_between_train_steps": 0.0055081844329833984, "step": 109}
{"info/global_step": 110, "train_info/time_within_train_step": 24.95828413963318, "step": 110}
{"train_info/time_between_train_steps": 0.005054473876953125, "step": 110}
{"info/global_step": 111, "train_info/time_within_train_step": 24.904242277145386, "step": 111}
{"train_info/time_between_train_steps": 0.010266542434692383, "step": 111}
{"info/global_step": 112, "train_info/time_within_train_step": 25.00249719619751, "step": 112}
{"train_info/time_between_train_steps": 0.005674123764038086, "step": 112}
{"info/global_step": 113, "train_info/time_within_train_step": 24.939833641052246, "step": 113}
{"train_info/time_between_train_steps": 0.005337238311767578, "step": 113}
{"info/global_step": 114, "train_info/time_within_train_step": 25.067042112350464, "step": 114}
{"train_info/time_between_train_steps": 0.005332469940185547, "step": 114}
{"info/global_step": 115, "train_info/time_within_train_step": 24.883205890655518, "step": 115}
{"train_info/time_between_train_steps": 0.005698204040527344, "step": 115}
{"info/global_step": 116, "train_info/time_within_train_step": 25.128238439559937, "step": 116}
{"train_info/time_between_train_steps": 0.00665283203125, "step": 116}
{"info/global_step": 117, "train_info/time_within_train_step": 24.82863974571228, "step": 117}
{"train_info/time_between_train_steps": 0.005799770355224609, "step": 117}
{"info/global_step": 118, "train_info/time_within_train_step": 25.009989738464355, "step": 118}
{"train_info/time_between_train_steps": 0.0060765743255615234, "step": 118}
{"info/global_step": 119, "train_info/time_within_train_step": 24.844016075134277, "step": 119}
{"train_info/time_between_train_steps": 0.005425453186035156, "step": 119}
{"info/global_step": 120, "train_info/time_within_train_step": 25.02705478668213, "step": 120}
{"train_info/time_between_train_steps": 0.005595684051513672, "step": 120}
{"info/global_step": 121, "train_info/time_within_train_step": 24.919214248657227, "step": 121}
{"train_info/time_between_train_steps": 0.010033130645751953, "step": 121}
{"info/global_step": 122, "train_info/time_within_train_step": 25.005303859710693, "step": 122}
{"train_info/time_between_train_steps": 0.005437374114990234, "step": 122}
{"info/global_step": 123, "train_info/time_within_train_step": 24.94881844520569, "step": 123}
{"train_info/time_between_train_steps": 0.010691642761230469, "step": 123}
{"info/global_step": 124, "train_info/time_within_train_step": 25.055193424224854, "step": 124}
{"train_info/time_between_train_steps": 0.0055124759674072266, "step": 124}
{"info/global_step": 125, "train_info/time_within_train_step": 24.886231899261475, "step": 125}
{"train_info/time_between_train_steps": 0.005133390426635742, "step": 125}
{"info/global_step": 126, "train_info/time_within_train_step": 24.933918952941895, "step": 126}
{"train_info/time_between_train_steps": 0.0052509307861328125, "step": 126}
{"info/global_step": 127, "train_info/time_within_train_step": 24.87064528465271, "step": 127}
{"train_info/time_between_train_steps": 0.0069806575775146484, "step": 127}
{"info/global_step": 128, "train_info/time_within_train_step": 24.918933868408203, "step": 128}
{"train_info/time_between_train_steps": 0.005364656448364258, "step": 128}
{"info/global_step": 129, "train_info/time_within_train_step": 24.893049478530884, "step": 129}
{"train_info/time_between_train_steps": 0.006857633590698242, "step": 129}
{"info/global_step": 130, "train_info/time_within_train_step": 24.938287019729614, "step": 130}
{"train_info/time_between_train_steps": 0.005484104156494141, "step": 130}
{"info/global_step": 131, "train_info/time_within_train_step": 24.91978621482849, "step": 131}
{"train_info/time_between_train_steps": 0.009602546691894531, "step": 131}
{"info/global_step": 132, "train_info/time_within_train_step": 24.88787841796875, "step": 132}
{"train_info/time_between_train_steps": 0.00685572624206543, "step": 132}
{"info/global_step": 133, "train_info/time_within_train_step": 24.849631309509277, "step": 133}
{"train_info/time_between_train_steps": 0.005385398864746094, "step": 133}
{"info/global_step": 134, "train_info/time_within_train_step": 24.97623610496521, "step": 134}
{"train_info/time_between_train_steps": 0.005451202392578125, "step": 134}
{"info/global_step": 135, "train_info/time_within_train_step": 24.84294819831848, "step": 135}
{"train_info/time_between_train_steps": 0.005650043487548828, "step": 135}
{"info/global_step": 136, "train_info/time_within_train_step": 24.933789253234863, "step": 136}
{"train_info/time_between_train_steps": 0.009846687316894531, "step": 136}
{"info/global_step": 137, "train_info/time_within_train_step": 24.863856554031372, "step": 137}
{"train_info/time_between_train_steps": 0.005458354949951172, "step": 137}
{"info/global_step": 138, "train_info/time_within_train_step": 24.858383417129517, "step": 138}
{"train_info/time_between_train_steps": 0.0054700374603271484, "step": 138}
{"info/global_step": 139, "train_info/time_within_train_step": 24.872615098953247, "step": 139}
{"train_info/time_between_train_steps": 0.0055084228515625, "step": 139}
{"info/global_step": 140, "train_info/time_within_train_step": 24.978452920913696, "step": 140}
{"train_info/time_between_train_steps": 0.005413532257080078, "step": 140}
{"info/global_step": 141, "train_info/time_within_train_step": 24.91903066635132, "step": 141}
{"train_info/time_between_train_steps": 0.005554676055908203, "step": 141}
{"info/global_step": 142, "train_info/time_within_train_step": 24.873474836349487, "step": 142}
{"train_info/time_between_train_steps": 0.010571718215942383, "step": 142}
{"info/global_step": 143, "train_info/time_within_train_step": 24.943849802017212, "step": 143}
{"train_info/time_between_train_steps": 0.011824369430541992, "step": 143}
{"info/global_step": 144, "train_info/time_within_train_step": 24.9464430809021, "step": 144}
{"train_info/time_between_train_steps": 0.009253263473510742, "step": 144}
{"train_info/time_between_train_steps": 13.076478719711304, "step": 144}
{"info/global_step": 145, "train_info/time_within_train_step": 24.86982250213623, "step": 145}
{"train_info/time_between_train_steps": 0.005377054214477539, "step": 145}
{"info/global_step": 146, "train_info/time_within_train_step": 24.974772930145264, "step": 146}
{"train_info/time_between_train_steps": 0.005389690399169922, "step": 146}
{"info/global_step": 147, "train_info/time_within_train_step": 24.884573936462402, "step": 147}
{"train_info/time_between_train_steps": 0.005650997161865234, "step": 147}
{"info/global_step": 148, "train_info/time_within_train_step": 25.077871322631836, "step": 148}
{"train_info/time_between_train_steps": 0.008154869079589844, "step": 148}
{"info/global_step": 149, "train_info/time_within_train_step": 24.877070665359497, "step": 149}
{"train_info/time_between_train_steps": 0.010944604873657227, "step": 149}
{"info/global_step": 150, "train_info/time_within_train_step": 25.0344340801239, "step": 150}
{"train_info": {"train_info/memory_allocated": 1581.5546875, "train_info/memory_max_allocated": 18057.0224609375, "train_info/memory_reserved": 19104.0, "train_info/memory_max_reserved": 19104.0, "_timestamp": 1734210746, "_runtime": 3808}, "step": 150}
{"logs": {"train/loss": 4.3196, "train/learning_rate": 0.0005833333333333333, "train/epoch": 4.0, "_timestamp": 1734210746, "_runtime": 3808}, "step": 150}
{"train_info/time_between_train_steps": 0.007256984710693359, "step": 150}
{"info/global_step": 151, "train_info/time_within_train_step": 24.861627101898193, "step": 151}
{"train_info/time_between_train_steps": 0.005614519119262695, "step": 151}
{"info/global_step": 152, "train_info/time_within_train_step": 25.286144256591797, "step": 152}
{"train_info/time_between_train_steps": 0.006071329116821289, "step": 152}
{"info/global_step": 153, "train_info/time_within_train_step": 24.91106677055359, "step": 153}
{"train_info/time_between_train_steps": 0.005959033966064453, "step": 153}
{"info/global_step": 154, "train_info/time_within_train_step": 25.185601949691772, "step": 154}
{"train_info/time_between_train_steps": 0.00549769401550293, "step": 154}
{"info/global_step": 155, "train_info/time_within_train_step": 25.089903593063354, "step": 155}
{"train_info/time_between_train_steps": 0.01040506362915039, "step": 155}
{"info/global_step": 156, "train_info/time_within_train_step": 25.110015153884888, "step": 156}
{"train_info/time_between_train_steps": 0.006028652191162109, "step": 156}
{"info/global_step": 157, "train_info/time_within_train_step": 24.90322208404541, "step": 157}
{"train_info/time_between_train_steps": 0.005911827087402344, "step": 157}
{"info/global_step": 158, "train_info/time_within_train_step": 25.069775581359863, "step": 158}
{"train_info/time_between_train_steps": 0.005621433258056641, "step": 158}
{"info/global_step": 159, "train_info/time_within_train_step": 24.889246940612793, "step": 159}
{"train_info/time_between_train_steps": 0.011209249496459961, "step": 159}
{"info/global_step": 160, "train_info/time_within_train_step": 25.049574375152588, "step": 160}
{"train_info/time_between_train_steps": 0.005481719970703125, "step": 160}
{"info/global_step": 161, "train_info/time_within_train_step": 24.912283658981323, "step": 161}
{"train_info/time_between_train_steps": 0.005211830139160156, "step": 161}
{"info/global_step": 162, "train_info/time_within_train_step": 24.84698510169983, "step": 162}
{"train_info/time_between_train_steps": 0.0052793025970458984, "step": 162}
{"info/global_step": 163, "train_info/time_within_train_step": 24.869690418243408, "step": 163}
{"train_info/time_between_train_steps": 0.005274295806884766, "step": 163}
{"info/global_step": 164, "train_info/time_within_train_step": 24.874542713165283, "step": 164}
{"train_info/time_between_train_steps": 0.009765863418579102, "step": 164}
{"info/global_step": 165, "train_info/time_within_train_step": 24.86597442626953, "step": 165}
{"train_info/time_between_train_steps": 0.010759830474853516, "step": 165}
{"info/global_step": 166, "train_info/time_within_train_step": 24.911798000335693, "step": 166}
{"train_info/time_between_train_steps": 0.005497932434082031, "step": 166}
{"info/global_step": 167, "train_info/time_within_train_step": 24.851471185684204, "step": 167}
{"train_info/time_between_train_steps": 0.010444879531860352, "step": 167}
{"info/global_step": 168, "train_info/time_within_train_step": 24.864485025405884, "step": 168}
{"train_info/time_between_train_steps": 0.006955146789550781, "step": 168}
{"info/global_step": 169, "train_info/time_within_train_step": 24.934401750564575, "step": 169}
{"train_info/time_between_train_steps": 0.006943702697753906, "step": 169}
{"info/global_step": 170, "train_info/time_within_train_step": 24.866469383239746, "step": 170}
{"train_info/time_between_train_steps": 0.005459785461425781, "step": 170}
{"info/global_step": 171, "train_info/time_within_train_step": 25.100874185562134, "step": 171}
{"train_info/time_between_train_steps": 0.005554676055908203, "step": 171}
{"info/global_step": 172, "train_info/time_within_train_step": 24.9100980758667, "step": 172}
{"train_info/time_between_train_steps": 0.005565166473388672, "step": 172}
{"info/global_step": 173, "train_info/time_within_train_step": 24.894034385681152, "step": 173}
{"train_info/time_between_train_steps": 0.0054776668548583984, "step": 173}
{"info/global_step": 174, "train_info/time_within_train_step": 24.953580379486084, "step": 174}
{"train_info/time_between_train_steps": 0.0054318904876708984, "step": 174}
{"info/global_step": 175, "train_info/time_within_train_step": 24.893527030944824, "step": 175}
{"train_info/time_between_train_steps": 0.006974220275878906, "step": 175}
{"info/global_step": 176, "train_info/time_within_train_step": 24.869704008102417, "step": 176}
{"train_info/time_between_train_steps": 0.007455348968505859, "step": 176}
{"info/global_step": 177, "train_info/time_within_train_step": 24.874552488327026, "step": 177}
{"train_info/time_between_train_steps": 0.0065762996673583984, "step": 177}
{"info/global_step": 178, "train_info/time_within_train_step": 24.900020837783813, "step": 178}
{"train_info/time_between_train_steps": 0.005883693695068359, "step": 178}
{"info/global_step": 179, "train_info/time_within_train_step": 25.011664152145386, "step": 179}
{"train_info/time_between_train_steps": 0.007769584655761719, "step": 179}
{"info/global_step": 180, "train_info/time_within_train_step": 24.971932649612427, "step": 180}
{"train_info/time_between_train_steps": 0.007539033889770508, "step": 180}
{"train_info/time_between_train_steps": 13.307325601577759, "step": 180}
{"info/global_step": 181, "train_info/time_within_train_step": 24.86577272415161, "step": 181}
{"train_info/time_between_train_steps": 0.011174201965332031, "step": 181}
{"info/global_step": 182, "train_info/time_within_train_step": 25.07520341873169, "step": 182}
{"train_info/time_between_train_steps": 0.005872249603271484, "step": 182}
{"info/global_step": 183, "train_info/time_within_train_step": 24.873721837997437, "step": 183}
{"train_info/time_between_train_steps": 0.006951808929443359, "step": 183}
{"info/global_step": 184, "train_info/time_within_train_step": 25.032206058502197, "step": 184}
{"train_info/time_between_train_steps": 0.005800962448120117, "step": 184}
{"info/global_step": 185, "train_info/time_within_train_step": 25.009496688842773, "step": 185}
{"train_info/time_between_train_steps": 0.005461215972900391, "step": 185}
{"info/global_step": 186, "train_info/time_within_train_step": 25.162333488464355, "step": 186}
{"train_info/time_between_train_steps": 0.01027822494506836, "step": 186}
{"info/global_step": 187, "train_info/time_within_train_step": 24.87339162826538, "step": 187}
{"train_info/time_between_train_steps": 0.005775928497314453, "step": 187}
{"info/global_step": 188, "train_info/time_within_train_step": 25.025610208511353, "step": 188}
{"train_info/time_between_train_steps": 0.005467414855957031, "step": 188}
{"info/global_step": 189, "train_info/time_within_train_step": 24.906704425811768, "step": 189}
{"train_info/time_between_train_steps": 0.017201900482177734, "step": 189}
{"info/global_step": 190, "train_info/time_within_train_step": 24.997477769851685, "step": 190}
{"train_info/time_between_train_steps": 0.005568504333496094, "step": 190}
{"info/global_step": 191, "train_info/time_within_train_step": 24.919697046279907, "step": 191}
{"train_info/time_between_train_steps": 0.005572319030761719, "step": 191}
{"info/global_step": 192, "train_info/time_within_train_step": 25.048991203308105, "step": 192}
{"train_info/time_between_train_steps": 0.010869979858398438, "step": 192}
{"info/global_step": 193, "train_info/time_within_train_step": 24.878507137298584, "step": 193}
{"train_info/time_between_train_steps": 0.005508899688720703, "step": 193}
{"info/global_step": 194, "train_info/time_within_train_step": 25.07304573059082, "step": 194}
{"train_info/time_between_train_steps": 0.005430698394775391, "step": 194}
{"info/global_step": 195, "train_info/time_within_train_step": 24.917802333831787, "step": 195}
{"train_info/time_between_train_steps": 0.005308866500854492, "step": 195}
{"info/global_step": 196, "train_info/time_within_train_step": 25.011653661727905, "step": 196}
{"train_info/time_between_train_steps": 0.006376504898071289, "step": 196}
{"info/global_step": 197, "train_info/time_within_train_step": 24.91886591911316, "step": 197}
{"train_info/time_between_train_steps": 0.009919404983520508, "step": 197}
{"info/global_step": 198, "train_info/time_within_train_step": 24.855730772018433, "step": 198}
{"train_info/time_between_train_steps": 0.005482912063598633, "step": 198}
{"info/global_step": 199, "train_info/time_within_train_step": 24.803208827972412, "step": 199}
{"train_info/time_between_train_steps": 0.00518798828125, "step": 199}
{"info/global_step": 200, "train_info/time_within_train_step": 24.81581950187683, "step": 200}
{"train_info": {"train_info/memory_allocated": 1581.5546875, "train_info/memory_max_allocated": 18057.0224609375, "train_info/memory_reserved": 19104.0, "train_info/memory_max_reserved": 19104.0, "_timestamp": 1734212008, "_runtime": 5070}, "step": 200}
{"logs": {"train/loss": 4.0137, "train/learning_rate": 0.0005555555555555556, "train/epoch": 5.02, "_timestamp": 1734212008, "_runtime": 5070}, "step": 200}
{"train_info/time_between_train_steps": 1.932051658630371, "step": 200}
{"info/global_step": 201, "train_info/time_within_train_step": 24.88471245765686, "step": 201}
{"train_info/time_between_train_steps": 0.005265712738037109, "step": 201}
{"info/global_step": 202, "train_info/time_within_train_step": 24.909485340118408, "step": 202}
{"train_info/time_between_train_steps": 0.005313396453857422, "step": 202}
{"info/global_step": 203, "train_info/time_within_train_step": 24.886298656463623, "step": 203}
{"train_info/time_between_train_steps": 0.005344867706298828, "step": 203}
{"info/global_step": 204, "train_info/time_within_train_step": 24.822962284088135, "step": 204}
{"train_info/time_between_train_steps": 0.010063409805297852, "step": 204}
{"info/global_step": 205, "train_info/time_within_train_step": 24.824721336364746, "step": 205}
{"train_info/time_between_train_steps": 0.005793094635009766, "step": 205}
{"info/global_step": 206, "train_info/time_within_train_step": 24.84752058982849, "step": 206}
{"train_info/time_between_train_steps": 0.005402803421020508, "step": 206}
{"info/global_step": 207, "train_info/time_within_train_step": 24.90465497970581, "step": 207}
{"train_info/time_between_train_steps": 0.009957313537597656, "step": 207}
{"info/global_step": 208, "train_info/time_within_train_step": 24.883785724639893, "step": 208}
{"train_info/time_between_train_steps": 0.00612187385559082, "step": 208}
{"info/global_step": 209, "train_info/time_within_train_step": 24.86066436767578, "step": 209}
{"train_info/time_between_train_steps": 0.005373716354370117, "step": 209}
{"info/global_step": 210, "train_info/time_within_train_step": 24.862574577331543, "step": 210}
{"train_info/time_between_train_steps": 0.0068624019622802734, "step": 210}
{"info/global_step": 211, "train_info/time_within_train_step": 24.856642484664917, "step": 211}
{"train_info/time_between_train_steps": 0.005285739898681641, "step": 211}
{"info/global_step": 212, "train_info/time_within_train_step": 24.84770941734314, "step": 212}
{"train_info/time_between_train_steps": 0.006346940994262695, "step": 212}
{"info/global_step": 213, "train_info/time_within_train_step": 24.854345321655273, "step": 213}
{"train_info/time_between_train_steps": 0.005914926528930664, "step": 213}
{"info/global_step": 214, "train_info/time_within_train_step": 24.843870162963867, "step": 214}
{"train_info/time_between_train_steps": 0.0055353641510009766, "step": 214}
{"info/global_step": 215, "train_info/time_within_train_step": 24.836204767227173, "step": 215}
{"train_info/time_between_train_steps": 0.005821704864501953, "step": 215}
{"info/global_step": 216, "train_info/time_within_train_step": 24.94162130355835, "step": 216}
{"train_info/time_between_train_steps": 0.006092071533203125, "step": 216}
{"train_info/time_between_train_steps": 13.292507648468018, "step": 216}
{"info/global_step": 217, "train_info/time_within_train_step": 24.885307788848877, "step": 217}
{"train_info/time_between_train_steps": 0.005488157272338867, "step": 217}
{"info/global_step": 218, "train_info/time_within_train_step": 24.997565269470215, "step": 218}
{"train_info/time_between_train_steps": 0.010660648345947266, "step": 218}
{"info/global_step": 219, "train_info/time_within_train_step": 24.899702310562134, "step": 219}
{"train_info/time_between_train_steps": 0.0067348480224609375, "step": 219}
{"info/global_step": 220, "train_info/time_within_train_step": 25.002742528915405, "step": 220}
{"train_info/time_between_train_steps": 0.01683783531188965, "step": 220}
{"info/global_step": 221, "train_info/time_within_train_step": 24.837127923965454, "step": 221}
{"train_info/time_between_train_steps": 0.0071103572845458984, "step": 221}
{"info/global_step": 222, "train_info/time_within_train_step": 25.01784920692444, "step": 222}
{"train_info/time_between_train_steps": 0.005528926849365234, "step": 222}
{"info/global_step": 223, "train_info/time_within_train_step": 24.94238781929016, "step": 223}
{"train_info/time_between_train_steps": 0.01035928726196289, "step": 223}
{"info/global_step": 224, "train_info/time_within_train_step": 25.065098524093628, "step": 224}
{"train_info/time_between_train_steps": 0.005425453186035156, "step": 224}
{"info/global_step": 225, "train_info/time_within_train_step": 24.82388925552368, "step": 225}
{"train_info/time_between_train_steps": 0.00544285774230957, "step": 225}
{"info/global_step": 226, "train_info/time_within_train_step": 25.01997137069702, "step": 226}
{"train_info/time_between_train_steps": 0.0054705142974853516, "step": 226}
{"info/global_step": 227, "train_info/time_within_train_step": 24.893545627593994, "step": 227}
{"train_info/time_between_train_steps": 0.005353212356567383, "step": 227}
{"info/global_step": 228, "train_info/time_within_train_step": 24.96111249923706, "step": 228}
{"train_info/time_between_train_steps": 0.007420778274536133, "step": 228}
{"info/global_step": 229, "train_info/time_within_train_step": 24.862775802612305, "step": 229}
{"train_info/time_between_train_steps": 0.00557708740234375, "step": 229}
{"info/global_step": 230, "train_info/time_within_train_step": 24.940409898757935, "step": 230}
{"train_info/time_between_train_steps": 0.006149768829345703, "step": 230}
{"info/global_step": 231, "train_info/time_within_train_step": 24.882670164108276, "step": 231}
{"train_info/time_between_train_steps": 0.005683422088623047, "step": 231}
{"info/global_step": 232, "train_info/time_within_train_step": 25.110250234603882, "step": 232}
{"train_info/time_between_train_steps": 0.01001882553100586, "step": 232}
{"info/global_step": 233, "train_info/time_within_train_step": 24.96982502937317, "step": 233}
{"train_info/time_between_train_steps": 0.005166530609130859, "step": 233}
{"info/global_step": 234, "train_info/time_within_train_step": 24.893041849136353, "step": 234}
{"train_info/time_between_train_steps": 0.005430459976196289, "step": 234}
{"info/global_step": 235, "train_info/time_within_train_step": 24.882646560668945, "step": 235}
{"train_info/time_between_train_steps": 0.010118722915649414, "step": 235}
{"info/global_step": 236, "train_info/time_within_train_step": 24.826845169067383, "step": 236}
{"train_info/time_between_train_steps": 0.005211591720581055, "step": 236}
{"info/global_step": 237, "train_info/time_within_train_step": 24.82408380508423, "step": 237}
{"train_info/time_between_train_steps": 0.006913900375366211, "step": 237}
{"info/global_step": 238, "train_info/time_within_train_step": 24.854823112487793, "step": 238}
{"train_info/time_between_train_steps": 0.0053670406341552734, "step": 238}
{"info/global_step": 239, "train_info/time_within_train_step": 24.888372659683228, "step": 239}
{"train_info/time_between_train_steps": 0.0054280757904052734, "step": 239}
{"info/global_step": 240, "train_info/time_within_train_step": 24.918115377426147, "step": 240}
{"train_info/time_between_train_steps": 0.009479284286499023, "step": 240}
{"info/global_step": 241, "train_info/time_within_train_step": 24.960683345794678, "step": 241}
{"train_info/time_between_train_steps": 0.0053484439849853516, "step": 241}
{"info/global_step": 242, "train_info/time_within_train_step": 24.820125102996826, "step": 242}
{"train_info/time_between_train_steps": 0.0069959163665771484, "step": 242}
{"info/global_step": 243, "train_info/time_within_train_step": 24.940065383911133, "step": 243}
{"train_info/time_between_train_steps": 0.005227088928222656, "step": 243}
{"info/global_step": 244, "train_info/time_within_train_step": 24.81384587287903, "step": 244}
{"train_info/time_between_train_steps": 0.005224466323852539, "step": 244}
{"info/global_step": 245, "train_info/time_within_train_step": 24.85681676864624, "step": 245}
{"train_info/time_between_train_steps": 0.01051640510559082, "step": 245}
{"info/global_step": 246, "train_info/time_within_train_step": 24.834664583206177, "step": 246}
{"train_info/time_between_train_steps": 0.009917020797729492, "step": 246}
{"info/global_step": 247, "train_info/time_within_train_step": 24.808242321014404, "step": 247}
{"train_info/time_between_train_steps": 0.005237102508544922, "step": 247}
{"info/global_step": 248, "train_info/time_within_train_step": 24.978769063949585, "step": 248}
{"train_info/time_between_train_steps": 0.01111745834350586, "step": 248}
{"info/global_step": 249, "train_info/time_within_train_step": 24.86954092979431, "step": 249}
{"train_info/time_between_train_steps": 0.005465984344482422, "step": 249}
{"info/global_step": 250, "train_info/time_within_train_step": 24.897323846817017, "step": 250}
{"train_info": {"train_info/memory_allocated": 1581.5546875, "train_info/memory_max_allocated": 18057.0224609375, "train_info/memory_reserved": 19104.0, "train_info/memory_max_reserved": 19104.0, "_timestamp": 1734213268, "_runtime": 6330}, "step": 250}
{"logs": {"train/loss": 3.9029, "train/learning_rate": 0.0005277777777777777, "train/epoch": 6.03, "_timestamp": 1734213268, "_runtime": 6330}, "step": 250}
{"train_info/time_between_train_steps": 0.016666650772094727, "step": 250}
{"info/global_step": 251, "train_info/time_within_train_step": 24.903759956359863, "step": 251}
{"train_info/time_between_train_steps": 0.011228799819946289, "step": 251}
{"info/global_step": 252, "train_info/time_within_train_step": 24.863126754760742, "step": 252}
{"train_info/time_between_train_steps": 0.008084535598754883, "step": 252}
{"train_info/time_between_train_steps": 13.01759123802185, "step": 252}
{"info/global_step": 253, "train_info/time_within_train_step": 24.94504165649414, "step": 253}
{"train_info/time_between_train_steps": 0.005425691604614258, "step": 253}
{"info/global_step": 254, "train_info/time_within_train_step": 25.018428325653076, "step": 254}
{"train_info/time_between_train_steps": 0.010597467422485352, "step": 254}
{"info/global_step": 255, "train_info/time_within_train_step": 24.936859130859375, "step": 255}
{"train_info/time_between_train_steps": 0.005828142166137695, "step": 255}
{"info/global_step": 256, "train_info/time_within_train_step": 25.08136224746704, "step": 256}
{"train_info/time_between_train_steps": 0.0056073665618896484, "step": 256}
{"info/global_step": 257, "train_info/time_within_train_step": 24.935802221298218, "step": 257}
{"train_info/time_between_train_steps": 0.006558656692504883, "step": 257}
{"info/global_step": 258, "train_info/time_within_train_step": 25.050493240356445, "step": 258}
{"train_info/time_between_train_steps": 0.005554914474487305, "step": 258}
{"info/global_step": 259, "train_info/time_within_train_step": 24.967090129852295, "step": 259}
{"train_info/time_between_train_steps": 0.0057525634765625, "step": 259}
{"info/global_step": 260, "train_info/time_within_train_step": 25.026280641555786, "step": 260}
{"train_info/time_between_train_steps": 0.010426521301269531, "step": 260}
{"info/global_step": 261, "train_info/time_within_train_step": 24.884389638900757, "step": 261}
{"train_info/time_between_train_steps": 0.0058476924896240234, "step": 261}
{"info/global_step": 262, "train_info/time_within_train_step": 25.0195951461792, "step": 262}
{"train_info/time_between_train_steps": 0.005640745162963867, "step": 262}
{"info/global_step": 263, "train_info/time_within_train_step": 25.013587951660156, "step": 263}
{"train_info/time_between_train_steps": 0.005822420120239258, "step": 263}
{"info/global_step": 264, "train_info/time_within_train_step": 25.012345790863037, "step": 264}
{"train_info/time_between_train_steps": 0.009751558303833008, "step": 264}
{"info/global_step": 265, "train_info/time_within_train_step": 25.001656532287598, "step": 265}
{"train_info/time_between_train_steps": 0.005994558334350586, "step": 265}
{"info/global_step": 266, "train_info/time_within_train_step": 25.04388952255249, "step": 266}
{"train_info/time_between_train_steps": 0.010688543319702148, "step": 266}
{"info/global_step": 267, "train_info/time_within_train_step": 24.961931228637695, "step": 267}
{"train_info/time_between_train_steps": 0.005805015563964844, "step": 267}
{"info/global_step": 268, "train_info/time_within_train_step": 24.948965787887573, "step": 268}
{"train_info/time_between_train_steps": 0.0053522586822509766, "step": 268}
{"info/global_step": 269, "train_info/time_within_train_step": 24.96134328842163, "step": 269}
{"train_info/time_between_train_steps": 0.005149126052856445, "step": 269}
{"info/global_step": 270, "train_info/time_within_train_step": 24.891313314437866, "step": 270}
{"train_info/time_between_train_steps": 0.010120391845703125, "step": 270}
{"info/global_step": 271, "train_info/time_within_train_step": 24.851669549942017, "step": 271}
{"train_info/time_between_train_steps": 0.006440162658691406, "step": 271}
{"info/global_step": 272, "train_info/time_within_train_step": 24.844814777374268, "step": 272}
{"train_info/time_between_train_steps": 0.005360841751098633, "step": 272}
{"info/global_step": 273, "train_info/time_within_train_step": 24.893392086029053, "step": 273}
{"train_info/time_between_train_steps": 0.009541988372802734, "step": 273}
{"info/global_step": 274, "train_info/time_within_train_step": 24.849641799926758, "step": 274}
{"train_info/time_between_train_steps": 0.010251998901367188, "step": 274}
{"info/global_step": 275, "train_info/time_within_train_step": 24.977076292037964, "step": 275}
{"train_info/time_between_train_steps": 0.005931377410888672, "step": 275}
{"info/global_step": 276, "train_info/time_within_train_step": 24.83186912536621, "step": 276}
{"train_info/time_between_train_steps": 0.005894184112548828, "step": 276}
{"info/global_step": 277, "train_info/time_within_train_step": 24.81696391105652, "step": 277}
{"train_info/time_between_train_steps": 0.005488872528076172, "step": 277}
{"info/global_step": 278, "train_info/time_within_train_step": 24.85843849182129, "step": 278}
{"train_info/time_between_train_steps": 0.005313396453857422, "step": 278}
{"info/global_step": 279, "train_info/time_within_train_step": 25.00822687149048, "step": 279}
{"train_info/time_between_train_steps": 0.005247831344604492, "step": 279}
{"info/global_step": 280, "train_info/time_within_train_step": 24.88455057144165, "step": 280}
{"train_info/time_between_train_steps": 0.010106086730957031, "step": 280}
{"info/global_step": 281, "train_info/time_within_train_step": 24.901116847991943, "step": 281}
{"train_info/time_between_train_steps": 0.0060122013092041016, "step": 281}
{"info/global_step": 282, "train_info/time_within_train_step": 24.802021503448486, "step": 282}
{"train_info/time_between_train_steps": 0.005308866500854492, "step": 282}
{"info/global_step": 283, "train_info/time_within_train_step": 24.867289543151855, "step": 283}
{"train_info/time_between_train_steps": 0.0062863826751708984, "step": 283}
{"info/global_step": 284, "train_info/time_within_train_step": 24.8084716796875, "step": 284}
{"train_info/time_between_train_steps": 0.005555391311645508, "step": 284}
{"info/global_step": 285, "train_info/time_within_train_step": 24.846987009048462, "step": 285}
{"train_info/time_between_train_steps": 0.009639978408813477, "step": 285}
{"info/global_step": 286, "train_info/time_within_train_step": 24.855891942977905, "step": 286}
{"train_info/time_between_train_steps": 0.005594015121459961, "step": 286}
{"info/global_step": 287, "train_info/time_within_train_step": 24.857786417007446, "step": 287}
{"train_info/time_between_train_steps": 0.006183624267578125, "step": 287}
{"info/global_step": 288, "train_info/time_within_train_step": 24.894160747528076, "step": 288}
{"train_info/time_between_train_steps": 0.006384134292602539, "step": 288}
{"train_info/time_between_train_steps": 13.093126058578491, "step": 288}
{"info/global_step": 289, "train_info/time_within_train_step": 24.83834719657898, "step": 289}
{"train_info/time_between_train_steps": 0.005922794342041016, "step": 289}
{"info/global_step": 290, "train_info/time_within_train_step": 25.147078275680542, "step": 290}
{"train_info/time_between_train_steps": 0.005624055862426758, "step": 290}
{"info/global_step": 291, "train_info/time_within_train_step": 24.890918493270874, "step": 291}
{"train_info/time_between_train_steps": 0.005839109420776367, "step": 291}
{"info/global_step": 292, "train_info/time_within_train_step": 25.109105110168457, "step": 292}
{"train_info/time_between_train_steps": 0.0056345462799072266, "step": 292}
{"info/global_step": 293, "train_info/time_within_train_step": 24.898302793502808, "step": 293}
{"train_info/time_between_train_steps": 0.005544185638427734, "step": 293}
{"info/global_step": 294, "train_info/time_within_train_step": 25.208381175994873, "step": 294}
{"train_info/time_between_train_steps": 0.0056209564208984375, "step": 294}
{"info/global_step": 295, "train_info/time_within_train_step": 24.8821861743927, "step": 295}
{"train_info/time_between_train_steps": 0.006108283996582031, "step": 295}
{"info/global_step": 296, "train_info/time_within_train_step": 25.007360458374023, "step": 296}
{"train_info/time_between_train_steps": 0.005401134490966797, "step": 296}
{"info/global_step": 297, "train_info/time_within_train_step": 24.856505632400513, "step": 297}
{"train_info/time_between_train_steps": 0.007401466369628906, "step": 297}
{"info/global_step": 298, "train_info/time_within_train_step": 25.041173219680786, "step": 298}
{"train_info/time_between_train_steps": 0.005653858184814453, "step": 298}
{"info/global_step": 299, "train_info/time_within_train_step": 24.981230974197388, "step": 299}
{"train_info/time_between_train_steps": 0.010766267776489258, "step": 299}
{"info/global_step": 300, "train_info/time_within_train_step": 25.11930251121521, "step": 300}
{"train_info": {"train_info/memory_allocated": 1581.5546875, "train_info/memory_max_allocated": 18057.0224609375, "train_info/memory_reserved": 19104.0, "train_info/memory_max_reserved": 19104.0, "_timestamp": 1734214542, "_runtime": 7604}, "step": 300}
{"logs": {"train/loss": 3.7899, "train/learning_rate": 0.0005, "train/epoch": 8.01, "_timestamp": 1734214542, "_runtime": 7604}, "step": 300}
{"train_info/time_between_train_steps": 2.388540267944336, "step": 300}
{"info/global_step": 301, "train_info/time_within_train_step": 24.88838768005371, "step": 301}
{"train_info/time_between_train_steps": 0.01630091667175293, "step": 301}
{"info/global_step": 302, "train_info/time_within_train_step": 25.08246922492981, "step": 302}
{"train_info/time_between_train_steps": 0.010592222213745117, "step": 302}
{"info/global_step": 303, "train_info/time_within_train_step": 24.918703079223633, "step": 303}
{"train_info/time_between_train_steps": 0.0058896541595458984, "step": 303}
{"info/global_step": 304, "train_info/time_within_train_step": 25.027841091156006, "step": 304}
{"train_info/time_between_train_steps": 0.0071451663970947266, "step": 304}
{"info/global_step": 305, "train_info/time_within_train_step": 24.89165496826172, "step": 305}
{"train_info/time_between_train_steps": 0.005272626876831055, "step": 305}
{"info/global_step": 306, "train_info/time_within_train_step": 24.83725929260254, "step": 306}
{"train_info/time_between_train_steps": 0.010246515274047852, "step": 306}
{"info/global_step": 307, "train_info/time_within_train_step": 24.880266427993774, "step": 307}
{"train_info/time_between_train_steps": 0.005323648452758789, "step": 307}
{"info/global_step": 308, "train_info/time_within_train_step": 24.836944103240967, "step": 308}
{"train_info/time_between_train_steps": 0.005502462387084961, "step": 308}
{"info/global_step": 309, "train_info/time_within_train_step": 24.85126256942749, "step": 309}
{"train_info/time_between_train_steps": 0.005712747573852539, "step": 309}
{"info/global_step": 310, "train_info/time_within_train_step": 24.928619146347046, "step": 310}
{"train_info/time_between_train_steps": 0.005765438079833984, "step": 310}
{"info/global_step": 311, "train_info/time_within_train_step": 24.860400915145874, "step": 311}
{"train_info/time_between_train_steps": 0.005412578582763672, "step": 311}
{"info/global_step": 312, "train_info/time_within_train_step": 24.821285247802734, "step": 312}
{"train_info/time_between_train_steps": 0.005625247955322266, "step": 312}
{"info/global_step": 313, "train_info/time_within_train_step": 25.004396438598633, "step": 313}
{"train_info/time_between_train_steps": 0.009962797164916992, "step": 313}
{"info/global_step": 314, "train_info/time_within_train_step": 24.85015559196472, "step": 314}
{"train_info/time_between_train_steps": 0.005515336990356445, "step": 314}
{"info/global_step": 315, "train_info/time_within_train_step": 24.898874759674072, "step": 315}
{"train_info/time_between_train_steps": 0.010351181030273438, "step": 315}
{"info/global_step": 316, "train_info/time_within_train_step": 24.8937726020813, "step": 316}
{"train_info/time_between_train_steps": 0.0056269168853759766, "step": 316}
{"info/global_step": 317, "train_info/time_within_train_step": 24.82955574989319, "step": 317}
{"train_info/time_between_train_steps": 0.00551605224609375, "step": 317}
{"info/global_step": 318, "train_info/time_within_train_step": 24.835761070251465, "step": 318}
{"train_info/time_between_train_steps": 0.006252288818359375, "step": 318}
{"info/global_step": 319, "train_info/time_within_train_step": 24.953991413116455, "step": 319}
{"train_info/time_between_train_steps": 0.005506277084350586, "step": 319}
{"info/global_step": 320, "train_info/time_within_train_step": 24.872405767440796, "step": 320}
{"train_info/time_between_train_steps": 0.0057141780853271484, "step": 320}
{"info/global_step": 321, "train_info/time_within_train_step": 24.933335304260254, "step": 321}
{"train_info/time_between_train_steps": 0.006697654724121094, "step": 321}
{"info/global_step": 322, "train_info/time_within_train_step": 24.865835905075073, "step": 322}
{"train_info/time_between_train_steps": 0.00559687614440918, "step": 322}
{"info/global_step": 323, "train_info/time_within_train_step": 24.8659188747406, "step": 323}
{"train_info/time_between_train_steps": 0.006099700927734375, "step": 323}
{"info/global_step": 324, "train_info/time_within_train_step": 24.86483144760132, "step": 324}
{"train_info/time_between_train_steps": 0.00811457633972168, "step": 324}
{"train_info/time_between_train_steps": 13.211657524108887, "step": 324}
{"info/global_step": 325, "train_info/time_within_train_step": 24.946476459503174, "step": 325}
{"train_info/time_between_train_steps": 0.009289741516113281, "step": 325}
{"info/global_step": 326, "train_info/time_within_train_step": 25.0505690574646, "step": 326}
{"train_info/time_between_train_steps": 0.00558161735534668, "step": 326}
{"info/global_step": 327, "train_info/time_within_train_step": 24.860196113586426, "step": 327}
{"train_info/time_between_train_steps": 0.006824016571044922, "step": 327}
{"info/global_step": 328, "train_info/time_within_train_step": 25.074062824249268, "step": 328}
{"train_info/time_between_train_steps": 0.005507946014404297, "step": 328}
{"info/global_step": 329, "train_info/time_within_train_step": 24.92974019050598, "step": 329}
{"train_info/time_between_train_steps": 0.005366802215576172, "step": 329}
{"info/global_step": 330, "train_info/time_within_train_step": 25.049667835235596, "step": 330}
{"train_info/time_between_train_steps": 0.0058786869049072266, "step": 330}
{"info/global_step": 331, "train_info/time_within_train_step": 24.88335609436035, "step": 331}
{"train_info/time_between_train_steps": 0.0055065155029296875, "step": 331}
{"info/global_step": 332, "train_info/time_within_train_step": 24.986125469207764, "step": 332}
{"train_info/time_between_train_steps": 0.005266904830932617, "step": 332}
{"info/global_step": 333, "train_info/time_within_train_step": 24.812370538711548, "step": 333}
{"train_info/time_between_train_steps": 0.006308794021606445, "step": 333}
{"info/global_step": 334, "train_info/time_within_train_step": 24.97426962852478, "step": 334}
{"train_info/time_between_train_steps": 0.005411386489868164, "step": 334}
{"info/global_step": 335, "train_info/time_within_train_step": 24.89386296272278, "step": 335}
{"train_info/time_between_train_steps": 0.005531787872314453, "step": 335}
{"info/global_step": 336, "train_info/time_within_train_step": 25.062605381011963, "step": 336}
{"train_info/time_between_train_steps": 0.005633354187011719, "step": 336}
{"info/global_step": 337, "train_info/time_within_train_step": 25.039831161499023, "step": 337}
{"train_info/time_between_train_steps": 0.010043144226074219, "step": 337}
{"info/global_step": 338, "train_info/time_within_train_step": 24.983750104904175, "step": 338}
{"train_info/time_between_train_steps": 0.010913610458374023, "step": 338}
{"info/global_step": 339, "train_info/time_within_train_step": 24.85790491104126, "step": 339}
{"train_info/time_between_train_steps": 0.0058362483978271484, "step": 339}
{"info/global_step": 340, "train_info/time_within_train_step": 24.99598002433777, "step": 340}
{"train_info/time_between_train_steps": 0.005830526351928711, "step": 340}
{"info/global_step": 341, "train_info/time_within_train_step": 24.96384859085083, "step": 341}
{"train_info/time_between_train_steps": 0.005340099334716797, "step": 341}
{"info/global_step": 342, "train_info/time_within_train_step": 24.945833206176758, "step": 342}
{"train_info/time_between_train_steps": 0.005404472351074219, "step": 342}
{"info/global_step": 343, "train_info/time_within_train_step": 24.82914090156555, "step": 343}
{"train_info/time_between_train_steps": 0.0054225921630859375, "step": 343}
{"info/global_step": 344, "train_info/time_within_train_step": 24.952817916870117, "step": 344}
{"train_info/time_between_train_steps": 0.00537109375, "step": 344}
{"info/global_step": 345, "train_info/time_within_train_step": 24.86605215072632, "step": 345}
{"train_info/time_between_train_steps": 0.005690574645996094, "step": 345}
{"info/global_step": 346, "train_info/time_within_train_step": 24.86221408843994, "step": 346}
{"train_info/time_between_train_steps": 0.005446195602416992, "step": 346}
{"info/global_step": 347, "train_info/time_within_train_step": 24.82545828819275, "step": 347}
{"train_info/time_between_train_steps": 0.0053784847259521484, "step": 347}
{"info/global_step": 348, "train_info/time_within_train_step": 24.81764006614685, "step": 348}
{"train_info/time_between_train_steps": 0.00538325309753418, "step": 348}
{"info/global_step": 349, "train_info/time_within_train_step": 24.85469698905945, "step": 349}
{"train_info/time_between_train_steps": 0.005774259567260742, "step": 349}
{"info/global_step": 350, "train_info/time_within_train_step": 24.884614944458008, "step": 350}
{"train_info": {"train_info/memory_allocated": 1581.5546875, "train_info/memory_max_allocated": 18057.0224609375, "train_info/memory_reserved": 19104.0, "train_info/memory_max_reserved": 19104.0, "_timestamp": 1734215804, "_runtime": 8866}, "step": 350}
{"logs": {"train/loss": 3.5919, "train/learning_rate": 0.00047222222222222224, "train/epoch": 9.02, "_timestamp": 1734215804, "_runtime": 8866}, "step": 350}
{"train_info/time_between_train_steps": 0.013303756713867188, "step": 350}
{"info/global_step": 351, "train_info/time_within_train_step": 24.88477396965027, "step": 351}
{"train_info/time_between_train_steps": 0.010265827178955078, "step": 351}
{"info/global_step": 352, "train_info/time_within_train_step": 24.839761972427368, "step": 352}
{"train_info/time_between_train_steps": 0.0055408477783203125, "step": 352}
{"info/global_step": 353, "train_info/time_within_train_step": 24.855896949768066, "step": 353}
{"train_info/time_between_train_steps": 0.005388975143432617, "step": 353}
{"info/global_step": 354, "train_info/time_within_train_step": 24.85132384300232, "step": 354}
{"train_info/time_between_train_steps": 0.005551338195800781, "step": 354}
{"info/global_step": 355, "train_info/time_within_train_step": 24.941690683364868, "step": 355}
{"train_info/time_between_train_steps": 0.010711908340454102, "step": 355}
{"info/global_step": 356, "train_info/time_within_train_step": 25.001883029937744, "step": 356}
{"train_info/time_between_train_steps": 0.010606050491333008, "step": 356}
{"info/global_step": 357, "train_info/time_within_train_step": 24.946747541427612, "step": 357}
{"train_info/time_between_train_steps": 0.009262323379516602, "step": 357}
{"info/global_step": 358, "train_info/time_within_train_step": 24.95362877845764, "step": 358}
{"train_info/time_between_train_steps": 0.005706071853637695, "step": 358}
{"info/global_step": 359, "train_info/time_within_train_step": 24.952430248260498, "step": 359}
{"train_info/time_between_train_steps": 0.006322383880615234, "step": 359}
{"info/global_step": 360, "train_info/time_within_train_step": 24.858439922332764, "step": 360}
{"train_info/time_between_train_steps": 0.008992433547973633, "step": 360}
{"train_info/time_between_train_steps": 13.45431137084961, "step": 360}
{"info/global_step": 361, "train_info/time_within_train_step": 24.889763832092285, "step": 361}
{"train_info/time_between_train_steps": 0.01692056655883789, "step": 361}
{"info/global_step": 362, "train_info/time_within_train_step": 25.11146354675293, "step": 362}
{"train_info/time_between_train_steps": 0.01067209243774414, "step": 362}
{"info/global_step": 363, "train_info/time_within_train_step": 24.88152813911438, "step": 363}
{"train_info/time_between_train_steps": 0.005693197250366211, "step": 363}
{"info/global_step": 364, "train_info/time_within_train_step": 25.043079376220703, "step": 364}
{"train_info/time_between_train_steps": 0.0057942867279052734, "step": 364}
{"info/global_step": 365, "train_info/time_within_train_step": 24.87569499015808, "step": 365}
{"train_info/time_between_train_steps": 0.01018834114074707, "step": 365}
{"info/global_step": 366, "train_info/time_within_train_step": 25.029598236083984, "step": 366}
{"train_info/time_between_train_steps": 0.010955333709716797, "step": 366}
{"info/global_step": 367, "train_info/time_within_train_step": 24.893351793289185, "step": 367}
{"train_info/time_between_train_steps": 0.005953788757324219, "step": 367}
{"info/global_step": 368, "train_info/time_within_train_step": 25.083839893341064, "step": 368}
{"train_info/time_between_train_steps": 0.00962519645690918, "step": 368}
{"info/global_step": 369, "train_info/time_within_train_step": 24.81716299057007, "step": 369}
{"train_info/time_between_train_steps": 0.00583195686340332, "step": 369}
{"info/global_step": 370, "train_info/time_within_train_step": 25.041694402694702, "step": 370}
{"train_info/time_between_train_steps": 0.005511045455932617, "step": 370}
{"info/global_step": 371, "train_info/time_within_train_step": 24.89528203010559, "step": 371}
{"train_info/time_between_train_steps": 0.006165742874145508, "step": 371}
{"info/global_step": 372, "train_info/time_within_train_step": 25.175849676132202, "step": 372}
{"train_info/time_between_train_steps": 0.0063626766204833984, "step": 372}
{"info/global_step": 373, "train_info/time_within_train_step": 24.915322303771973, "step": 373}
{"train_info/time_between_train_steps": 0.006043434143066406, "step": 373}
{"info/global_step": 374, "train_info/time_within_train_step": 25.299225091934204, "step": 374}
{"train_info/time_between_train_steps": 0.0058515071868896484, "step": 374}
{"info/global_step": 375, "train_info/time_within_train_step": 24.89828658103943, "step": 375}
{"train_info/time_between_train_steps": 0.005881071090698242, "step": 375}
{"info/global_step": 376, "train_info/time_within_train_step": 24.9776930809021, "step": 376}
{"train_info/time_between_train_steps": 0.0061833858489990234, "step": 376}
{"info/global_step": 377, "train_info/time_within_train_step": 24.917136192321777, "step": 377}
{"train_info/time_between_train_steps": 0.005347728729248047, "step": 377}
{"info/global_step": 378, "train_info/time_within_train_step": 24.91069507598877, "step": 378}
{"train_info/time_between_train_steps": 0.009222030639648438, "step": 378}
{"info/global_step": 379, "train_info/time_within_train_step": 24.84232258796692, "step": 379}
{"train_info/time_between_train_steps": 0.010336160659790039, "step": 379}
{"info/global_step": 380, "train_info/time_within_train_step": 24.916059255599976, "step": 380}
{"train_info/time_between_train_steps": 0.005433797836303711, "step": 380}
{"info/global_step": 381, "train_info/time_within_train_step": 24.861359119415283, "step": 381}
{"train_info/time_between_train_steps": 0.005272865295410156, "step": 381}
{"info/global_step": 382, "train_info/time_within_train_step": 24.828530311584473, "step": 382}
{"train_info/time_between_train_steps": 0.006895542144775391, "step": 382}
{"info/global_step": 383, "train_info/time_within_train_step": 24.9397029876709, "step": 383}
{"train_info/time_between_train_steps": 0.010035037994384766, "step": 383}
{"info/global_step": 384, "train_info/time_within_train_step": 24.945846796035767, "step": 384}
{"train_info/time_between_train_steps": 0.009778976440429688, "step": 384}
{"info/global_step": 385, "train_info/time_within_train_step": 24.841657161712646, "step": 385}
{"train_info/time_between_train_steps": 0.0053594112396240234, "step": 385}
{"info/global_step": 386, "train_info/time_within_train_step": 24.852642059326172, "step": 386}
{"train_info/time_between_train_steps": 0.005386829376220703, "step": 386}
{"info/global_step": 387, "train_info/time_within_train_step": 24.938583374023438, "step": 387}
{"train_info/time_between_train_steps": 0.005384922027587891, "step": 387}
{"info/global_step": 388, "train_info/time_within_train_step": 24.81153178215027, "step": 388}
{"train_info/time_between_train_steps": 0.010523080825805664, "step": 388}
{"info/global_step": 389, "train_info/time_within_train_step": 24.895782232284546, "step": 389}
{"train_info/time_between_train_steps": 0.005300998687744141, "step": 389}
{"info/global_step": 390, "train_info/time_within_train_step": 24.84665536880493, "step": 390}
{"train_info/time_between_train_steps": 0.005300045013427734, "step": 390}
{"info/global_step": 391, "train_info/time_within_train_step": 24.809829473495483, "step": 391}
{"train_info/time_between_train_steps": 0.005358219146728516, "step": 391}
{"info/global_step": 392, "train_info/time_within_train_step": 24.959929943084717, "step": 392}
{"train_info/time_between_train_steps": 0.006313323974609375, "step": 392}
{"info/global_step": 393, "train_info/time_within_train_step": 24.869346141815186, "step": 393}
{"train_info/time_between_train_steps": 0.005440235137939453, "step": 393}
{"info/global_step": 394, "train_info/time_within_train_step": 24.824390172958374, "step": 394}
{"train_info/time_between_train_steps": 0.010342121124267578, "step": 394}
{"info/global_step": 395, "train_info/time_within_train_step": 24.824865341186523, "step": 395}
{"train_info/time_between_train_steps": 0.006227016448974609, "step": 395}
{"info/global_step": 396, "train_info/time_within_train_step": 24.864031553268433, "step": 396}
{"train_info/time_between_train_steps": 0.0060138702392578125, "step": 396}
{"train_info/time_between_train_steps": 13.396280527114868, "step": 396}
{"info/global_step": 397, "train_info/time_within_train_step": 24.884256601333618, "step": 397}
{"train_info/time_between_train_steps": 0.011018514633178711, "step": 397}
{"info/global_step": 398, "train_info/time_within_train_step": 24.984291553497314, "step": 398}
{"train_info/time_between_train_steps": 0.0062563419342041016, "step": 398}
{"info/global_step": 399, "train_info/time_within_train_step": 24.946089267730713, "step": 399}
{"train_info/time_between_train_steps": 0.006129026412963867, "step": 399}
{"info/global_step": 400, "train_info/time_within_train_step": 25.04699945449829, "step": 400}
{"train_info": {"train_info/memory_allocated": 1581.5546875, "train_info/memory_max_allocated": 18057.0224609375, "train_info/memory_reserved": 19104.0, "train_info/memory_max_reserved": 19104.0, "_timestamp": 1734217077, "_runtime": 10139}, "step": 400}
{"logs": {"train/loss": 3.453, "train/learning_rate": 0.00044444444444444436, "train/epoch": 11.0, "_timestamp": 1734217077, "_runtime": 10139}, "step": 400}
{"train_info/time_between_train_steps": 1.9608182907104492, "step": 400}
{"info/global_step": 401, "train_info/time_within_train_step": 24.915778398513794, "step": 401}
{"train_info/time_between_train_steps": 0.01158595085144043, "step": 401}
{"info/global_step": 402, "train_info/time_within_train_step": 25.162737369537354, "step": 402}
{"train_info/time_between_train_steps": 0.011310100555419922, "step": 402}
{"info/global_step": 403, "train_info/time_within_train_step": 24.943198204040527, "step": 403}
{"train_info/time_between_train_steps": 0.006440162658691406, "step": 403}
{"info/global_step": 404, "train_info/time_within_train_step": 25.02364730834961, "step": 404}
{"train_info/time_between_train_steps": 0.006096839904785156, "step": 404}
{"info/global_step": 405, "train_info/time_within_train_step": 24.870959997177124, "step": 405}
{"train_info/time_between_train_steps": 0.01081395149230957, "step": 405}
{"info/global_step": 406, "train_info/time_within_train_step": 25.060346126556396, "step": 406}
{"train_info/time_between_train_steps": 0.006929874420166016, "step": 406}
{"info/global_step": 407, "train_info/time_within_train_step": 24.91776990890503, "step": 407}
{"train_info/time_between_train_steps": 0.008065223693847656, "step": 407}
{"info/global_step": 408, "train_info/time_within_train_step": 25.10583233833313, "step": 408}
{"train_info/time_between_train_steps": 0.00678706169128418, "step": 408}
{"info/global_step": 409, "train_info/time_within_train_step": 24.894089221954346, "step": 409}
{"train_info/time_between_train_steps": 0.006717205047607422, "step": 409}
{"info/global_step": 410, "train_info/time_within_train_step": 25.095668077468872, "step": 410}
{"train_info/time_between_train_steps": 0.005941867828369141, "step": 410}
{"info/global_step": 411, "train_info/time_within_train_step": 24.911051034927368, "step": 411}
{"train_info/time_between_train_steps": 0.011005878448486328, "step": 411}
{"info/global_step": 412, "train_info/time_within_train_step": 25.056235313415527, "step": 412}
{"train_info/time_between_train_steps": 0.0068531036376953125, "step": 412}
{"info/global_step": 413, "train_info/time_within_train_step": 24.99116849899292, "step": 413}
{"train_info/time_between_train_steps": 0.0055806636810302734, "step": 413}
{"info/global_step": 414, "train_info/time_within_train_step": 24.860852241516113, "step": 414}
{"train_info/time_between_train_steps": 0.005757808685302734, "step": 414}
{"info/global_step": 415, "train_info/time_within_train_step": 24.91022539138794, "step": 415}
{"train_info/time_between_train_steps": 0.01083230972290039, "step": 415}
{"info/global_step": 416, "train_info/time_within_train_step": 24.872500896453857, "step": 416}
{"train_info/time_between_train_steps": 0.010846376419067383, "step": 416}
{"info/global_step": 417, "train_info/time_within_train_step": 25.02698302268982, "step": 417}
{"train_info/time_between_train_steps": 0.005712270736694336, "step": 417}
{"info/global_step": 418, "train_info/time_within_train_step": 25.033369541168213, "step": 418}
{"train_info/time_between_train_steps": 0.010378599166870117, "step": 418}
{"info/global_step": 419, "train_info/time_within_train_step": 24.911820888519287, "step": 419}
{"train_info/time_between_train_steps": 0.006056070327758789, "step": 419}
{"info/global_step": 420, "train_info/time_within_train_step": 24.86754298210144, "step": 420}
{"train_info/time_between_train_steps": 0.0057904720306396484, "step": 420}
{"info/global_step": 421, "train_info/time_within_train_step": 24.876885890960693, "step": 421}
{"train_info/time_between_train_steps": 0.00567173957824707, "step": 421}
{"info/global_step": 422, "train_info/time_within_train_step": 24.944352865219116, "step": 422}
{"train_info/time_between_train_steps": 0.00609588623046875, "step": 422}
{"info/global_step": 423, "train_info/time_within_train_step": 24.880650997161865, "step": 423}
{"train_info/time_between_train_steps": 0.006038188934326172, "step": 423}
{"info/global_step": 424, "train_info/time_within_train_step": 24.877254247665405, "step": 424}
{"train_info/time_between_train_steps": 0.005781888961791992, "step": 424}
{"info/global_step": 425, "train_info/time_within_train_step": 24.845020294189453, "step": 425}
{"train_info/time_between_train_steps": 0.005571126937866211, "step": 425}
{"info/global_step": 426, "train_info/time_within_train_step": 24.882921934127808, "step": 426}
{"train_info/time_between_train_steps": 0.010240554809570312, "step": 426}
{"info/global_step": 427, "train_info/time_within_train_step": 24.904297351837158, "step": 427}
{"train_info/time_between_train_steps": 0.0059735774993896484, "step": 427}
{"info/global_step": 428, "train_info/time_within_train_step": 24.909223079681396, "step": 428}
{"train_info/time_between_train_steps": 0.01742696762084961, "step": 428}
{"info/global_step": 429, "train_info/time_within_train_step": 24.845442533493042, "step": 429}
{"train_info/time_between_train_steps": 0.010320901870727539, "step": 429}
{"info/global_step": 430, "train_info/time_within_train_step": 24.851266145706177, "step": 430}
{"train_info/time_between_train_steps": 0.006230354309082031, "step": 430}
{"info/global_step": 431, "train_info/time_within_train_step": 24.909881830215454, "step": 431}
{"train_info/time_between_train_steps": 0.006415843963623047, "step": 431}
{"info/global_step": 432, "train_info/time_within_train_step": 24.959266662597656, "step": 432}
{"train_info/time_between_train_steps": 0.00711822509765625, "step": 432}
{"train_info/time_between_train_steps": 13.201626300811768, "step": 432}
{"info/global_step": 433, "train_info/time_within_train_step": 24.941280126571655, "step": 433}
{"train_info/time_between_train_steps": 0.005092144012451172, "step": 433}
{"info/global_step": 434, "train_info/time_within_train_step": 24.99517273902893, "step": 434}
{"train_info/time_between_train_steps": 0.005399942398071289, "step": 434}
{"info/global_step": 435, "train_info/time_within_train_step": 24.88100028038025, "step": 435}
{"train_info/time_between_train_steps": 0.00666046142578125, "step": 435}
{"info/global_step": 436, "train_info/time_within_train_step": 24.959471464157104, "step": 436}
{"train_info/time_between_train_steps": 0.005605936050415039, "step": 436}
{"info/global_step": 437, "train_info/time_within_train_step": 24.862772941589355, "step": 437}
{"train_info/time_between_train_steps": 0.005354404449462891, "step": 437}
{"info/global_step": 438, "train_info/time_within_train_step": 25.004945755004883, "step": 438}
{"train_info/time_between_train_steps": 0.016587495803833008, "step": 438}
{"info/global_step": 439, "train_info/time_within_train_step": 24.863866329193115, "step": 439}
{"train_info/time_between_train_steps": 0.005599021911621094, "step": 439}
{"info/global_step": 440, "train_info/time_within_train_step": 24.970765352249146, "step": 440}
{"train_info/time_between_train_steps": 0.005338907241821289, "step": 440}
{"info/global_step": 441, "train_info/time_within_train_step": 24.890894412994385, "step": 441}
{"train_info/time_between_train_steps": 0.0052433013916015625, "step": 441}
{"info/global_step": 442, "train_info/time_within_train_step": 25.010895490646362, "step": 442}
{"train_info/time_between_train_steps": 0.0055751800537109375, "step": 442}
{"info/global_step": 443, "train_info/time_within_train_step": 24.83497142791748, "step": 443}
{"train_info/time_between_train_steps": 0.00546717643737793, "step": 443}
{"info/global_step": 444, "train_info/time_within_train_step": 25.007905960083008, "step": 444}
{"train_info/time_between_train_steps": 0.005450248718261719, "step": 444}
{"info/global_step": 445, "train_info/time_within_train_step": 25.05889582633972, "step": 445}
{"train_info/time_between_train_steps": 0.005694866180419922, "step": 445}
{"info/global_step": 446, "train_info/time_within_train_step": 25.04794478416443, "step": 446}
{"train_info/time_between_train_steps": 0.006073951721191406, "step": 446}
{"info/global_step": 447, "train_info/time_within_train_step": 24.865086317062378, "step": 447}
{"train_info/time_between_train_steps": 0.005313396453857422, "step": 447}
{"info/global_step": 448, "train_info/time_within_train_step": 24.925817012786865, "step": 448}
{"train_info/time_between_train_steps": 0.01648092269897461, "step": 448}
{"info/global_step": 449, "train_info/time_within_train_step": 24.981168508529663, "step": 449}
{"train_info/time_between_train_steps": 0.005155801773071289, "step": 449}
{"info/global_step": 450, "train_info/time_within_train_step": 24.999817609786987, "step": 450}
{"train_info": {"train_info/memory_allocated": 1581.5546875, "train_info/memory_max_allocated": 18057.0224609375, "train_info/memory_reserved": 19104.0, "train_info/memory_max_reserved": 19104.0, "_timestamp": 1734218340, "_runtime": 11402}, "step": 450}
{"logs": {"train/loss": 3.2894, "train/learning_rate": 0.00041666666666666664, "train/epoch": 12.02, "_timestamp": 1734218340, "_runtime": 11402}, "step": 450}
{"train_info/time_between_train_steps": 0.007303714752197266, "step": 450}
{"info/global_step": 451, "train_info/time_within_train_step": 24.958624601364136, "step": 451}
{"train_info/time_between_train_steps": 0.005357027053833008, "step": 451}
{"info/global_step": 452, "train_info/time_within_train_step": 24.81814694404602, "step": 452}
{"train_info/time_between_train_steps": 0.005127668380737305, "step": 452}
{"info/global_step": 453, "train_info/time_within_train_step": 24.87054419517517, "step": 453}
{"train_info/time_between_train_steps": 0.009902238845825195, "step": 453}
{"info/global_step": 454, "train_info/time_within_train_step": 24.803868532180786, "step": 454}
{"train_info/time_between_train_steps": 0.0052568912506103516, "step": 454}
{"info/global_step": 455, "train_info/time_within_train_step": 24.8432035446167, "step": 455}
{"train_info/time_between_train_steps": 0.00998544692993164, "step": 455}
{"info/global_step": 456, "train_info/time_within_train_step": 24.897125244140625, "step": 456}
{"train_info/time_between_train_steps": 0.005254983901977539, "step": 456}
{"info/global_step": 457, "train_info/time_within_train_step": 25.075998783111572, "step": 457}
{"train_info/time_between_train_steps": 0.009683847427368164, "step": 457}
{"info/global_step": 458, "train_info/time_within_train_step": 24.89471673965454, "step": 458}
{"train_info/time_between_train_steps": 0.005135059356689453, "step": 458}
{"info/global_step": 459, "train_info/time_within_train_step": 24.93579125404358, "step": 459}
{"train_info/time_between_train_steps": 0.0061495304107666016, "step": 459}
{"info/global_step": 460, "train_info/time_within_train_step": 24.861058950424194, "step": 460}
{"train_info/time_between_train_steps": 0.005362749099731445, "step": 460}
{"info/global_step": 461, "train_info/time_within_train_step": 24.80672836303711, "step": 461}
{"train_info/time_between_train_steps": 0.005156993865966797, "step": 461}
{"info/global_step": 462, "train_info/time_within_train_step": 24.8741455078125, "step": 462}
{"train_info/time_between_train_steps": 0.008953571319580078, "step": 462}
{"info/global_step": 463, "train_info/time_within_train_step": 24.879088163375854, "step": 463}
{"train_info/time_between_train_steps": 0.005253791809082031, "step": 463}
{"info/global_step": 464, "train_info/time_within_train_step": 24.852242708206177, "step": 464}
{"train_info/time_between_train_steps": 0.005296230316162109, "step": 464}
{"info/global_step": 465, "train_info/time_within_train_step": 25.007609128952026, "step": 465}
{"train_info/time_between_train_steps": 0.005368232727050781, "step": 465}
{"info/global_step": 466, "train_info/time_within_train_step": 24.906289100646973, "step": 466}
{"train_info/time_between_train_steps": 0.010174036026000977, "step": 466}
{"info/global_step": 467, "train_info/time_within_train_step": 24.953768253326416, "step": 467}
{"train_info/time_between_train_steps": 0.005896091461181641, "step": 467}
{"info/global_step": 468, "train_info/time_within_train_step": 24.93068289756775, "step": 468}
{"train_info/time_between_train_steps": 0.01153707504272461, "step": 468}
{"train_info/time_between_train_steps": 13.2455153465271, "step": 468}
{"info/global_step": 469, "train_info/time_within_train_step": 24.86289668083191, "step": 469}
{"train_info/time_between_train_steps": 0.008642435073852539, "step": 469}
{"info/global_step": 470, "train_info/time_within_train_step": 25.07168483734131, "step": 470}
{"train_info/time_between_train_steps": 0.005402565002441406, "step": 470}
{"info/global_step": 471, "train_info/time_within_train_step": 24.881560564041138, "step": 471}
{"train_info/time_between_train_steps": 0.009321928024291992, "step": 471}
{"info/global_step": 472, "train_info/time_within_train_step": 25.133789777755737, "step": 472}
{"train_info/time_between_train_steps": 0.00586700439453125, "step": 472}
{"info/global_step": 473, "train_info/time_within_train_step": 24.856048583984375, "step": 473}
{"train_info/time_between_train_steps": 0.005964517593383789, "step": 473}
{"info/global_step": 474, "train_info/time_within_train_step": 25.0996572971344, "step": 474}
{"train_info/time_between_train_steps": 0.005662679672241211, "step": 474}
{"info/global_step": 475, "train_info/time_within_train_step": 25.005157232284546, "step": 475}
{"train_info/time_between_train_steps": 0.005824089050292969, "step": 475}
{"info/global_step": 476, "train_info/time_within_train_step": 25.11406660079956, "step": 476}
{"train_info/time_between_train_steps": 0.005961894989013672, "step": 476}
{"info/global_step": 477, "train_info/time_within_train_step": 24.837961673736572, "step": 477}
{"train_info/time_between_train_steps": 0.005842447280883789, "step": 477}
{"info/global_step": 478, "train_info/time_within_train_step": 25.064075708389282, "step": 478}
{"train_info/time_between_train_steps": 0.005596160888671875, "step": 478}
{"info/global_step": 479, "train_info/time_within_train_step": 24.83051300048828, "step": 479}
{"train_info/time_between_train_steps": 0.005865573883056641, "step": 479}
{"info/global_step": 480, "train_info/time_within_train_step": 25.10558843612671, "step": 480}
{"train_info/time_between_train_steps": 0.005792379379272461, "step": 480}
{"info/global_step": 481, "train_info/time_within_train_step": 24.890981912612915, "step": 481}
{"train_info/time_between_train_steps": 0.007261514663696289, "step": 481}
{"info/global_step": 482, "train_info/time_within_train_step": 25.197689294815063, "step": 482}
{"train_info/time_between_train_steps": 0.007628440856933594, "step": 482}
{"info/global_step": 483, "train_info/time_within_train_step": 24.93272876739502, "step": 483}
{"train_info/time_between_train_steps": 0.010264873504638672, "step": 483}
{"info/global_step": 484, "train_info/time_within_train_step": 25.13609504699707, "step": 484}
{"train_info/time_between_train_steps": 0.005661964416503906, "step": 484}
{"info/global_step": 485, "train_info/time_within_train_step": 24.89974856376648, "step": 485}
{"train_info/time_between_train_steps": 0.0052988529205322266, "step": 485}
{"info/global_step": 486, "train_info/time_within_train_step": 24.852144479751587, "step": 486}
{"train_info/time_between_train_steps": 0.005437135696411133, "step": 486}
{"info/global_step": 487, "train_info/time_within_train_step": 24.846823930740356, "step": 487}
{"train_info/time_between_train_steps": 0.011287689208984375, "step": 487}
{"info/global_step": 488, "train_info/time_within_train_step": 24.914772272109985, "step": 488}
{"train_info/time_between_train_steps": 0.009269237518310547, "step": 488}
{"info/global_step": 489, "train_info/time_within_train_step": 24.947255611419678, "step": 489}
{"train_info/time_between_train_steps": 0.005305290222167969, "step": 489}
{"info/global_step": 490, "train_info/time_within_train_step": 24.861377239227295, "step": 490}
{"train_info/time_between_train_steps": 0.0055468082427978516, "step": 490}
{"info/global_step": 491, "train_info/time_within_train_step": 24.82470726966858, "step": 491}
{"train_info/time_between_train_steps": 0.0069081783294677734, "step": 491}
{"info/global_step": 492, "train_info/time_within_train_step": 24.82248616218567, "step": 492}
{"train_info/time_between_train_steps": 0.0052835941314697266, "step": 492}
{"info/global_step": 493, "train_info/time_within_train_step": 24.795273303985596, "step": 493}
{"train_info/time_between_train_steps": 0.006873607635498047, "step": 493}
{"info/global_step": 494, "train_info/time_within_train_step": 24.913888216018677, "step": 494}
{"train_info/time_between_train_steps": 0.005329608917236328, "step": 494}
{"info/global_step": 495, "train_info/time_within_train_step": 24.922534704208374, "step": 495}
{"train_info/time_between_train_steps": 0.010369539260864258, "step": 495}
{"info/global_step": 496, "train_info/time_within_train_step": 24.88800883293152, "step": 496}
{"train_info/time_between_train_steps": 0.005483865737915039, "step": 496}
{"info/global_step": 497, "train_info/time_within_train_step": 24.836721420288086, "step": 497}
{"train_info/time_between_train_steps": 0.005776405334472656, "step": 497}
{"info/global_step": 498, "train_info/time_within_train_step": 24.833728075027466, "step": 498}
{"train_info/time_between_train_steps": 0.005445241928100586, "step": 498}
{"info/global_step": 499, "train_info/time_within_train_step": 24.84612274169922, "step": 499}
{"train_info/time_between_train_steps": 0.00521087646484375, "step": 499}
{"info/global_step": 500, "train_info/time_within_train_step": 24.851053953170776, "step": 500}
{"train_info": {"train_info/memory_allocated": 1581.5546875, "train_info/memory_max_allocated": 18057.0224609375, "train_info/memory_reserved": 19104.0, "train_info/memory_max_reserved": 19104.0, "_timestamp": 1734219600, "_runtime": 12662}, "step": 500}
{"logs": {"train/loss": 3.1879, "train/learning_rate": 0.00038888888888888887, "train/epoch": 13.03, "_timestamp": 1734219600, "_runtime": 12662}, "step": 500}
{"train_info/time_between_train_steps": 1.8675737380981445, "step": 500}
{"info/global_step": 501, "train_info/time_within_train_step": 24.80376434326172, "step": 501}
{"train_info/time_between_train_steps": 0.005285739898681641, "step": 501}
{"info/global_step": 502, "train_info/time_within_train_step": 24.85712218284607, "step": 502}
{"train_info/time_between_train_steps": 0.005399227142333984, "step": 502}
{"info/global_step": 503, "train_info/time_within_train_step": 24.840795516967773, "step": 503}
{"train_info/time_between_train_steps": 0.005771636962890625, "step": 503}
{"info/global_step": 504, "train_info/time_within_train_step": 24.871382236480713, "step": 504}
{"train_info/time_between_train_steps": 0.006017208099365234, "step": 504}
{"train_info/time_between_train_steps": 12.913892269134521, "step": 504}
{"info/global_step": 505, "train_info/time_within_train_step": 24.850293159484863, "step": 505}
{"train_info/time_between_train_steps": 0.005494117736816406, "step": 505}
{"info/global_step": 506, "train_info/time_within_train_step": 24.94628119468689, "step": 506}
{"train_info/time_between_train_steps": 0.005418062210083008, "step": 506}
{"info/global_step": 507, "train_info/time_within_train_step": 24.86908793449402, "step": 507}
{"train_info/time_between_train_steps": 0.005275726318359375, "step": 507}
{"info/global_step": 508, "train_info/time_within_train_step": 25.00569176673889, "step": 508}
{"train_info/time_between_train_steps": 0.00555109977722168, "step": 508}
{"info/global_step": 509, "train_info/time_within_train_step": 24.89737582206726, "step": 509}
{"train_info/time_between_train_steps": 0.005739450454711914, "step": 509}
{"info/global_step": 510, "train_info/time_within_train_step": 25.09162950515747, "step": 510}
{"train_info/time_between_train_steps": 0.005973339080810547, "step": 510}
{"info/global_step": 511, "train_info/time_within_train_step": 24.962091207504272, "step": 511}
{"train_info/time_between_train_steps": 0.010114669799804688, "step": 511}
{"info/global_step": 512, "train_info/time_within_train_step": 25.117517709732056, "step": 512}
{"train_info/time_between_train_steps": 0.0054285526275634766, "step": 512}
{"info/global_step": 513, "train_info/time_within_train_step": 24.912519454956055, "step": 513}
{"train_info/time_between_train_steps": 0.011022329330444336, "step": 513}
{"info/global_step": 514, "train_info/time_within_train_step": 25.005185842514038, "step": 514}
{"train_info/time_between_train_steps": 0.011158943176269531, "step": 514}
{"info/global_step": 515, "train_info/time_within_train_step": 24.89017915725708, "step": 515}
{"train_info/time_between_train_steps": 0.0068666934967041016, "step": 515}
{"info/global_step": 516, "train_info/time_within_train_step": 25.13925814628601, "step": 516}
{"train_info/time_between_train_steps": 0.00557708740234375, "step": 516}
{"info/global_step": 517, "train_info/time_within_train_step": 24.836405515670776, "step": 517}
{"train_info/time_between_train_steps": 0.005829811096191406, "step": 517}
{"info/global_step": 518, "train_info/time_within_train_step": 24.99944829940796, "step": 518}
{"train_info/time_between_train_steps": 0.0052759647369384766, "step": 518}
{"info/global_step": 519, "train_info/time_within_train_step": 24.942430019378662, "step": 519}
{"train_info/time_between_train_steps": 0.0074388980865478516, "step": 519}
{"info/global_step": 520, "train_info/time_within_train_step": 25.003775596618652, "step": 520}
{"train_info/time_between_train_steps": 0.005394697189331055, "step": 520}
{"info/global_step": 521, "train_info/time_within_train_step": 24.920836687088013, "step": 521}
{"train_info/time_between_train_steps": 0.009518623352050781, "step": 521}
{"info/global_step": 522, "train_info/time_within_train_step": 24.846921920776367, "step": 522}
{"train_info/time_between_train_steps": 0.0051381587982177734, "step": 522}
{"info/global_step": 523, "train_info/time_within_train_step": 24.86945629119873, "step": 523}
{"train_info/time_between_train_steps": 0.005387067794799805, "step": 523}
{"info/global_step": 524, "train_info/time_within_train_step": 24.889779806137085, "step": 524}
{"train_info/time_between_train_steps": 0.006894826889038086, "step": 524}
{"info/global_step": 525, "train_info/time_within_train_step": 24.894327402114868, "step": 525}
{"train_info/time_between_train_steps": 0.005495309829711914, "step": 525}
{"info/global_step": 526, "train_info/time_within_train_step": 24.908384561538696, "step": 526}
{"train_info/time_between_train_steps": 0.0054433345794677734, "step": 526}
{"info/global_step": 527, "train_info/time_within_train_step": 24.869102001190186, "step": 527}
{"train_info/time_between_train_steps": 0.00543975830078125, "step": 527}
{"info/global_step": 528, "train_info/time_within_train_step": 24.950337409973145, "step": 528}
{"train_info/time_between_train_steps": 0.010113716125488281, "step": 528}
{"info/global_step": 529, "train_info/time_within_train_step": 24.86682105064392, "step": 529}
{"train_info/time_between_train_steps": 0.005478858947753906, "step": 529}
{"info/global_step": 530, "train_info/time_within_train_step": 24.85325288772583, "step": 530}
{"train_info/time_between_train_steps": 0.005439043045043945, "step": 530}
{"info/global_step": 531, "train_info/time_within_train_step": 24.90516495704651, "step": 531}
{"train_info/time_between_train_steps": 0.006929874420166016, "step": 531}
{"info/global_step": 532, "train_info/time_within_train_step": 24.814308404922485, "step": 532}
{"train_info/time_between_train_steps": 0.00540471076965332, "step": 532}
{"info/global_step": 533, "train_info/time_within_train_step": 24.80941152572632, "step": 533}
{"train_info/time_between_train_steps": 0.00534510612487793, "step": 533}
{"info/global_step": 534, "train_info/time_within_train_step": 24.864794731140137, "step": 534}
{"train_info/time_between_train_steps": 0.006985664367675781, "step": 534}
{"info/global_step": 535, "train_info/time_within_train_step": 24.86086344718933, "step": 535}
{"train_info/time_between_train_steps": 0.005239009857177734, "step": 535}
{"info/global_step": 536, "train_info/time_within_train_step": 24.872230052947998, "step": 536}
{"train_info/time_between_train_steps": 0.0054934024810791016, "step": 536}
{"info/global_step": 537, "train_info/time_within_train_step": 24.83903479576111, "step": 537}
{"train_info/time_between_train_steps": 0.006072998046875, "step": 537}
{"info/global_step": 538, "train_info/time_within_train_step": 24.968612670898438, "step": 538}
{"train_info/time_between_train_steps": 0.005458354949951172, "step": 538}
{"info/global_step": 539, "train_info/time_within_train_step": 24.889281511306763, "step": 539}
{"train_info/time_between_train_steps": 0.005738019943237305, "step": 539}
{"info/global_step": 540, "train_info/time_within_train_step": 24.867523908615112, "step": 540}
{"train_info/time_between_train_steps": 0.011482000350952148, "step": 540}
{"train_info/time_between_train_steps": 13.131466388702393, "step": 540}
{"info/global_step": 541, "train_info/time_within_train_step": 24.843602895736694, "step": 541}
{"train_info/time_between_train_steps": 0.005831241607666016, "step": 541}
{"info/global_step": 542, "train_info/time_within_train_step": 25.161009788513184, "step": 542}
{"train_info/time_between_train_steps": 0.0056192874908447266, "step": 542}
{"info/global_step": 543, "train_info/time_within_train_step": 24.815701007843018, "step": 543}
{"train_info/time_between_train_steps": 0.005819797515869141, "step": 543}
{"info/global_step": 544, "train_info/time_within_train_step": 25.058030366897583, "step": 544}
{"train_info/time_between_train_steps": 0.011285066604614258, "step": 544}
{"info/global_step": 545, "train_info/time_within_train_step": 24.895073652267456, "step": 545}
{"train_info/time_between_train_steps": 0.0057981014251708984, "step": 545}
{"info/global_step": 546, "train_info/time_within_train_step": 25.138479471206665, "step": 546}
{"train_info/time_between_train_steps": 0.005792140960693359, "step": 546}
{"info/global_step": 547, "train_info/time_within_train_step": 24.878005266189575, "step": 547}
{"train_info/time_between_train_steps": 0.005668163299560547, "step": 547}
{"info/global_step": 548, "train_info/time_within_train_step": 25.082815885543823, "step": 548}
{"train_info/time_between_train_steps": 0.0065877437591552734, "step": 548}
{"info/global_step": 549, "train_info/time_within_train_step": 24.885939598083496, "step": 549}
{"train_info/time_between_train_steps": 0.005832195281982422, "step": 549}
{"info/global_step": 550, "train_info/time_within_train_step": 25.080148935317993, "step": 550}
{"train_info": {"train_info/memory_allocated": 1581.5546875, "train_info/memory_max_allocated": 18057.0224609375, "train_info/memory_reserved": 19104.0, "train_info/memory_max_reserved": 19104.0, "_timestamp": 1734220874, "_runtime": 13936}, "step": 550}
{"logs": {"train/loss": 3.1259, "train/learning_rate": 0.0003611111111111111, "train/epoch": 15.01, "_timestamp": 1734220874, "_runtime": 13936}, "step": 550}
{"train_info/time_between_train_steps": 0.008143424987792969, "step": 550}
{"info/global_step": 551, "train_info/time_within_train_step": 24.93157386779785, "step": 551}
{"train_info/time_between_train_steps": 0.006067991256713867, "step": 551}
{"info/global_step": 552, "train_info/time_within_train_step": 25.126056671142578, "step": 552}
{"train_info/time_between_train_steps": 0.00627446174621582, "step": 552}
{"info/global_step": 553, "train_info/time_within_train_step": 24.96405816078186, "step": 553}
{"train_info/time_between_train_steps": 0.005934715270996094, "step": 553}
{"info/global_step": 554, "train_info/time_within_train_step": 25.14659881591797, "step": 554}
{"train_info/time_between_train_steps": 0.009643077850341797, "step": 554}
{"info/global_step": 555, "train_info/time_within_train_step": 24.8339262008667, "step": 555}
{"train_info/time_between_train_steps": 0.005845546722412109, "step": 555}
{"info/global_step": 556, "train_info/time_within_train_step": 25.057020902633667, "step": 556}
{"train_info/time_between_train_steps": 0.0053822994232177734, "step": 556}
{"info/global_step": 557, "train_info/time_within_train_step": 24.9885516166687, "step": 557}
{"train_info/time_between_train_steps": 0.0050830841064453125, "step": 557}
{"info/global_step": 558, "train_info/time_within_train_step": 24.842583894729614, "step": 558}
{"train_info/time_between_train_steps": 0.0054931640625, "step": 558}
{"info/global_step": 559, "train_info/time_within_train_step": 24.827571153640747, "step": 559}
{"train_info/time_between_train_steps": 0.009921073913574219, "step": 559}
{"info/global_step": 560, "train_info/time_within_train_step": 24.952800512313843, "step": 560}
{"train_info/time_between_train_steps": 0.005112886428833008, "step": 560}
{"info/global_step": 561, "train_info/time_within_train_step": 24.82232427597046, "step": 561}
{"train_info/time_between_train_steps": 0.0066602230072021484, "step": 561}
{"info/global_step": 562, "train_info/time_within_train_step": 24.8420569896698, "step": 562}
{"train_info/time_between_train_steps": 0.005358457565307617, "step": 562}
{"info/global_step": 563, "train_info/time_within_train_step": 24.88874840736389, "step": 563}
{"train_info/time_between_train_steps": 0.005240201950073242, "step": 563}
{"info/global_step": 564, "train_info/time_within_train_step": 24.912997007369995, "step": 564}
{"train_info/time_between_train_steps": 0.0052242279052734375, "step": 564}
{"info/global_step": 565, "train_info/time_within_train_step": 24.939799785614014, "step": 565}
{"train_info/time_between_train_steps": 0.005189180374145508, "step": 565}
{"info/global_step": 566, "train_info/time_within_train_step": 24.85484790802002, "step": 566}
{"train_info/time_between_train_steps": 0.0053558349609375, "step": 566}
{"info/global_step": 567, "train_info/time_within_train_step": 24.85260319709778, "step": 567}
{"train_info/time_between_train_steps": 0.0052700042724609375, "step": 567}
{"info/global_step": 568, "train_info/time_within_train_step": 24.86409878730774, "step": 568}
{"train_info/time_between_train_steps": 0.005453824996948242, "step": 568}
{"info/global_step": 569, "train_info/time_within_train_step": 24.839359283447266, "step": 569}
{"train_info/time_between_train_steps": 0.006033658981323242, "step": 569}
{"info/global_step": 570, "train_info/time_within_train_step": 24.820981740951538, "step": 570}
{"train_info/time_between_train_steps": 0.005151510238647461, "step": 570}
{"info/global_step": 571, "train_info/time_within_train_step": 24.8035409450531, "step": 571}
{"train_info/time_between_train_steps": 0.0052759647369384766, "step": 571}
{"info/global_step": 572, "train_info/time_within_train_step": 24.885759353637695, "step": 572}
{"train_info/time_between_train_steps": 0.00526118278503418, "step": 572}
{"info/global_step": 573, "train_info/time_within_train_step": 24.941696643829346, "step": 573}
{"train_info/time_between_train_steps": 0.010706424713134766, "step": 573}
{"info/global_step": 574, "train_info/time_within_train_step": 24.95136570930481, "step": 574}
{"train_info/time_between_train_steps": 0.0054552555084228516, "step": 574}
{"info/global_step": 575, "train_info/time_within_train_step": 24.833459615707397, "step": 575}
{"train_info/time_between_train_steps": 0.005760669708251953, "step": 575}
{"info/global_step": 576, "train_info/time_within_train_step": 24.924802780151367, "step": 576}
{"train_info/time_between_train_steps": 0.010787487030029297, "step": 576}
{"train_info/time_between_train_steps": 13.188599586486816, "step": 576}
{"info/global_step": 577, "train_info/time_within_train_step": 24.88278031349182, "step": 577}
{"train_info/time_between_train_steps": 0.0051615238189697266, "step": 577}
{"info/global_step": 578, "train_info/time_within_train_step": 25.105555057525635, "step": 578}
{"train_info/time_between_train_steps": 0.0053784847259521484, "step": 578}
{"info/global_step": 579, "train_info/time_within_train_step": 24.90898823738098, "step": 579}
{"train_info/time_between_train_steps": 0.010037899017333984, "step": 579}
{"info/global_step": 580, "train_info/time_within_train_step": 24.975088834762573, "step": 580}
{"train_info/time_between_train_steps": 0.0053403377532958984, "step": 580}
{"info/global_step": 581, "train_info/time_within_train_step": 24.869656801223755, "step": 581}
{"train_info/time_between_train_steps": 0.005444765090942383, "step": 581}
{"info/global_step": 582, "train_info/time_within_train_step": 25.154178142547607, "step": 582}
{"train_info/time_between_train_steps": 0.0051500797271728516, "step": 582}
{"info/global_step": 583, "train_info/time_within_train_step": 24.825838088989258, "step": 583}
{"train_info/time_between_train_steps": 0.005334615707397461, "step": 583}
{"info/global_step": 584, "train_info/time_within_train_step": 25.056143760681152, "step": 584}
{"train_info/time_between_train_steps": 0.005424976348876953, "step": 584}
{"info/global_step": 585, "train_info/time_within_train_step": 24.861613988876343, "step": 585}
{"train_info/time_between_train_steps": 0.005391597747802734, "step": 585}
{"info/global_step": 586, "train_info/time_within_train_step": 25.058395385742188, "step": 586}
{"train_info/time_between_train_steps": 0.005341529846191406, "step": 586}
{"info/global_step": 587, "train_info/time_within_train_step": 24.880602836608887, "step": 587}
{"train_info/time_between_train_steps": 0.0053708553314208984, "step": 587}
{"info/global_step": 588, "train_info/time_within_train_step": 25.0817449092865, "step": 588}
{"train_info/time_between_train_steps": 0.0070192813873291016, "step": 588}
{"info/global_step": 589, "train_info/time_within_train_step": 24.91502046585083, "step": 589}
{"train_info/time_between_train_steps": 0.005591392517089844, "step": 589}
{"info/global_step": 590, "train_info/time_within_train_step": 25.153035163879395, "step": 590}
{"train_info/time_between_train_steps": 0.005483388900756836, "step": 590}
{"info/global_step": 591, "train_info/time_within_train_step": 24.866706371307373, "step": 591}
{"train_info/time_between_train_steps": 0.005715608596801758, "step": 591}
{"info/global_step": 592, "train_info/time_within_train_step": 24.963454484939575, "step": 592}
{"train_info/time_between_train_steps": 0.005494117736816406, "step": 592}
{"info/global_step": 593, "train_info/time_within_train_step": 24.84509253501892, "step": 593}
{"train_info/time_between_train_steps": 0.00526738166809082, "step": 593}
{"info/global_step": 594, "train_info/time_within_train_step": 24.942549228668213, "step": 594}
{"train_info/time_between_train_steps": 0.006382465362548828, "step": 594}
{"info/global_step": 595, "train_info/time_within_train_step": 24.915077209472656, "step": 595}
{"train_info/time_between_train_steps": 0.009911537170410156, "step": 595}
{"info/global_step": 596, "train_info/time_within_train_step": 24.903676748275757, "step": 596}
{"train_info/time_between_train_steps": 0.005239963531494141, "step": 596}
{"info/global_step": 597, "train_info/time_within_train_step": 24.83132839202881, "step": 597}
{"train_info/time_between_train_steps": 0.0052869319915771484, "step": 597}
{"info/global_step": 598, "train_info/time_within_train_step": 24.881170511245728, "step": 598}
{"train_info/time_between_train_steps": 0.00535130500793457, "step": 598}
{"info/global_step": 599, "train_info/time_within_train_step": 24.831544876098633, "step": 599}
{"train_info/time_between_train_steps": 0.00537109375, "step": 599}
{"info/global_step": 600, "train_info/time_within_train_step": 24.826813459396362, "step": 600}
{"train_info": {"train_info/memory_allocated": 1581.5546875, "train_info/memory_max_allocated": 18057.0224609375, "train_info/memory_reserved": 19104.0, "train_info/memory_max_reserved": 19104.0, "_timestamp": 1734222134, "_runtime": 15196}, "step": 600}
{"logs": {"train/loss": 3.0262, "train/learning_rate": 0.0003333333333333333, "train/epoch": 16.02, "_timestamp": 1734222134, "_runtime": 15196}, "step": 600}
{"train_info/time_between_train_steps": 2.2007155418395996, "step": 600}
{"info/global_step": 601, "train_info/time_within_train_step": 24.884282112121582, "step": 601}
{"train_info/time_between_train_steps": 0.005409955978393555, "step": 601}
{"info/global_step": 602, "train_info/time_within_train_step": 24.86073350906372, "step": 602}
{"train_info/time_between_train_steps": 0.0052754878997802734, "step": 602}
{"info/global_step": 603, "train_info/time_within_train_step": 24.813438653945923, "step": 603}
{"train_info/time_between_train_steps": 0.006436586380004883, "step": 603}
{"info/global_step": 604, "train_info/time_within_train_step": 24.97272229194641, "step": 604}
{"train_info/time_between_train_steps": 0.010952949523925781, "step": 604}
{"info/global_step": 605, "train_info/time_within_train_step": 24.92012929916382, "step": 605}
{"train_info/time_between_train_steps": 0.00527501106262207, "step": 605}
{"info/global_step": 606, "train_info/time_within_train_step": 24.859868049621582, "step": 606}
{"train_info/time_between_train_steps": 0.005331516265869141, "step": 606}
{"info/global_step": 607, "train_info/time_within_train_step": 24.863648891448975, "step": 607}
{"train_info/time_between_train_steps": 0.010284662246704102, "step": 607}
{"info/global_step": 608, "train_info/time_within_train_step": 24.818811178207397, "step": 608}
{"train_info/time_between_train_steps": 0.005482912063598633, "step": 608}
{"info/global_step": 609, "train_info/time_within_train_step": 24.88124394416809, "step": 609}
{"train_info/time_between_train_steps": 0.0055768489837646484, "step": 609}
{"info/global_step": 610, "train_info/time_within_train_step": 24.8748562335968, "step": 610}
{"train_info/time_between_train_steps": 0.005577564239501953, "step": 610}
{"info/global_step": 611, "train_info/time_within_train_step": 24.85880184173584, "step": 611}
{"train_info/time_between_train_steps": 0.005891084671020508, "step": 611}
{"info/global_step": 612, "train_info/time_within_train_step": 24.92705750465393, "step": 612}
{"train_info/time_between_train_steps": 0.006356716156005859, "step": 612}
{"train_info/time_between_train_steps": 13.686044931411743, "step": 612}
{"info/global_step": 613, "train_info/time_within_train_step": 24.849804401397705, "step": 613}
{"train_info/time_between_train_steps": 0.0051386356353759766, "step": 613}
{"info/global_step": 614, "train_info/time_within_train_step": 25.013111114501953, "step": 614}
{"train_info/time_between_train_steps": 0.005005836486816406, "step": 614}
{"info/global_step": 615, "train_info/time_within_train_step": 24.888856649398804, "step": 615}
{"train_info/time_between_train_steps": 0.009951591491699219, "step": 615}
{"info/global_step": 616, "train_info/time_within_train_step": 24.986745595932007, "step": 616}
{"train_info/time_between_train_steps": 0.010351181030273438, "step": 616}
{"info/global_step": 617, "train_info/time_within_train_step": 24.872631788253784, "step": 617}
{"train_info/time_between_train_steps": 0.010468006134033203, "step": 617}
{"info/global_step": 618, "train_info/time_within_train_step": 24.98721742630005, "step": 618}
{"train_info/time_between_train_steps": 0.0055119991302490234, "step": 618}
{"info/global_step": 619, "train_info/time_within_train_step": 25.001556634902954, "step": 619}
{"train_info/time_between_train_steps": 0.005318880081176758, "step": 619}
{"info/global_step": 620, "train_info/time_within_train_step": 24.978041887283325, "step": 620}
{"train_info/time_between_train_steps": 0.005305290222167969, "step": 620}
{"info/global_step": 621, "train_info/time_within_train_step": 24.864333629608154, "step": 621}
{"train_info/time_between_train_steps": 0.0055522918701171875, "step": 621}
{"info/global_step": 622, "train_info/time_within_train_step": 25.092259168624878, "step": 622}
{"train_info/time_between_train_steps": 0.01022481918334961, "step": 622}
{"info/global_step": 623, "train_info/time_within_train_step": 24.906385898590088, "step": 623}
{"train_info/time_between_train_steps": 0.010372161865234375, "step": 623}
{"info/global_step": 624, "train_info/time_within_train_step": 24.964969158172607, "step": 624}
{"train_info/time_between_train_steps": 0.005382537841796875, "step": 624}
{"info/global_step": 625, "train_info/time_within_train_step": 24.87836503982544, "step": 625}
{"train_info/time_between_train_steps": 0.00576472282409668, "step": 625}
{"info/global_step": 626, "train_info/time_within_train_step": 25.173921585083008, "step": 626}
{"train_info/time_between_train_steps": 0.007264375686645508, "step": 626}
{"info/global_step": 627, "train_info/time_within_train_step": 25.17004919052124, "step": 627}
{"train_info/time_between_train_steps": 0.005307912826538086, "step": 627}
{"info/global_step": 628, "train_info/time_within_train_step": 24.917709350585938, "step": 628}
{"train_info/time_between_train_steps": 0.0052492618560791016, "step": 628}
{"info/global_step": 629, "train_info/time_within_train_step": 24.899018049240112, "step": 629}
{"train_info/time_between_train_steps": 0.009771108627319336, "step": 629}
{"info/global_step": 630, "train_info/time_within_train_step": 24.798579216003418, "step": 630}
{"train_info/time_between_train_steps": 0.00494384765625, "step": 630}
{"info/global_step": 631, "train_info/time_within_train_step": 24.833930492401123, "step": 631}
{"train_info/time_between_train_steps": 0.009662389755249023, "step": 631}
{"info/global_step": 632, "train_info/time_within_train_step": 24.99925661087036, "step": 632}
{"train_info/time_between_train_steps": 0.009842634201049805, "step": 632}
{"info/global_step": 633, "train_info/time_within_train_step": 24.819513082504272, "step": 633}
{"train_info/time_between_train_steps": 0.005167722702026367, "step": 633}
{"info/global_step": 634, "train_info/time_within_train_step": 25.01201057434082, "step": 634}
{"train_info/time_between_train_steps": 0.007008790969848633, "step": 634}
{"info/global_step": 635, "train_info/time_within_train_step": 24.863290071487427, "step": 635}
{"train_info/time_between_train_steps": 0.005349874496459961, "step": 635}
{"info/global_step": 636, "train_info/time_within_train_step": 24.840529203414917, "step": 636}
{"train_info/time_between_train_steps": 0.0052678585052490234, "step": 636}
{"info/global_step": 637, "train_info/time_within_train_step": 24.818865060806274, "step": 637}
{"train_info/time_between_train_steps": 0.00684356689453125, "step": 637}
{"info/global_step": 638, "train_info/time_within_train_step": 24.823858737945557, "step": 638}
{"train_info/time_between_train_steps": 0.005226612091064453, "step": 638}
{"info/global_step": 639, "train_info/time_within_train_step": 24.907450675964355, "step": 639}
{"train_info/time_between_train_steps": 0.00528407096862793, "step": 639}
{"info/global_step": 640, "train_info/time_within_train_step": 24.926746606826782, "step": 640}
{"train_info/time_between_train_steps": 0.005357265472412109, "step": 640}
{"info/global_step": 641, "train_info/time_within_train_step": 24.854747533798218, "step": 641}
{"train_info/time_between_train_steps": 0.006382942199707031, "step": 641}
{"info/global_step": 642, "train_info/time_within_train_step": 24.834380626678467, "step": 642}
{"train_info/time_between_train_steps": 0.006665468215942383, "step": 642}
{"info/global_step": 643, "train_info/time_within_train_step": 24.849488258361816, "step": 643}
{"train_info/time_between_train_steps": 0.00693821907043457, "step": 643}
{"info/global_step": 644, "train_info/time_within_train_step": 24.83594584465027, "step": 644}
{"train_info/time_between_train_steps": 0.005437612533569336, "step": 644}
{"info/global_step": 645, "train_info/time_within_train_step": 24.847956895828247, "step": 645}
{"train_info/time_between_train_steps": 0.0053255558013916016, "step": 645}
{"info/global_step": 646, "train_info/time_within_train_step": 24.878829956054688, "step": 646}
{"train_info/time_between_train_steps": 0.00925755500793457, "step": 646}
{"info/global_step": 647, "train_info/time_within_train_step": 24.912137508392334, "step": 647}
{"train_info/time_between_train_steps": 0.005961418151855469, "step": 647}
{"info/global_step": 648, "train_info/time_within_train_step": 25.07262134552002, "step": 648}
{"train_info/time_between_train_steps": 0.011075735092163086, "step": 648}
{"train_info/time_between_train_steps": 12.927958011627197, "step": 648}
{"info/global_step": 649, "train_info/time_within_train_step": 24.818776607513428, "step": 649}
{"train_info/time_between_train_steps": 0.005021810531616211, "step": 649}
{"info/global_step": 650, "train_info/time_within_train_step": 25.03152847290039, "step": 650}
{"train_info": {"train_info/memory_allocated": 1581.5546875, "train_info/memory_max_allocated": 18057.0224609375, "train_info/memory_reserved": 19104.0, "train_info/memory_max_reserved": 19104.0, "_timestamp": 1734223409, "_runtime": 16471}, "step": 650}
{"logs": {"train/loss": 2.9853, "train/learning_rate": 0.00030555555555555555, "train/epoch": 18.0, "_timestamp": 1734223409, "_runtime": 16471}, "step": 650}
{"train_info/time_between_train_steps": 0.00709080696105957, "step": 650}
{"info/global_step": 651, "train_info/time_within_train_step": 24.824679374694824, "step": 651}
{"train_info/time_between_train_steps": 0.009786844253540039, "step": 651}
{"info/global_step": 652, "train_info/time_within_train_step": 25.034242868423462, "step": 652}
{"train_info/time_between_train_steps": 0.005425453186035156, "step": 652}
{"info/global_step": 653, "train_info/time_within_train_step": 24.84995675086975, "step": 653}
{"train_info/time_between_train_steps": 0.005499839782714844, "step": 653}
{"info/global_step": 654, "train_info/time_within_train_step": 25.036678791046143, "step": 654}
{"train_info/time_between_train_steps": 0.005450248718261719, "step": 654}
{"info/global_step": 655, "train_info/time_within_train_step": 24.877155542373657, "step": 655}
{"train_info/time_between_train_steps": 0.00527501106262207, "step": 655}
{"info/global_step": 656, "train_info/time_within_train_step": 24.95072078704834, "step": 656}
{"train_info/time_between_train_steps": 0.005378007888793945, "step": 656}
{"info/global_step": 657, "train_info/time_within_train_step": 24.87637734413147, "step": 657}
{"train_info/time_between_train_steps": 0.005580425262451172, "step": 657}
{"info/global_step": 658, "train_info/time_within_train_step": 25.118428945541382, "step": 658}
{"train_info/time_between_train_steps": 0.010280132293701172, "step": 658}
{"info/global_step": 659, "train_info/time_within_train_step": 24.899574279785156, "step": 659}
{"train_info/time_between_train_steps": 0.0054209232330322266, "step": 659}
{"info/global_step": 660, "train_info/time_within_train_step": 25.063084363937378, "step": 660}
{"train_info/time_between_train_steps": 0.010255813598632812, "step": 660}
{"info/global_step": 661, "train_info/time_within_train_step": 24.92264676094055, "step": 661}
{"train_info/time_between_train_steps": 0.005624294281005859, "step": 661}
{"info/global_step": 662, "train_info/time_within_train_step": 25.206746101379395, "step": 662}
{"train_info/time_between_train_steps": 0.005723714828491211, "step": 662}
{"info/global_step": 663, "train_info/time_within_train_step": 24.852110147476196, "step": 663}
{"train_info/time_between_train_steps": 0.0052144527435302734, "step": 663}
{"info/global_step": 664, "train_info/time_within_train_step": 24.894866704940796, "step": 664}
{"train_info/time_between_train_steps": 0.005375385284423828, "step": 664}
{"info/global_step": 665, "train_info/time_within_train_step": 25.03052806854248, "step": 665}
{"train_info/time_between_train_steps": 0.005076408386230469, "step": 665}
{"info/global_step": 666, "train_info/time_within_train_step": 24.83625054359436, "step": 666}
{"train_info/time_between_train_steps": 0.005040407180786133, "step": 666}
{"info/global_step": 667, "train_info/time_within_train_step": 24.850733757019043, "step": 667}
{"train_info/time_between_train_steps": 0.01125335693359375, "step": 667}
{"info/global_step": 668, "train_info/time_within_train_step": 24.83849573135376, "step": 668}
{"train_info/time_between_train_steps": 0.005125522613525391, "step": 668}
{"info/global_step": 669, "train_info/time_within_train_step": 24.824647665023804, "step": 669}
{"train_info/time_between_train_steps": 0.0054094791412353516, "step": 669}
{"info/global_step": 670, "train_info/time_within_train_step": 24.827686309814453, "step": 670}
{"train_info/time_between_train_steps": 0.005468606948852539, "step": 670}
{"info/global_step": 671, "train_info/time_within_train_step": 24.85394811630249, "step": 671}
{"train_info/time_between_train_steps": 0.010134696960449219, "step": 671}
{"info/global_step": 672, "train_info/time_within_train_step": 24.859093189239502, "step": 672}
{"train_info/time_between_train_steps": 0.005454301834106445, "step": 672}
{"info/global_step": 673, "train_info/time_within_train_step": 24.857227087020874, "step": 673}
{"train_info/time_between_train_steps": 0.005244016647338867, "step": 673}
{"info/global_step": 674, "train_info/time_within_train_step": 24.818758487701416, "step": 674}
{"train_info/time_between_train_steps": 0.005373954772949219, "step": 674}
{"info/global_step": 675, "train_info/time_within_train_step": 24.85346245765686, "step": 675}
{"train_info/time_between_train_steps": 0.005315065383911133, "step": 675}
{"info/global_step": 676, "train_info/time_within_train_step": 24.90540647506714, "step": 676}
{"train_info/time_between_train_steps": 0.005298137664794922, "step": 676}
{"info/global_step": 677, "train_info/time_within_train_step": 24.89534640312195, "step": 677}
{"train_info/time_between_train_steps": 0.005258798599243164, "step": 677}
{"info/global_step": 678, "train_info/time_within_train_step": 24.892264366149902, "step": 678}
{"train_info/time_between_train_steps": 0.009924173355102539, "step": 678}
{"info/global_step": 679, "train_info/time_within_train_step": 24.834885835647583, "step": 679}
{"train_info/time_between_train_steps": 0.005280971527099609, "step": 679}
{"info/global_step": 680, "train_info/time_within_train_step": 24.846224308013916, "step": 680}
{"train_info/time_between_train_steps": 0.005570888519287109, "step": 680}
{"info/global_step": 681, "train_info/time_within_train_step": 24.977795839309692, "step": 681}
{"train_info/time_between_train_steps": 0.010603666305541992, "step": 681}
{"info/global_step": 682, "train_info/time_within_train_step": 24.93028497695923, "step": 682}
{"train_info/time_between_train_steps": 0.005518913269042969, "step": 682}
{"info/global_step": 683, "train_info/time_within_train_step": 24.879460096359253, "step": 683}
{"train_info/time_between_train_steps": 0.005896329879760742, "step": 683}
{"info/global_step": 684, "train_info/time_within_train_step": 24.929694652557373, "step": 684}
{"train_info/time_between_train_steps": 0.006058931350708008, "step": 684}
{"train_info/time_between_train_steps": 13.213730573654175, "step": 684}
{"info/global_step": 685, "train_info/time_within_train_step": 24.833669662475586, "step": 685}
{"train_info/time_between_train_steps": 0.009477376937866211, "step": 685}
{"info/global_step": 686, "train_info/time_within_train_step": 25.020060300827026, "step": 686}
{"train_info/time_between_train_steps": 0.017001628875732422, "step": 686}
{"info/global_step": 687, "train_info/time_within_train_step": 24.99788498878479, "step": 687}
{"train_info/time_between_train_steps": 0.005250215530395508, "step": 687}
{"info/global_step": 688, "train_info/time_within_train_step": 25.006826400756836, "step": 688}
{"train_info/time_between_train_steps": 0.005901336669921875, "step": 688}
{"info/global_step": 689, "train_info/time_within_train_step": 24.89552330970764, "step": 689}
{"train_info/time_between_train_steps": 0.005226850509643555, "step": 689}
{"info/global_step": 690, "train_info/time_within_train_step": 24.975557804107666, "step": 690}
{"train_info/time_between_train_steps": 0.010082721710205078, "step": 690}
{"info/global_step": 691, "train_info/time_within_train_step": 24.918123960494995, "step": 691}
{"train_info/time_between_train_steps": 0.00713348388671875, "step": 691}
{"info/global_step": 692, "train_info/time_within_train_step": 24.987672328948975, "step": 692}
{"train_info/time_between_train_steps": 0.005448341369628906, "step": 692}
{"info/global_step": 693, "train_info/time_within_train_step": 24.860209465026855, "step": 693}
{"train_info/time_between_train_steps": 0.0053157806396484375, "step": 693}
{"info/global_step": 694, "train_info/time_within_train_step": 24.996159315109253, "step": 694}
{"train_info/time_between_train_steps": 0.005290031433105469, "step": 694}
{"info/global_step": 695, "train_info/time_within_train_step": 25.167099237442017, "step": 695}
{"train_info/time_between_train_steps": 0.006897926330566406, "step": 695}
{"info/global_step": 696, "train_info/time_within_train_step": 25.09348773956299, "step": 696}
{"train_info/time_between_train_steps": 0.005388021469116211, "step": 696}
{"info/global_step": 697, "train_info/time_within_train_step": 24.879976272583008, "step": 697}
{"train_info/time_between_train_steps": 0.005375862121582031, "step": 697}
{"info/global_step": 698, "train_info/time_within_train_step": 24.993125677108765, "step": 698}
{"train_info/time_between_train_steps": 0.0055620670318603516, "step": 698}
{"info/global_step": 699, "train_info/time_within_train_step": 24.81773328781128, "step": 699}
{"train_info/time_between_train_steps": 0.00548863410949707, "step": 699}
{"info/global_step": 700, "train_info/time_within_train_step": 24.914769649505615, "step": 700}
{"train_info": {"train_info/memory_allocated": 1581.5546875, "train_info/memory_max_allocated": 18057.0224609375, "train_info/memory_reserved": 19104.0, "train_info/memory_max_reserved": 19104.0, "_timestamp": 1734224668, "_runtime": 17730}, "step": 700}
{"logs": {"train/loss": 2.9074, "train/learning_rate": 0.0002777777777777778, "train/epoch": 19.01, "_timestamp": 1734224668, "_runtime": 17730}, "step": 700}
{"train_info/time_between_train_steps": 1.8723108768463135, "step": 700}
{"info/global_step": 701, "train_info/time_within_train_step": 24.934658765792847, "step": 701}
{"train_info/time_between_train_steps": 0.009102582931518555, "step": 701}
{"info/global_step": 702, "train_info/time_within_train_step": 24.978580951690674, "step": 702}
{"train_info/time_between_train_steps": 0.005318403244018555, "step": 702}
{"info/global_step": 703, "train_info/time_within_train_step": 24.89414143562317, "step": 703}
{"train_info/time_between_train_steps": 0.00977468490600586, "step": 703}
{"info/global_step": 704, "train_info/time_within_train_step": 24.829761028289795, "step": 704}
{"train_info/time_between_train_steps": 0.005237579345703125, "step": 704}
{"info/global_step": 705, "train_info/time_within_train_step": 24.910454273223877, "step": 705}
{"train_info/time_between_train_steps": 0.009891986846923828, "step": 705}
{"info/global_step": 706, "train_info/time_within_train_step": 24.81820774078369, "step": 706}
{"train_info/time_between_train_steps": 0.010145425796508789, "step": 706}
{"info/global_step": 707, "train_info/time_within_train_step": 24.83589243888855, "step": 707}
{"train_info/time_between_train_steps": 0.005500316619873047, "step": 707}
{"info/global_step": 708, "train_info/time_within_train_step": 24.835484743118286, "step": 708}
{"train_info/time_between_train_steps": 0.005316734313964844, "step": 708}
{"info/global_step": 709, "train_info/time_within_train_step": 24.915559768676758, "step": 709}
{"train_info/time_between_train_steps": 0.005457401275634766, "step": 709}
{"info/global_step": 710, "train_info/time_within_train_step": 24.883921146392822, "step": 710}
{"train_info/time_between_train_steps": 0.005418300628662109, "step": 710}
{"info/global_step": 711, "train_info/time_within_train_step": 24.862916469573975, "step": 711}
{"train_info/time_between_train_steps": 0.006422281265258789, "step": 711}
{"info/global_step": 712, "train_info/time_within_train_step": 25.024678468704224, "step": 712}
{"train_info/time_between_train_steps": 0.005514621734619141, "step": 712}
{"info/global_step": 713, "train_info/time_within_train_step": 24.834012269973755, "step": 713}
{"train_info/time_between_train_steps": 0.00978994369506836, "step": 713}
{"info/global_step": 714, "train_info/time_within_train_step": 24.892040014266968, "step": 714}
{"train_info/time_between_train_steps": 0.0052645206451416016, "step": 714}
{"info/global_step": 715, "train_info/time_within_train_step": 24.94103693962097, "step": 715}
{"train_info/time_between_train_steps": 0.010216951370239258, "step": 715}
{"info/global_step": 716, "train_info/time_within_train_step": 24.87632179260254, "step": 716}
{"train_info/time_between_train_steps": 0.005769014358520508, "step": 716}
{"info/global_step": 717, "train_info/time_within_train_step": 24.84022855758667, "step": 717}
{"train_info/time_between_train_steps": 0.0069942474365234375, "step": 717}
{"info/global_step": 718, "train_info/time_within_train_step": 24.854680061340332, "step": 718}
{"train_info/time_between_train_steps": 0.005423307418823242, "step": 718}
{"info/global_step": 719, "train_info/time_within_train_step": 24.978630542755127, "step": 719}
{"train_info/time_between_train_steps": 0.010376453399658203, "step": 719}
{"info/global_step": 720, "train_info/time_within_train_step": 25.027259588241577, "step": 720}
{"train_info/time_between_train_steps": 0.0061779022216796875, "step": 720}
{"train_info/time_between_train_steps": 14.318996906280518, "step": 720}
{"info/global_step": 721, "train_info/time_within_train_step": 24.860551834106445, "step": 721}
{"train_info/time_between_train_steps": 0.0069179534912109375, "step": 721}
{"info/global_step": 722, "train_info/time_within_train_step": 25.0494167804718, "step": 722}
{"train_info/time_between_train_steps": 0.006067514419555664, "step": 722}
{"info/global_step": 723, "train_info/time_within_train_step": 24.909573554992676, "step": 723}
{"train_info/time_between_train_steps": 0.006150960922241211, "step": 723}
{"info/global_step": 724, "train_info/time_within_train_step": 25.072714805603027, "step": 724}
{"train_info/time_between_train_steps": 0.007315874099731445, "step": 724}
{"info/global_step": 725, "train_info/time_within_train_step": 24.87135148048401, "step": 725}
{"train_info/time_between_train_steps": 0.016256093978881836, "step": 725}
{"info/global_step": 726, "train_info/time_within_train_step": 24.97177267074585, "step": 726}
{"train_info/time_between_train_steps": 0.005317211151123047, "step": 726}
{"info/global_step": 727, "train_info/time_within_train_step": 25.048938512802124, "step": 727}
{"train_info/time_between_train_steps": 0.011124610900878906, "step": 727}
{"info/global_step": 728, "train_info/time_within_train_step": 24.991302251815796, "step": 728}
{"train_info/time_between_train_steps": 0.0052835941314697266, "step": 728}
{"info/global_step": 729, "train_info/time_within_train_step": 24.917952299118042, "step": 729}
{"train_info/time_between_train_steps": 0.005673646926879883, "step": 729}
{"info/global_step": 730, "train_info/time_within_train_step": 24.995283365249634, "step": 730}
{"train_info/time_between_train_steps": 0.005724430084228516, "step": 730}
{"info/global_step": 731, "train_info/time_within_train_step": 24.847764253616333, "step": 731}
{"train_info/time_between_train_steps": 0.005755901336669922, "step": 731}
{"info/global_step": 732, "train_info/time_within_train_step": 25.021394968032837, "step": 732}
{"train_info/time_between_train_steps": 0.006264209747314453, "step": 732}
{"info/global_step": 733, "train_info/time_within_train_step": 24.954590559005737, "step": 733}
{"train_info/time_between_train_steps": 0.005502223968505859, "step": 733}
{"info/global_step": 734, "train_info/time_within_train_step": 25.052980661392212, "step": 734}
{"train_info/time_between_train_steps": 0.005884647369384766, "step": 734}
{"info/global_step": 735, "train_info/time_within_train_step": 24.820966720581055, "step": 735}
{"train_info/time_between_train_steps": 0.005392789840698242, "step": 735}
{"info/global_step": 736, "train_info/time_within_train_step": 24.93418860435486, "step": 736}
{"train_info/time_between_train_steps": 0.005590200424194336, "step": 736}
{"info/global_step": 737, "train_info/time_within_train_step": 24.86923837661743, "step": 737}
{"train_info/time_between_train_steps": 0.008344650268554688, "step": 737}
{"info/global_step": 738, "train_info/time_within_train_step": 25.024264574050903, "step": 738}
{"train_info/time_between_train_steps": 0.005230426788330078, "step": 738}
{"info/global_step": 739, "train_info/time_within_train_step": 24.85434365272522, "step": 739}
{"train_info/time_between_train_steps": 0.005446195602416992, "step": 739}
{"info/global_step": 740, "train_info/time_within_train_step": 24.871586561203003, "step": 740}
{"train_info/time_between_train_steps": 0.009942293167114258, "step": 740}
{"info/global_step": 741, "train_info/time_within_train_step": 24.898678064346313, "step": 741}
{"train_info/time_between_train_steps": 0.00541377067565918, "step": 741}
{"info/global_step": 742, "train_info/time_within_train_step": 24.96035623550415, "step": 742}
{"train_info/time_between_train_steps": 0.005314350128173828, "step": 742}
{"info/global_step": 743, "train_info/time_within_train_step": 24.928645372390747, "step": 743}
{"train_info/time_between_train_steps": 0.005699634552001953, "step": 743}
{"info/global_step": 744, "train_info/time_within_train_step": 24.883456707000732, "step": 744}
{"train_info/time_between_train_steps": 0.010917901992797852, "step": 744}
{"info/global_step": 745, "train_info/time_within_train_step": 24.867234468460083, "step": 745}
{"train_info/time_between_train_steps": 0.009961843490600586, "step": 745}
{"info/global_step": 746, "train_info/time_within_train_step": 24.818235158920288, "step": 746}
{"train_info/time_between_train_steps": 0.005389690399169922, "step": 746}
{"info/global_step": 747, "train_info/time_within_train_step": 24.85788130760193, "step": 747}
{"train_info/time_between_train_steps": 0.006463289260864258, "step": 747}
{"info/global_step": 748, "train_info/time_within_train_step": 24.848506927490234, "step": 748}
{"train_info/time_between_train_steps": 0.00565028190612793, "step": 748}
{"info/global_step": 749, "train_info/time_within_train_step": 24.821555376052856, "step": 749}
{"train_info/time_between_train_steps": 0.005579233169555664, "step": 749}
{"info/global_step": 750, "train_info/time_within_train_step": 24.95274806022644, "step": 750}
{"train_info": {"train_info/memory_allocated": 1581.5546875, "train_info/memory_max_allocated": 18057.0224609375, "train_info/memory_reserved": 19104.0, "train_info/memory_max_reserved": 19104.0, "_timestamp": 1734225931, "_runtime": 18993}, "step": 750}
{"logs": {"train/loss": 2.8558, "train/learning_rate": 0.00025, "train/epoch": 20.02, "_timestamp": 1734225931, "_runtime": 18993}, "step": 750}
{"train_info/time_between_train_steps": 0.007195234298706055, "step": 750}
{"info/global_step": 751, "train_info/time_within_train_step": 24.91141629219055, "step": 751}
{"train_info/time_between_train_steps": 0.005352020263671875, "step": 751}
{"info/global_step": 752, "train_info/time_within_train_step": 24.893556594848633, "step": 752}
{"train_info/time_between_train_steps": 0.006603240966796875, "step": 752}
{"info/global_step": 753, "train_info/time_within_train_step": 24.85122561454773, "step": 753}
{"train_info/time_between_train_steps": 0.005667448043823242, "step": 753}
{"info/global_step": 754, "train_info/time_within_train_step": 24.920214653015137, "step": 754}
{"train_info/time_between_train_steps": 0.0060274600982666016, "step": 754}
{"info/global_step": 755, "train_info/time_within_train_step": 24.869670867919922, "step": 755}
{"train_info/time_between_train_steps": 0.006330251693725586, "step": 755}
{"info/global_step": 756, "train_info/time_within_train_step": 24.884581327438354, "step": 756}
{"train_info/time_between_train_steps": 0.011255264282226562, "step": 756}
{"train_info/time_between_train_steps": 12.892217874526978, "step": 756}
{"info/global_step": 757, "train_info/time_within_train_step": 24.867026805877686, "step": 757}
{"train_info/time_between_train_steps": 0.005803346633911133, "step": 757}
{"info/global_step": 758, "train_info/time_within_train_step": 25.264230489730835, "step": 758}
{"train_info/time_between_train_steps": 0.005461692810058594, "step": 758}
{"info/global_step": 759, "train_info/time_within_train_step": 24.922152519226074, "step": 759}
{"train_info/time_between_train_steps": 0.010756492614746094, "step": 759}
{"info/global_step": 760, "train_info/time_within_train_step": 25.13169813156128, "step": 760}
{"train_info/time_between_train_steps": 0.005583047866821289, "step": 760}
{"info/global_step": 761, "train_info/time_within_train_step": 24.82957887649536, "step": 761}
{"train_info/time_between_train_steps": 0.009486198425292969, "step": 761}
{"info/global_step": 762, "train_info/time_within_train_step": 25.115577459335327, "step": 762}
{"train_info/time_between_train_steps": 0.005899906158447266, "step": 762}
{"info/global_step": 763, "train_info/time_within_train_step": 24.915167093276978, "step": 763}
{"train_info/time_between_train_steps": 0.009476900100708008, "step": 763}
{"info/global_step": 764, "train_info/time_within_train_step": 24.996310710906982, "step": 764}
{"train_info/time_between_train_steps": 0.005247592926025391, "step": 764}
{"info/global_step": 765, "train_info/time_within_train_step": 24.989982843399048, "step": 765}
{"train_info/time_between_train_steps": 0.009712457656860352, "step": 765}
{"info/global_step": 766, "train_info/time_within_train_step": 24.9927077293396, "step": 766}
{"train_info/time_between_train_steps": 0.005370616912841797, "step": 766}
{"info/global_step": 767, "train_info/time_within_train_step": 24.915322065353394, "step": 767}
{"train_info/time_between_train_steps": 0.005753755569458008, "step": 767}
{"info/global_step": 768, "train_info/time_within_train_step": 24.95649814605713, "step": 768}
{"train_info/time_between_train_steps": 0.0055353641510009766, "step": 768}
{"info/global_step": 769, "train_info/time_within_train_step": 24.837328910827637, "step": 769}
{"train_info/time_between_train_steps": 0.005418539047241211, "step": 769}
{"info/global_step": 770, "train_info/time_within_train_step": 24.99283766746521, "step": 770}
{"train_info/time_between_train_steps": 0.005231380462646484, "step": 770}
{"info/global_step": 771, "train_info/time_within_train_step": 24.988779544830322, "step": 771}
{"train_info/time_between_train_steps": 0.006766080856323242, "step": 771}
{"info/global_step": 772, "train_info/time_within_train_step": 24.987138271331787, "step": 772}
{"train_info/time_between_train_steps": 0.00543665885925293, "step": 772}
{"info/global_step": 773, "train_info/time_within_train_step": 24.85032892227173, "step": 773}
{"train_info/time_between_train_steps": 0.009919881820678711, "step": 773}
{"info/global_step": 774, "train_info/time_within_train_step": 24.950448751449585, "step": 774}
{"train_info/time_between_train_steps": 0.009725093841552734, "step": 774}
{"info/global_step": 775, "train_info/time_within_train_step": 24.80346965789795, "step": 775}
{"train_info/time_between_train_steps": 0.005118370056152344, "step": 775}
{"info/global_step": 776, "train_info/time_within_train_step": 24.805495500564575, "step": 776}
{"train_info/time_between_train_steps": 0.009846210479736328, "step": 776}
{"info/global_step": 777, "train_info/time_within_train_step": 24.825583696365356, "step": 777}
{"train_info/time_between_train_steps": 0.009711742401123047, "step": 777}
{"info/global_step": 778, "train_info/time_within_train_step": 24.830135345458984, "step": 778}
{"train_info/time_between_train_steps": 0.009929895401000977, "step": 778}
{"info/global_step": 779, "train_info/time_within_train_step": 24.837259769439697, "step": 779}
{"train_info/time_between_train_steps": 0.005408525466918945, "step": 779}
{"info/global_step": 780, "train_info/time_within_train_step": 24.858203172683716, "step": 780}
{"train_info/time_between_train_steps": 0.005500078201293945, "step": 780}
{"info/global_step": 781, "train_info/time_within_train_step": 24.86197829246521, "step": 781}
{"train_info/time_between_train_steps": 0.005242824554443359, "step": 781}
{"info/global_step": 782, "train_info/time_within_train_step": 24.835482597351074, "step": 782}
{"train_info/time_between_train_steps": 0.005391836166381836, "step": 782}
{"info/global_step": 783, "train_info/time_within_train_step": 24.819520950317383, "step": 783}
{"train_info/time_between_train_steps": 0.006692171096801758, "step": 783}
{"info/global_step": 784, "train_info/time_within_train_step": 24.91721200942993, "step": 784}
{"train_info/time_between_train_steps": 0.005259513854980469, "step": 784}
{"info/global_step": 785, "train_info/time_within_train_step": 24.857242107391357, "step": 785}
{"train_info/time_between_train_steps": 0.010138511657714844, "step": 785}
{"info/global_step": 786, "train_info/time_within_train_step": 24.931999921798706, "step": 786}
{"train_info/time_between_train_steps": 0.005362033843994141, "step": 786}
{"info/global_step": 787, "train_info/time_within_train_step": 24.824763774871826, "step": 787}
{"train_info/time_between_train_steps": 0.0051708221435546875, "step": 787}
{"info/global_step": 788, "train_info/time_within_train_step": 24.839720726013184, "step": 788}
{"train_info/time_between_train_steps": 0.005186319351196289, "step": 788}
{"info/global_step": 789, "train_info/time_within_train_step": 24.94595742225647, "step": 789}
{"train_info/time_between_train_steps": 0.006505727767944336, "step": 789}
{"info/global_step": 790, "train_info/time_within_train_step": 24.943979740142822, "step": 790}
{"train_info/time_between_train_steps": 0.005391836166381836, "step": 790}
{"info/global_step": 791, "train_info/time_within_train_step": 24.859233140945435, "step": 791}
{"train_info/time_between_train_steps": 0.005683183670043945, "step": 791}
{"info/global_step": 792, "train_info/time_within_train_step": 24.901174545288086, "step": 792}
{"train_info/time_between_train_steps": 0.005852222442626953, "step": 792}
{"train_info/time_between_train_steps": 13.127850770950317, "step": 792}
{"info/global_step": 793, "train_info/time_within_train_step": 24.956989765167236, "step": 793}
{"train_info/time_between_train_steps": 0.00626683235168457, "step": 793}
{"info/global_step": 794, "train_info/time_within_train_step": 24.98543620109558, "step": 794}
{"train_info/time_between_train_steps": 0.005439043045043945, "step": 794}
{"info/global_step": 795, "train_info/time_within_train_step": 24.930163383483887, "step": 795}
{"train_info/time_between_train_steps": 0.00913381576538086, "step": 795}
{"info/global_step": 796, "train_info/time_within_train_step": 25.049944639205933, "step": 796}
{"train_info/time_between_train_steps": 0.0053997039794921875, "step": 796}
{"info/global_step": 797, "train_info/time_within_train_step": 24.957502126693726, "step": 797}
{"train_info/time_between_train_steps": 0.011751413345336914, "step": 797}
{"info/global_step": 798, "train_info/time_within_train_step": 25.127673864364624, "step": 798}
{"train_info/time_between_train_steps": 0.01179814338684082, "step": 798}
{"info/global_step": 799, "train_info/time_within_train_step": 24.839606761932373, "step": 799}
{"train_info/time_between_train_steps": 0.005309581756591797, "step": 799}
{"info/global_step": 800, "train_info/time_within_train_step": 24.999761819839478, "step": 800}
{"train_info": {"train_info/memory_allocated": 1581.5546875, "train_info/memory_max_allocated": 18057.0224609375, "train_info/memory_reserved": 19104.0, "train_info/memory_max_reserved": 19104.0, "_timestamp": 1734227203, "_runtime": 20265}, "step": 800}
{"logs": {"train/loss": 2.8322, "train/learning_rate": 0.00022222222222222218, "train/epoch": 22.01, "_timestamp": 1734227203, "_runtime": 20265}, "step": 800}
{"train_info/time_between_train_steps": 1.929295539855957, "step": 800}
{"info/global_step": 801, "train_info/time_within_train_step": 24.835052728652954, "step": 801}
{"train_info/time_between_train_steps": 0.010434389114379883, "step": 801}
{"info/global_step": 802, "train_info/time_within_train_step": 25.009047269821167, "step": 802}
{"train_info/time_between_train_steps": 0.0051729679107666016, "step": 802}
{"info/global_step": 803, "train_info/time_within_train_step": 24.87336277961731, "step": 803}
{"train_info/time_between_train_steps": 0.005358219146728516, "step": 803}
{"info/global_step": 804, "train_info/time_within_train_step": 25.1014621257782, "step": 804}
{"train_info/time_between_train_steps": 0.005402803421020508, "step": 804}
{"info/global_step": 805, "train_info/time_within_train_step": 24.818095207214355, "step": 805}
{"train_info/time_between_train_steps": 0.005447864532470703, "step": 805}
{"info/global_step": 806, "train_info/time_within_train_step": 24.999789237976074, "step": 806}
{"train_info/time_between_train_steps": 0.009388923645019531, "step": 806}
{"info/global_step": 807, "train_info/time_within_train_step": 24.866825342178345, "step": 807}
{"train_info/time_between_train_steps": 0.010361671447753906, "step": 807}
{"info/global_step": 808, "train_info/time_within_train_step": 24.9831600189209, "step": 808}
{"train_info/time_between_train_steps": 0.009631872177124023, "step": 808}
{"info/global_step": 809, "train_info/time_within_train_step": 24.862526178359985, "step": 809}
{"train_info/time_between_train_steps": 0.01030731201171875, "step": 809}
{"info/global_step": 810, "train_info/time_within_train_step": 24.826462030410767, "step": 810}
{"train_info/time_between_train_steps": 0.004926443099975586, "step": 810}
{"info/global_step": 811, "train_info/time_within_train_step": 24.81890058517456, "step": 811}
{"train_info/time_between_train_steps": 0.004940509796142578, "step": 811}
{"info/global_step": 812, "train_info/time_within_train_step": 24.833422660827637, "step": 812}
{"train_info/time_between_train_steps": 0.005053997039794922, "step": 812}
{"info/global_step": 813, "train_info/time_within_train_step": 24.816401481628418, "step": 813}
{"train_info/time_between_train_steps": 0.005056142807006836, "step": 813}
{"info/global_step": 814, "train_info/time_within_train_step": 24.867125511169434, "step": 814}
{"train_info/time_between_train_steps": 0.005127429962158203, "step": 814}
{"info/global_step": 815, "train_info/time_within_train_step": 24.843831777572632, "step": 815}
{"train_info/time_between_train_steps": 0.005216836929321289, "step": 815}
{"info/global_step": 816, "train_info/time_within_train_step": 24.837802410125732, "step": 816}
{"train_info/time_between_train_steps": 0.005404472351074219, "step": 816}
{"info/global_step": 817, "train_info/time_within_train_step": 24.908573150634766, "step": 817}
{"train_info/time_between_train_steps": 0.005179405212402344, "step": 817}
{"info/global_step": 818, "train_info/time_within_train_step": 24.81600785255432, "step": 818}
{"train_info/time_between_train_steps": 0.005140781402587891, "step": 818}
{"info/global_step": 819, "train_info/time_within_train_step": 24.8798246383667, "step": 819}
{"train_info/time_between_train_steps": 0.008253812789916992, "step": 819}
{"info/global_step": 820, "train_info/time_within_train_step": 24.964329957962036, "step": 820}
{"train_info/time_between_train_steps": 0.007184743881225586, "step": 820}
{"info/global_step": 821, "train_info/time_within_train_step": 24.837276935577393, "step": 821}
{"train_info/time_between_train_steps": 0.010034561157226562, "step": 821}
{"info/global_step": 822, "train_info/time_within_train_step": 24.967714309692383, "step": 822}
{"train_info/time_between_train_steps": 0.005385875701904297, "step": 822}
{"info/global_step": 823, "train_info/time_within_train_step": 24.844910383224487, "step": 823}
{"train_info/time_between_train_steps": 0.005286455154418945, "step": 823}
{"info/global_step": 824, "train_info/time_within_train_step": 24.932342290878296, "step": 824}
{"train_info/time_between_train_steps": 0.005293607711791992, "step": 824}
{"info/global_step": 825, "train_info/time_within_train_step": 24.816417932510376, "step": 825}
{"train_info/time_between_train_steps": 0.005524158477783203, "step": 825}
{"info/global_step": 826, "train_info/time_within_train_step": 24.889130353927612, "step": 826}
{"train_info/time_between_train_steps": 0.005335092544555664, "step": 826}
{"info/global_step": 827, "train_info/time_within_train_step": 24.92388916015625, "step": 827}
{"train_info/time_between_train_steps": 0.010826826095581055, "step": 827}
{"info/global_step": 828, "train_info/time_within_train_step": 24.867936372756958, "step": 828}
{"train_info/time_between_train_steps": 0.0065762996673583984, "step": 828}
{"train_info/time_between_train_steps": 13.282467603683472, "step": 828}
{"info/global_step": 829, "train_info/time_within_train_step": 24.81164026260376, "step": 829}
{"train_info/time_between_train_steps": 0.0054209232330322266, "step": 829}
{"info/global_step": 830, "train_info/time_within_train_step": 24.95504331588745, "step": 830}
{"train_info/time_between_train_steps": 0.005316257476806641, "step": 830}
{"info/global_step": 831, "train_info/time_within_train_step": 24.827765464782715, "step": 831}
{"train_info/time_between_train_steps": 0.005545616149902344, "step": 831}
{"info/global_step": 832, "train_info/time_within_train_step": 24.964035511016846, "step": 832}
{"train_info/time_between_train_steps": 0.005448102951049805, "step": 832}
{"info/global_step": 833, "train_info/time_within_train_step": 24.82692265510559, "step": 833}
{"train_info/time_between_train_steps": 0.010919332504272461, "step": 833}
{"info/global_step": 834, "train_info/time_within_train_step": 24.92902421951294, "step": 834}
{"train_info/time_between_train_steps": 0.005125999450683594, "step": 834}
{"info/global_step": 835, "train_info/time_within_train_step": 24.912879705429077, "step": 835}
{"train_info/time_between_train_steps": 0.005739450454711914, "step": 835}
{"info/global_step": 836, "train_info/time_within_train_step": 24.99137258529663, "step": 836}
{"train_info/time_between_train_steps": 0.02035975456237793, "step": 836}
{"info/global_step": 837, "train_info/time_within_train_step": 24.81220054626465, "step": 837}
{"train_info/time_between_train_steps": 0.007132053375244141, "step": 837}
{"info/global_step": 838, "train_info/time_within_train_step": 25.008244037628174, "step": 838}
{"train_info/time_between_train_steps": 0.005504608154296875, "step": 838}
{"info/global_step": 839, "train_info/time_within_train_step": 24.79850459098816, "step": 839}
{"train_info/time_between_train_steps": 0.010474205017089844, "step": 839}
{"info/global_step": 840, "train_info/time_within_train_step": 25.016520261764526, "step": 840}
{"train_info/time_between_train_steps": 0.005894660949707031, "step": 840}
{"info/global_step": 841, "train_info/time_within_train_step": 24.891045093536377, "step": 841}
{"train_info/time_between_train_steps": 0.005484580993652344, "step": 841}
{"info/global_step": 842, "train_info/time_within_train_step": 25.01455068588257, "step": 842}
{"train_info/time_between_train_steps": 0.005327939987182617, "step": 842}
{"info/global_step": 843, "train_info/time_within_train_step": 24.840386867523193, "step": 843}
{"train_info/time_between_train_steps": 0.00524139404296875, "step": 843}
{"info/global_step": 844, "train_info/time_within_train_step": 24.897262811660767, "step": 844}
{"train_info/time_between_train_steps": 0.005623340606689453, "step": 844}
{"info/global_step": 845, "train_info/time_within_train_step": 24.97070074081421, "step": 845}
{"train_info/time_between_train_steps": 0.0052340030670166016, "step": 845}
{"info/global_step": 846, "train_info/time_within_train_step": 24.85195541381836, "step": 846}
{"train_info/time_between_train_steps": 0.00516510009765625, "step": 846}
{"info/global_step": 847, "train_info/time_within_train_step": 24.7927508354187, "step": 847}
{"train_info/time_between_train_steps": 0.005074262619018555, "step": 847}
{"info/global_step": 848, "train_info/time_within_train_step": 24.82908868789673, "step": 848}
{"train_info/time_between_train_steps": 0.005211591720581055, "step": 848}
{"info/global_step": 849, "train_info/time_within_train_step": 24.8313250541687, "step": 849}
{"train_info/time_between_train_steps": 0.009912490844726562, "step": 849}
{"info/global_step": 850, "train_info/time_within_train_step": 24.828755855560303, "step": 850}
{"train_info": {"train_info/memory_allocated": 1581.5546875, "train_info/memory_max_allocated": 18057.0224609375, "train_info/memory_reserved": 19104.0, "train_info/memory_max_reserved": 19104.0, "_timestamp": 1734228463, "_runtime": 21525}, "step": 850}
{"logs": {"train/loss": 2.7684, "train/learning_rate": 0.00019444444444444443, "train/epoch": 23.02, "_timestamp": 1734228463, "_runtime": 21525}, "step": 850}
{"train_info/time_between_train_steps": 0.0069463253021240234, "step": 850}
{"info/global_step": 851, "train_info/time_within_train_step": 24.895885944366455, "step": 851}
{"train_info/time_between_train_steps": 0.007528543472290039, "step": 851}
{"info/global_step": 852, "train_info/time_within_train_step": 24.802377223968506, "step": 852}
{"train_info/time_between_train_steps": 0.005118370056152344, "step": 852}
{"info/global_step": 853, "train_info/time_within_train_step": 24.8768949508667, "step": 853}
{"train_info/time_between_train_steps": 0.008997201919555664, "step": 853}
{"info/global_step": 854, "train_info/time_within_train_step": 24.97196912765503, "step": 854}
{"train_info/time_between_train_steps": 0.011767864227294922, "step": 854}
{"info/global_step": 855, "train_info/time_within_train_step": 24.81713557243347, "step": 855}
{"train_info/time_between_train_steps": 0.005259513854980469, "step": 855}
{"info/global_step": 856, "train_info/time_within_train_step": 24.848630905151367, "step": 856}
{"train_info/time_between_train_steps": 0.005171537399291992, "step": 856}
{"info/global_step": 857, "train_info/time_within_train_step": 24.79180598258972, "step": 857}
{"train_info/time_between_train_steps": 0.005347728729248047, "step": 857}
{"info/global_step": 858, "train_info/time_within_train_step": 25.02887988090515, "step": 858}
{"train_info/time_between_train_steps": 0.0053784847259521484, "step": 858}
{"info/global_step": 859, "train_info/time_within_train_step": 24.824865579605103, "step": 859}
{"train_info/time_between_train_steps": 0.006031036376953125, "step": 859}
{"info/global_step": 860, "train_info/time_within_train_step": 24.89435076713562, "step": 860}
{"train_info/time_between_train_steps": 0.0053827762603759766, "step": 860}
{"info/global_step": 861, "train_info/time_within_train_step": 24.820162534713745, "step": 861}
{"train_info/time_between_train_steps": 0.00549769401550293, "step": 861}
{"info/global_step": 862, "train_info/time_within_train_step": 24.815762519836426, "step": 862}
{"train_info/time_between_train_steps": 0.006927490234375, "step": 862}
{"info/global_step": 863, "train_info/time_within_train_step": 24.816720485687256, "step": 863}
{"train_info/time_between_train_steps": 0.005797624588012695, "step": 863}
{"info/global_step": 864, "train_info/time_within_train_step": 24.827021837234497, "step": 864}
{"train_info/time_between_train_steps": 0.00687718391418457, "step": 864}
{"train_info/time_between_train_steps": 13.026398420333862, "step": 864}
{"info/global_step": 865, "train_info/time_within_train_step": 24.818477153778076, "step": 865}
{"train_info/time_between_train_steps": 0.009981393814086914, "step": 865}
{"info/global_step": 866, "train_info/time_within_train_step": 25.07369637489319, "step": 866}
{"train_info/time_between_train_steps": 0.00707554817199707, "step": 866}
{"info/global_step": 867, "train_info/time_within_train_step": 24.906333208084106, "step": 867}
{"train_info/time_between_train_steps": 0.005985260009765625, "step": 867}
{"info/global_step": 868, "train_info/time_within_train_step": 25.086865663528442, "step": 868}
{"train_info/time_between_train_steps": 0.005445003509521484, "step": 868}
{"info/global_step": 869, "train_info/time_within_train_step": 24.8547101020813, "step": 869}
{"train_info/time_between_train_steps": 0.00577235221862793, "step": 869}
{"info/global_step": 870, "train_info/time_within_train_step": 25.069451332092285, "step": 870}
{"train_info/time_between_train_steps": 0.01019287109375, "step": 870}
{"info/global_step": 871, "train_info/time_within_train_step": 24.83804726600647, "step": 871}
{"train_info/time_between_train_steps": 0.005678892135620117, "step": 871}
{"info/global_step": 872, "train_info/time_within_train_step": 24.958513021469116, "step": 872}
{"train_info/time_between_train_steps": 0.010160684585571289, "step": 872}
{"info/global_step": 873, "train_info/time_within_train_step": 24.856936931610107, "step": 873}
{"train_info/time_between_train_steps": 0.005240917205810547, "step": 873}
{"info/global_step": 874, "train_info/time_within_train_step": 25.026860237121582, "step": 874}
{"train_info/time_between_train_steps": 0.01028752326965332, "step": 874}
{"info/global_step": 875, "train_info/time_within_train_step": 24.82977819442749, "step": 875}
{"train_info/time_between_train_steps": 0.005598306655883789, "step": 875}
{"info/global_step": 876, "train_info/time_within_train_step": 25.04047393798828, "step": 876}
{"train_info/time_between_train_steps": 0.005352497100830078, "step": 876}
{"info/global_step": 877, "train_info/time_within_train_step": 24.879592895507812, "step": 877}
{"train_info/time_between_train_steps": 0.007230997085571289, "step": 877}
{"info/global_step": 878, "train_info/time_within_train_step": 25.022327423095703, "step": 878}
{"train_info/time_between_train_steps": 0.0062448978424072266, "step": 878}
{"info/global_step": 879, "train_info/time_within_train_step": 24.87887930870056, "step": 879}
{"train_info/time_between_train_steps": 0.0058689117431640625, "step": 879}
{"info/global_step": 880, "train_info/time_within_train_step": 24.963780403137207, "step": 880}
{"train_info/time_between_train_steps": 0.0059528350830078125, "step": 880}
{"info/global_step": 881, "train_info/time_within_train_step": 24.922878980636597, "step": 881}
{"train_info/time_between_train_steps": 0.005017280578613281, "step": 881}
{"info/global_step": 882, "train_info/time_within_train_step": 24.92434334754944, "step": 882}
{"train_info/time_between_train_steps": 0.005820035934448242, "step": 882}
{"info/global_step": 883, "train_info/time_within_train_step": 24.887449979782104, "step": 883}
{"train_info/time_between_train_steps": 0.005379438400268555, "step": 883}
{"info/global_step": 884, "train_info/time_within_train_step": 24.80946135520935, "step": 884}
{"train_info/time_between_train_steps": 0.005159616470336914, "step": 884}
{"info/global_step": 885, "train_info/time_within_train_step": 24.83112645149231, "step": 885}
{"train_info/time_between_train_steps": 0.00532078742980957, "step": 885}
{"info/global_step": 886, "train_info/time_within_train_step": 24.81863498687744, "step": 886}
{"train_info/time_between_train_steps": 0.005416393280029297, "step": 886}
{"info/global_step": 887, "train_info/time_within_train_step": 24.816309213638306, "step": 887}
{"train_info/time_between_train_steps": 0.00538182258605957, "step": 887}
{"info/global_step": 888, "train_info/time_within_train_step": 24.91209578514099, "step": 888}
{"train_info/time_between_train_steps": 0.005989789962768555, "step": 888}
{"info/global_step": 889, "train_info/time_within_train_step": 24.919208526611328, "step": 889}
{"train_info/time_between_train_steps": 0.0057413578033447266, "step": 889}
{"info/global_step": 890, "train_info/time_within_train_step": 24.843008041381836, "step": 890}
{"train_info/time_between_train_steps": 0.0061838626861572266, "step": 890}
{"info/global_step": 891, "train_info/time_within_train_step": 24.909939765930176, "step": 891}
{"train_info/time_between_train_steps": 0.005634307861328125, "step": 891}
{"info/global_step": 892, "train_info/time_within_train_step": 25.007795810699463, "step": 892}
{"train_info/time_between_train_steps": 0.006165504455566406, "step": 892}
{"info/global_step": 893, "train_info/time_within_train_step": 24.928173303604126, "step": 893}
{"train_info/time_between_train_steps": 0.00582122802734375, "step": 893}
{"info/global_step": 894, "train_info/time_within_train_step": 24.85231900215149, "step": 894}
{"train_info/time_between_train_steps": 0.005541086196899414, "step": 894}
{"info/global_step": 895, "train_info/time_within_train_step": 24.829843282699585, "step": 895}
{"train_info/time_between_train_steps": 0.006539106369018555, "step": 895}
{"info/global_step": 896, "train_info/time_within_train_step": 24.866857290267944, "step": 896}
{"train_info/time_between_train_steps": 0.006003618240356445, "step": 896}
{"info/global_step": 897, "train_info/time_within_train_step": 25.18749737739563, "step": 897}
{"train_info/time_between_train_steps": 0.01641249656677246, "step": 897}
{"info/global_step": 898, "train_info/time_within_train_step": 24.913522243499756, "step": 898}
{"train_info/time_between_train_steps": 0.00582432746887207, "step": 898}
{"info/global_step": 899, "train_info/time_within_train_step": 25.037867307662964, "step": 899}
{"train_info/time_between_train_steps": 0.00680232048034668, "step": 899}
{"info/global_step": 900, "train_info/time_within_train_step": 24.924374103546143, "step": 900}
{"train_info": {"train_info/memory_allocated": 1581.5546875, "train_info/memory_max_allocated": 18057.0224609375, "train_info/memory_reserved": 19104.0, "train_info/memory_max_reserved": 19104.0, "_timestamp": 1734229722, "_runtime": 22784}, "step": 900}
{"logs": {"train/loss": 2.7306, "train/learning_rate": 0.00016666666666666666, "train/epoch": 24.03, "_timestamp": 1734229722, "_runtime": 22784}, "step": 900}
{"train_info/time_between_train_steps": 2.3906936645507812, "step": 900}
{"train_info/time_between_train_steps": 15.878149509429932, "step": 900}
{"info/global_step": 901, "train_info/time_within_train_step": 24.84505295753479, "step": 901}
{"train_info/time_between_train_steps": 0.0061931610107421875, "step": 901}
{"info/global_step": 902, "train_info/time_within_train_step": 25.046781301498413, "step": 902}
{"train_info/time_between_train_steps": 0.006254673004150391, "step": 902}
{"info/global_step": 903, "train_info/time_within_train_step": 24.87582302093506, "step": 903}
{"train_info/time_between_train_steps": 0.0056040287017822266, "step": 903}
{"info/global_step": 904, "train_info/time_within_train_step": 25.015215396881104, "step": 904}
{"train_info/time_between_train_steps": 0.00583958625793457, "step": 904}
{"info/global_step": 905, "train_info/time_within_train_step": 24.84567880630493, "step": 905}
{"train_info/time_between_train_steps": 0.005495309829711914, "step": 905}
{"info/global_step": 906, "train_info/time_within_train_step": 25.02852487564087, "step": 906}
{"train_info/time_between_train_steps": 0.005826473236083984, "step": 906}
{"info/global_step": 907, "train_info/time_within_train_step": 24.95069193840027, "step": 907}
{"train_info/time_between_train_steps": 0.010240793228149414, "step": 907}
{"info/global_step": 908, "train_info/time_within_train_step": 25.048007011413574, "step": 908}
{"train_info/time_between_train_steps": 0.010198593139648438, "step": 908}
{"info/global_step": 909, "train_info/time_within_train_step": 24.900066137313843, "step": 909}
{"train_info/time_between_train_steps": 0.005696535110473633, "step": 909}
{"info/global_step": 910, "train_info/time_within_train_step": 25.191584587097168, "step": 910}
{"train_info/time_between_train_steps": 0.005810260772705078, "step": 910}
{"info/global_step": 911, "train_info/time_within_train_step": 25.02729606628418, "step": 911}
{"train_info/time_between_train_steps": 0.0062444210052490234, "step": 911}
{"info/global_step": 912, "train_info/time_within_train_step": 25.087554454803467, "step": 912}
{"train_info/time_between_train_steps": 0.005834102630615234, "step": 912}
{"info/global_step": 913, "train_info/time_within_train_step": 24.964200019836426, "step": 913}
{"train_info/time_between_train_steps": 0.006013393402099609, "step": 913}
{"info/global_step": 914, "train_info/time_within_train_step": 25.02462649345398, "step": 914}
{"train_info/time_between_train_steps": 0.0057790279388427734, "step": 914}
{"info/global_step": 915, "train_info/time_within_train_step": 24.81514883041382, "step": 915}
{"train_info/time_between_train_steps": 0.005944013595581055, "step": 915}
{"info/global_step": 916, "train_info/time_within_train_step": 24.99430513381958, "step": 916}
{"train_info/time_between_train_steps": 0.006527423858642578, "step": 916}
{"info/global_step": 917, "train_info/time_within_train_step": 24.9074969291687, "step": 917}
{"train_info/time_between_train_steps": 0.00530242919921875, "step": 917}
{"info/global_step": 918, "train_info/time_within_train_step": 24.98659372329712, "step": 918}
{"train_info/time_between_train_steps": 0.005318880081176758, "step": 918}
{"info/global_step": 919, "train_info/time_within_train_step": 25.120907068252563, "step": 919}
{"train_info/time_between_train_steps": 0.010413885116577148, "step": 919}
{"info/global_step": 920, "train_info/time_within_train_step": 24.89365863800049, "step": 920}
{"train_info/time_between_train_steps": 0.00559234619140625, "step": 920}
{"info/global_step": 921, "train_info/time_within_train_step": 24.80582046508789, "step": 921}
{"train_info/time_between_train_steps": 0.005490779876708984, "step": 921}
{"info/global_step": 922, "train_info/time_within_train_step": 24.870129346847534, "step": 922}
{"train_info/time_between_train_steps": 0.005389690399169922, "step": 922}
{"info/global_step": 923, "train_info/time_within_train_step": 24.827677249908447, "step": 923}
{"train_info/time_between_train_steps": 0.005467414855957031, "step": 923}
{"info/global_step": 924, "train_info/time_within_train_step": 24.89350700378418, "step": 924}
{"train_info/time_between_train_steps": 0.006434917449951172, "step": 924}
{"info/global_step": 925, "train_info/time_within_train_step": 24.900644302368164, "step": 925}
{"train_info/time_between_train_steps": 0.011518716812133789, "step": 925}
{"info/global_step": 926, "train_info/time_within_train_step": 24.933642625808716, "step": 926}
{"train_info/time_between_train_steps": 0.0056133270263671875, "step": 926}
{"info/global_step": 927, "train_info/time_within_train_step": 24.883776903152466, "step": 927}
{"train_info/time_between_train_steps": 0.005446195602416992, "step": 927}
{"info/global_step": 928, "train_info/time_within_train_step": 25.06656312942505, "step": 928}
{"train_info/time_between_train_steps": 0.00565028190612793, "step": 928}
{"info/global_step": 929, "train_info/time_within_train_step": 24.971574783325195, "step": 929}
{"train_info/time_between_train_steps": 0.005410909652709961, "step": 929}
{"info/global_step": 930, "train_info/time_within_train_step": 24.917301893234253, "step": 930}
{"train_info/time_between_train_steps": 0.005475044250488281, "step": 930}
{"info/global_step": 931, "train_info/time_within_train_step": 24.838096857070923, "step": 931}
{"train_info/time_between_train_steps": 0.005390167236328125, "step": 931}
{"info/global_step": 932, "train_info/time_within_train_step": 24.87847352027893, "step": 932}
{"train_info/time_between_train_steps": 0.005348682403564453, "step": 932}
{"info/global_step": 933, "train_info/time_within_train_step": 24.9820396900177, "step": 933}
{"train_info/time_between_train_steps": 0.006515979766845703, "step": 933}
{"info/global_step": 934, "train_info/time_within_train_step": 24.79417109489441, "step": 934}
{"train_info/time_between_train_steps": 0.006160736083984375, "step": 934}
{"info/global_step": 935, "train_info/time_within_train_step": 24.88009476661682, "step": 935}
{"train_info/time_between_train_steps": 0.005988121032714844, "step": 935}
{"info/global_step": 936, "train_info/time_within_train_step": 24.90435290336609, "step": 936}
{"train_info/time_between_train_steps": 0.006172895431518555, "step": 936}
{"train_info/time_between_train_steps": 13.377685070037842, "step": 936}
{"info/global_step": 937, "train_info/time_within_train_step": 24.870922088623047, "step": 937}
{"train_info/time_between_train_steps": 0.0049724578857421875, "step": 937}
{"info/global_step": 938, "train_info/time_within_train_step": 24.990118503570557, "step": 938}
{"train_info/time_between_train_steps": 0.005061149597167969, "step": 938}
{"info/global_step": 939, "train_info/time_within_train_step": 24.79060697555542, "step": 939}
{"train_info/time_between_train_steps": 0.005053997039794922, "step": 939}
{"info/global_step": 940, "train_info/time_within_train_step": 24.944958686828613, "step": 940}
{"train_info/time_between_train_steps": 0.005424022674560547, "step": 940}
{"info/global_step": 941, "train_info/time_within_train_step": 24.875040292739868, "step": 941}
{"train_info/time_between_train_steps": 0.01013946533203125, "step": 941}
{"info/global_step": 942, "train_info/time_within_train_step": 24.965777158737183, "step": 942}
{"train_info/time_between_train_steps": 0.010221481323242188, "step": 942}
{"info/global_step": 943, "train_info/time_within_train_step": 25.01395606994629, "step": 943}
{"train_info/time_between_train_steps": 0.0055179595947265625, "step": 943}
{"info/global_step": 944, "train_info/time_within_train_step": 24.91875982284546, "step": 944}
{"train_info/time_between_train_steps": 0.005222797393798828, "step": 944}
{"info/global_step": 945, "train_info/time_within_train_step": 24.796139001846313, "step": 945}
{"train_info/time_between_train_steps": 0.0052220821380615234, "step": 945}
{"info/global_step": 946, "train_info/time_within_train_step": 25.085413455963135, "step": 946}
{"train_info/time_between_train_steps": 0.00556635856628418, "step": 946}
{"info/global_step": 947, "train_info/time_within_train_step": 25.565890073776245, "step": 947}
{"train_info/time_between_train_steps": 0.010892629623413086, "step": 947}
{"info/global_step": 948, "train_info/time_within_train_step": 25.055221796035767, "step": 948}
{"train_info/time_between_train_steps": 0.00581049919128418, "step": 948}
{"info/global_step": 949, "train_info/time_within_train_step": 24.792773485183716, "step": 949}
{"train_info/time_between_train_steps": 0.0057430267333984375, "step": 949}
{"info/global_step": 950, "train_info/time_within_train_step": 24.97985601425171, "step": 950}
{"train_info": {"train_info/memory_allocated": 1581.5546875, "train_info/memory_max_allocated": 18057.0224609375, "train_info/memory_reserved": 19104.0, "train_info/memory_max_reserved": 19104.0, "_timestamp": 1734230999, "_runtime": 24061}, "step": 950}
{"logs": {"train/loss": 2.7179, "train/learning_rate": 0.0001388888888888889, "train/epoch": 26.01, "_timestamp": 1734230999, "_runtime": 24061}, "step": 950}
{"train_info/time_between_train_steps": 0.0078582763671875, "step": 950}
{"info/global_step": 951, "train_info/time_within_train_step": 24.893521070480347, "step": 951}
{"train_info/time_between_train_steps": 0.006894350051879883, "step": 951}
{"info/global_step": 952, "train_info/time_within_train_step": 24.898371696472168, "step": 952}
{"train_info/time_between_train_steps": 0.0054438114166259766, "step": 952}
{"info/global_step": 953, "train_info/time_within_train_step": 24.820926427841187, "step": 953}
{"train_info/time_between_train_steps": 0.00546717643737793, "step": 953}
{"info/global_step": 954, "train_info/time_within_train_step": 24.88321280479431, "step": 954}
{"train_info/time_between_train_steps": 0.0056781768798828125, "step": 954}
{"info/global_step": 955, "train_info/time_within_train_step": 24.855647563934326, "step": 955}
{"train_info/time_between_train_steps": 0.010134458541870117, "step": 955}
{"info/global_step": 956, "train_info/time_within_train_step": 24.901132822036743, "step": 956}
{"train_info/time_between_train_steps": 0.005637645721435547, "step": 956}
{"info/global_step": 957, "train_info/time_within_train_step": 24.86692476272583, "step": 957}
{"train_info/time_between_train_steps": 0.005948066711425781, "step": 957}
{"info/global_step": 958, "train_info/time_within_train_step": 24.85603141784668, "step": 958}
{"train_info/time_between_train_steps": 0.00566554069519043, "step": 958}
{"info/global_step": 959, "train_info/time_within_train_step": 24.913495302200317, "step": 959}
{"train_info/time_between_train_steps": 0.005914926528930664, "step": 959}
{"info/global_step": 960, "train_info/time_within_train_step": 24.86657166481018, "step": 960}
{"train_info/time_between_train_steps": 0.0067901611328125, "step": 960}
{"info/global_step": 961, "train_info/time_within_train_step": 24.908731937408447, "step": 961}
{"train_info/time_between_train_steps": 0.005868434906005859, "step": 961}
{"info/global_step": 962, "train_info/time_within_train_step": 24.876627445220947, "step": 962}
{"train_info/time_between_train_steps": 0.006682395935058594, "step": 962}
{"info/global_step": 963, "train_info/time_within_train_step": 24.843806982040405, "step": 963}
{"train_info/time_between_train_steps": 0.005685329437255859, "step": 963}
{"info/global_step": 964, "train_info/time_within_train_step": 24.847148180007935, "step": 964}
{"train_info/time_between_train_steps": 0.0057125091552734375, "step": 964}
{"info/global_step": 965, "train_info/time_within_train_step": 24.85105586051941, "step": 965}
{"train_info/time_between_train_steps": 0.01009225845336914, "step": 965}
{"info/global_step": 966, "train_info/time_within_train_step": 24.859808921813965, "step": 966}
{"train_info/time_between_train_steps": 0.005681276321411133, "step": 966}
{"info/global_step": 967, "train_info/time_within_train_step": 24.847561836242676, "step": 967}
{"train_info/time_between_train_steps": 0.010624170303344727, "step": 967}
{"info/global_step": 968, "train_info/time_within_train_step": 24.830575466156006, "step": 968}
{"train_info/time_between_train_steps": 0.00561213493347168, "step": 968}
{"info/global_step": 969, "train_info/time_within_train_step": 24.817611694335938, "step": 969}
{"train_info/time_between_train_steps": 0.007193088531494141, "step": 969}
{"info/global_step": 970, "train_info/time_within_train_step": 24.880847215652466, "step": 970}
{"train_info/time_between_train_steps": 0.010393619537353516, "step": 970}
{"info/global_step": 971, "train_info/time_within_train_step": 24.87374711036682, "step": 971}
{"train_info/time_between_train_steps": 0.005919933319091797, "step": 971}
{"info/global_step": 972, "train_info/time_within_train_step": 24.91787099838257, "step": 972}
{"train_info/time_between_train_steps": 0.0064961910247802734, "step": 972}
{"train_info/time_between_train_steps": 13.630686283111572, "step": 972}
{"info/global_step": 973, "train_info/time_within_train_step": 24.855340003967285, "step": 973}
{"train_info/time_between_train_steps": 0.005261898040771484, "step": 973}
{"info/global_step": 974, "train_info/time_within_train_step": 25.07389235496521, "step": 974}
{"train_info/time_between_train_steps": 0.005207538604736328, "step": 974}
{"info/global_step": 975, "train_info/time_within_train_step": 24.799115419387817, "step": 975}
{"train_info/time_between_train_steps": 0.005208253860473633, "step": 975}
{"info/global_step": 976, "train_info/time_within_train_step": 24.92853546142578, "step": 976}
{"train_info/time_between_train_steps": 0.005197048187255859, "step": 976}
{"info/global_step": 977, "train_info/time_within_train_step": 24.918912649154663, "step": 977}
{"train_info/time_between_train_steps": 0.014816045761108398, "step": 977}
{"info/global_step": 978, "train_info/time_within_train_step": 24.892608642578125, "step": 978}
{"train_info/time_between_train_steps": 0.005222797393798828, "step": 978}
{"info/global_step": 979, "train_info/time_within_train_step": 24.811286449432373, "step": 979}
{"train_info/time_between_train_steps": 0.009862422943115234, "step": 979}
{"info/global_step": 980, "train_info/time_within_train_step": 25.016618013381958, "step": 980}
{"train_info/time_between_train_steps": 0.010216236114501953, "step": 980}
{"info/global_step": 981, "train_info/time_within_train_step": 24.866021871566772, "step": 981}
{"train_info/time_between_train_steps": 0.005492687225341797, "step": 981}
{"info/global_step": 982, "train_info/time_within_train_step": 24.91320824623108, "step": 982}
{"train_info/time_between_train_steps": 0.005259275436401367, "step": 982}
{"info/global_step": 983, "train_info/time_within_train_step": 24.805384397506714, "step": 983}
{"train_info/time_between_train_steps": 0.005343198776245117, "step": 983}
{"info/global_step": 984, "train_info/time_within_train_step": 24.911157846450806, "step": 984}
{"train_info/time_between_train_steps": 0.005625724792480469, "step": 984}
{"info/global_step": 985, "train_info/time_within_train_step": 24.873642921447754, "step": 985}
{"train_info/time_between_train_steps": 0.005629539489746094, "step": 985}
{"info/global_step": 986, "train_info/time_within_train_step": 24.91504406929016, "step": 986}
{"train_info/time_between_train_steps": 0.005156040191650391, "step": 986}
{"info/global_step": 987, "train_info/time_within_train_step": 24.815245389938354, "step": 987}
{"train_info/time_between_train_steps": 0.005393028259277344, "step": 987}
{"info/global_step": 988, "train_info/time_within_train_step": 24.949061632156372, "step": 988}
{"train_info/time_between_train_steps": 0.010040521621704102, "step": 988}
{"info/global_step": 989, "train_info/time_within_train_step": 24.97230052947998, "step": 989}
{"train_info/time_between_train_steps": 0.005232095718383789, "step": 989}
{"info/global_step": 990, "train_info/time_within_train_step": 24.96164846420288, "step": 990}
{"train_info/time_between_train_steps": 0.005013227462768555, "step": 990}
{"info/global_step": 991, "train_info/time_within_train_step": 24.79354429244995, "step": 991}
{"train_info/time_between_train_steps": 0.005156040191650391, "step": 991}
{"info/global_step": 992, "train_info/time_within_train_step": 24.801170825958252, "step": 992}
{"train_info/time_between_train_steps": 0.0050907135009765625, "step": 992}
{"info/global_step": 993, "train_info/time_within_train_step": 24.792524099349976, "step": 993}
{"train_info/time_between_train_steps": 0.005475044250488281, "step": 993}
{"info/global_step": 994, "train_info/time_within_train_step": 24.825885772705078, "step": 994}
{"train_info/time_between_train_steps": 0.005475282669067383, "step": 994}
{"info/global_step": 995, "train_info/time_within_train_step": 24.84985661506653, "step": 995}
{"train_info/time_between_train_steps": 0.009958267211914062, "step": 995}
{"info/global_step": 996, "train_info/time_within_train_step": 24.809561014175415, "step": 996}
{"train_info/time_between_train_steps": 0.006421566009521484, "step": 996}
{"info/global_step": 997, "train_info/time_within_train_step": 24.838820934295654, "step": 997}
{"train_info/time_between_train_steps": 0.005614519119262695, "step": 997}
{"info/global_step": 998, "train_info/time_within_train_step": 24.834523677825928, "step": 998}
{"train_info/time_between_train_steps": 0.010039567947387695, "step": 998}
{"info/global_step": 999, "train_info/time_within_train_step": 24.797834157943726, "step": 999}
{"train_info/time_between_train_steps": 0.0052945613861083984, "step": 999}
{"info/global_step": 1000, "train_info/time_within_train_step": 24.856910467147827, "step": 1000}
{"train_info": {"train_info/memory_allocated": 1581.5546875, "train_info/memory_max_allocated": 18057.0224609375, "train_info/memory_reserved": 19104.0, "train_info/memory_max_reserved": 19104.0, "_timestamp": 1734232257, "_runtime": 25319}, "step": 1000}
{"logs": {"train/loss": 2.6628, "train/learning_rate": 0.00011111111111111109, "train/epoch": 27.02, "_timestamp": 1734232257, "_runtime": 25319}, "step": 1000}
{"train_info": {"train_info/memory_allocated": 1581.5546875, "train_info/memory_max_allocated": 18057.0224609375, "train_info/memory_reserved": 21960.0, "train_info/memory_max_reserved": 21960.0, "_timestamp": 1734232259, "_runtime": 25321}, "step": 1000}
{"logs": {"eval/loss": 3.39341402053833, "eval/runtime": 2.2648, "eval/samples_per_second": 57.843, "eval/steps_per_second": 3.974, "train/epoch": 27.02, "_timestamp": 1734232259, "_runtime": 25321}, "step": 1000}
{"train_info": {"train_info/memory_allocated": 1581.5546875, "train_info/memory_max_allocated": 18057.0224609375, "train_info/memory_reserved": 21960.0, "train_info/memory_max_reserved": 21960.0, "_timestamp": 1734232259, "_runtime": 25321}, "step": 1000}
{"logs": {"eval//local/xiulyang/mission-impossible-language-models/training/babylm_dataset.py_loss": 3.39341402053833, "eval//local/xiulyang/mission-impossible-language-models/training/babylm_dataset.py_ppl": 29.767405523913666, "eval//local/xiulyang/mission-impossible-language-models/training/babylm_dataset.py_runtime": 2.2648, "eval//local/xiulyang/mission-impossible-language-models/training/babylm_dataset.py_samples_per_second": 57.843, "train/epoch": 27.02, "_timestamp": 1734232259, "_runtime": 25321}, "step": 1000}
{"train_info/time_between_train_steps": 4.17676568031311, "step": 1000}
{"info/global_step": 1001, "train_info/time_within_train_step": 24.890364170074463, "step": 1001}
{"train_info/time_between_train_steps": 0.005227327346801758, "step": 1001}
{"info/global_step": 1002, "train_info/time_within_train_step": 24.893830060958862, "step": 1002}
{"train_info/time_between_train_steps": 0.0053288936614990234, "step": 1002}
{"info/global_step": 1003, "train_info/time_within_train_step": 24.823359966278076, "step": 1003}
{"train_info/time_between_train_steps": 0.005225181579589844, "step": 1003}
{"info/global_step": 1004, "train_info/time_within_train_step": 24.885671377182007, "step": 1004}
{"train_info/time_between_train_steps": 0.009073734283447266, "step": 1004}
{"info/global_step": 1005, "train_info/time_within_train_step": 24.905568599700928, "step": 1005}
{"train_info/time_between_train_steps": 0.006804704666137695, "step": 1005}
{"info/global_step": 1006, "train_info/time_within_train_step": 24.98363471031189, "step": 1006}
{"train_info/time_between_train_steps": 0.01053476333618164, "step": 1006}
{"info/global_step": 1007, "train_info/time_within_train_step": 24.931803464889526, "step": 1007}
{"train_info/time_between_train_steps": 0.01728224754333496, "step": 1007}
{"info/global_step": 1008, "train_info/time_within_train_step": 24.93532919883728, "step": 1008}
{"train_info/time_between_train_steps": 0.010930538177490234, "step": 1008}
{"train_info/time_between_train_steps": 13.121721982955933, "step": 1008}
{"info/global_step": 1009, "train_info/time_within_train_step": 24.830073356628418, "step": 1009}
{"train_info/time_between_train_steps": 0.005065202713012695, "step": 1009}
{"info/global_step": 1010, "train_info/time_within_train_step": 24.922114372253418, "step": 1010}
{"train_info/time_between_train_steps": 0.005308866500854492, "step": 1010}
{"info/global_step": 1011, "train_info/time_within_train_step": 24.854736328125, "step": 1011}
{"train_info/time_between_train_steps": 0.005581378936767578, "step": 1011}
{"info/global_step": 1012, "train_info/time_within_train_step": 24.980600833892822, "step": 1012}
{"train_info/time_between_train_steps": 0.005429267883300781, "step": 1012}
{"info/global_step": 1013, "train_info/time_within_train_step": 24.921558380126953, "step": 1013}
{"train_info/time_between_train_steps": 0.009743452072143555, "step": 1013}
{"info/global_step": 1014, "train_info/time_within_train_step": 24.9425790309906, "step": 1014}
{"train_info/time_between_train_steps": 0.005362272262573242, "step": 1014}
{"info/global_step": 1015, "train_info/time_within_train_step": 24.853583812713623, "step": 1015}
{"train_info/time_between_train_steps": 0.005309104919433594, "step": 1015}
{"info/global_step": 1016, "train_info/time_within_train_step": 24.915880918502808, "step": 1016}
{"train_info/time_between_train_steps": 0.005425214767456055, "step": 1016}
{"info/global_step": 1017, "train_info/time_within_train_step": 24.839359283447266, "step": 1017}
{"train_info/time_between_train_steps": 0.0055997371673583984, "step": 1017}
{"info/global_step": 1018, "train_info/time_within_train_step": 24.95697045326233, "step": 1018}
{"train_info/time_between_train_steps": 0.005574464797973633, "step": 1018}
{"info/global_step": 1019, "train_info/time_within_train_step": 24.80938196182251, "step": 1019}
{"train_info/time_between_train_steps": 0.005597114562988281, "step": 1019}
{"info/global_step": 1020, "train_info/time_within_train_step": 24.938681602478027, "step": 1020}
{"train_info/time_between_train_steps": 0.005309104919433594, "step": 1020}
{"info/global_step": 1021, "train_info/time_within_train_step": 24.999765872955322, "step": 1021}
{"train_info/time_between_train_steps": 0.006102323532104492, "step": 1021}
{"info/global_step": 1022, "train_info/time_within_train_step": 25.155680894851685, "step": 1022}
{"train_info/time_between_train_steps": 0.005639791488647461, "step": 1022}
{"info/global_step": 1023, "train_info/time_within_train_step": 25.01226544380188, "step": 1023}
{"train_info/time_between_train_steps": 0.014892339706420898, "step": 1023}
{"info/global_step": 1024, "train_info/time_within_train_step": 24.96423625946045, "step": 1024}
{"train_info/time_between_train_steps": 0.005547523498535156, "step": 1024}
{"info/global_step": 1025, "train_info/time_within_train_step": 24.955123901367188, "step": 1025}
{"train_info/time_between_train_steps": 0.00531768798828125, "step": 1025}
{"info/global_step": 1026, "train_info/time_within_train_step": 24.877098321914673, "step": 1026}
{"train_info/time_between_train_steps": 0.00966024398803711, "step": 1026}
{"info/global_step": 1027, "train_info/time_within_train_step": 24.96300721168518, "step": 1027}
{"train_info/time_between_train_steps": 0.005094051361083984, "step": 1027}
{"info/global_step": 1028, "train_info/time_within_train_step": 24.978338956832886, "step": 1028}
{"train_info/time_between_train_steps": 0.009852886199951172, "step": 1028}
{"info/global_step": 1029, "train_info/time_within_train_step": 24.968745470046997, "step": 1029}
{"train_info/time_between_train_steps": 0.009590864181518555, "step": 1029}
{"info/global_step": 1030, "train_info/time_within_train_step": 24.988138914108276, "step": 1030}
{"train_info/time_between_train_steps": 0.009441614151000977, "step": 1030}
{"info/global_step": 1031, "train_info/time_within_train_step": 24.812130212783813, "step": 1031}
{"train_info/time_between_train_steps": 0.005276918411254883, "step": 1031}
{"info/global_step": 1032, "train_info/time_within_train_step": 24.848026752471924, "step": 1032}
{"train_info/time_between_train_steps": 0.010638952255249023, "step": 1032}
{"info/global_step": 1033, "train_info/time_within_train_step": 24.89657163619995, "step": 1033}
{"train_info/time_between_train_steps": 0.009610414505004883, "step": 1033}
{"info/global_step": 1034, "train_info/time_within_train_step": 24.9261736869812, "step": 1034}
{"train_info/time_between_train_steps": 0.005410671234130859, "step": 1034}
{"info/global_step": 1035, "train_info/time_within_train_step": 24.851815700531006, "step": 1035}
{"train_info/time_between_train_steps": 0.005322694778442383, "step": 1035}
{"info/global_step": 1036, "train_info/time_within_train_step": 25.039772748947144, "step": 1036}
{"train_info/time_between_train_steps": 0.005285024642944336, "step": 1036}
{"info/global_step": 1037, "train_info/time_within_train_step": 25.039023876190186, "step": 1037}
{"train_info/time_between_train_steps": 0.005091667175292969, "step": 1037}
{"info/global_step": 1038, "train_info/time_within_train_step": 24.819072246551514, "step": 1038}
{"train_info/time_between_train_steps": 0.0053517818450927734, "step": 1038}
{"info/global_step": 1039, "train_info/time_within_train_step": 24.923700094223022, "step": 1039}
{"train_info/time_between_train_steps": 0.010476112365722656, "step": 1039}
{"info/global_step": 1040, "train_info/time_within_train_step": 24.82953906059265, "step": 1040}
{"train_info/time_between_train_steps": 0.005433320999145508, "step": 1040}
{"info/global_step": 1041, "train_info/time_within_train_step": 24.851465702056885, "step": 1041}
{"train_info/time_between_train_steps": 0.005316257476806641, "step": 1041}
{"info/global_step": 1042, "train_info/time_within_train_step": 24.924890756607056, "step": 1042}
{"train_info/time_between_train_steps": 0.00522303581237793, "step": 1042}
{"info/global_step": 1043, "train_info/time_within_train_step": 24.885847806930542, "step": 1043}
{"train_info/time_between_train_steps": 0.005778789520263672, "step": 1043}
{"info/global_step": 1044, "train_info/time_within_train_step": 24.944465160369873, "step": 1044}
{"train_info/time_between_train_steps": 0.006150722503662109, "step": 1044}
{"train_info/time_between_train_steps": 13.353372573852539, "step": 1044}
{"info/global_step": 1045, "train_info/time_within_train_step": 25.001037120819092, "step": 1045}
{"train_info/time_between_train_steps": 0.004997968673706055, "step": 1045}
{"info/global_step": 1046, "train_info/time_within_train_step": 24.99483036994934, "step": 1046}
{"train_info/time_between_train_steps": 0.006031990051269531, "step": 1046}
{"info/global_step": 1047, "train_info/time_within_train_step": 24.880653381347656, "step": 1047}
{"train_info/time_between_train_steps": 0.006638765335083008, "step": 1047}
{"info/global_step": 1048, "train_info/time_within_train_step": 25.00995683670044, "step": 1048}
{"train_info/time_between_train_steps": 0.0050885677337646484, "step": 1048}
{"info/global_step": 1049, "train_info/time_within_train_step": 24.87820863723755, "step": 1049}
{"train_info/time_between_train_steps": 0.005531787872314453, "step": 1049}
{"info/global_step": 1050, "train_info/time_within_train_step": 25.05462336540222, "step": 1050}
{"train_info": {"train_info/memory_allocated": 1581.5546875, "train_info/memory_max_allocated": 18057.0224609375, "train_info/memory_reserved": 21960.0, "train_info/memory_max_reserved": 21960.0, "_timestamp": 1734233534, "_runtime": 26596}, "step": 1050}
{"logs": {"train/loss": 2.6546, "train/learning_rate": 8.333333333333333e-05, "train/epoch": 29.0, "_timestamp": 1734233534, "_runtime": 26596}, "step": 1050}
{"train_info/time_between_train_steps": 0.008150339126586914, "step": 1050}
{"info/global_step": 1051, "train_info/time_within_train_step": 24.85918641090393, "step": 1051}
{"train_info/time_between_train_steps": 0.009413719177246094, "step": 1051}
{"info/global_step": 1052, "train_info/time_within_train_step": 25.21350407600403, "step": 1052}
{"train_info/time_between_train_steps": 0.010393619537353516, "step": 1052}
{"info/global_step": 1053, "train_info/time_within_train_step": 24.878694534301758, "step": 1053}
{"train_info/time_between_train_steps": 0.005323171615600586, "step": 1053}
{"info/global_step": 1054, "train_info/time_within_train_step": 25.172197341918945, "step": 1054}
{"train_info/time_between_train_steps": 0.0051212310791015625, "step": 1054}
{"info/global_step": 1055, "train_info/time_within_train_step": 24.86802887916565, "step": 1055}
{"train_info/time_between_train_steps": 0.005385160446166992, "step": 1055}
{"info/global_step": 1056, "train_info/time_within_train_step": 25.015278577804565, "step": 1056}
{"train_info/time_between_train_steps": 0.005324125289916992, "step": 1056}
{"info/global_step": 1057, "train_info/time_within_train_step": 25.009135246276855, "step": 1057}
{"train_info/time_between_train_steps": 0.011015653610229492, "step": 1057}
{"info/global_step": 1058, "train_info/time_within_train_step": 25.244943618774414, "step": 1058}
{"train_info/time_between_train_steps": 0.0055048465728759766, "step": 1058}
{"info/global_step": 1059, "train_info/time_within_train_step": 25.064175844192505, "step": 1059}
{"train_info/time_between_train_steps": 0.010412216186523438, "step": 1059}
{"info/global_step": 1060, "train_info/time_within_train_step": 25.20716094970703, "step": 1060}
{"train_info/time_between_train_steps": 0.007835149765014648, "step": 1060}
{"info/global_step": 1061, "train_info/time_within_train_step": 25.043896436691284, "step": 1061}
{"train_info/time_between_train_steps": 0.009973526000976562, "step": 1061}
{"info/global_step": 1062, "train_info/time_within_train_step": 24.982142686843872, "step": 1062}
{"train_info/time_between_train_steps": 0.005478858947753906, "step": 1062}
{"info/global_step": 1063, "train_info/time_within_train_step": 24.93752646446228, "step": 1063}
{"train_info/time_between_train_steps": 0.0069806575775146484, "step": 1063}
{"info/global_step": 1064, "train_info/time_within_train_step": 24.931630849838257, "step": 1064}
{"train_info/time_between_train_steps": 0.007384777069091797, "step": 1064}
{"info/global_step": 1065, "train_info/time_within_train_step": 24.895910263061523, "step": 1065}
{"train_info/time_between_train_steps": 0.010040283203125, "step": 1065}
{"info/global_step": 1066, "train_info/time_within_train_step": 24.990911960601807, "step": 1066}
{"train_info/time_between_train_steps": 0.009748697280883789, "step": 1066}
{"info/global_step": 1067, "train_info/time_within_train_step": 25.036095142364502, "step": 1067}
{"train_info/time_between_train_steps": 0.005407810211181641, "step": 1067}
{"info/global_step": 1068, "train_info/time_within_train_step": 25.056914806365967, "step": 1068}
{"train_info/time_between_train_steps": 0.008173704147338867, "step": 1068}
{"info/global_step": 1069, "train_info/time_within_train_step": 24.92108416557312, "step": 1069}
{"train_info/time_between_train_steps": 0.005720376968383789, "step": 1069}
{"info/global_step": 1070, "train_info/time_within_train_step": 25.055100917816162, "step": 1070}
{"train_info/time_between_train_steps": 0.010556936264038086, "step": 1070}
{"info/global_step": 1071, "train_info/time_within_train_step": 25.06771159172058, "step": 1071}
{"train_info/time_between_train_steps": 0.005647182464599609, "step": 1071}
{"info/global_step": 1072, "train_info/time_within_train_step": 25.03691601753235, "step": 1072}
{"train_info/time_between_train_steps": 0.01067495346069336, "step": 1072}
{"info/global_step": 1073, "train_info/time_within_train_step": 25.065762042999268, "step": 1073}
{"train_info/time_between_train_steps": 0.011735916137695312, "step": 1073}
{"info/global_step": 1074, "train_info/time_within_train_step": 25.04867935180664, "step": 1074}
{"train_info/time_between_train_steps": 0.006634712219238281, "step": 1074}
{"info/global_step": 1075, "train_info/time_within_train_step": 24.995625734329224, "step": 1075}
{"train_info/time_between_train_steps": 0.01565861701965332, "step": 1075}
{"info/global_step": 1076, "train_info/time_within_train_step": 24.93486738204956, "step": 1076}
{"train_info/time_between_train_steps": 0.0058057308197021484, "step": 1076}
{"info/global_step": 1077, "train_info/time_within_train_step": 25.024191856384277, "step": 1077}
{"train_info/time_between_train_steps": 0.006064176559448242, "step": 1077}
{"info/global_step": 1078, "train_info/time_within_train_step": 25.081807374954224, "step": 1078}
{"train_info/time_between_train_steps": 0.007053852081298828, "step": 1078}
{"info/global_step": 1079, "train_info/time_within_train_step": 24.967669010162354, "step": 1079}
{"train_info/time_between_train_steps": 0.012294769287109375, "step": 1079}
{"info/global_step": 1080, "train_info/time_within_train_step": 25.104267120361328, "step": 1080}
{"train_info/time_between_train_steps": 0.007311820983886719, "step": 1080}
{"train_info/time_between_train_steps": 14.048288822174072, "step": 1080}
{"info/global_step": 1081, "train_info/time_within_train_step": 25.057810306549072, "step": 1081}
{"train_info/time_between_train_steps": 0.006162405014038086, "step": 1081}
{"info/global_step": 1082, "train_info/time_within_train_step": 25.346698760986328, "step": 1082}
{"train_info/time_between_train_steps": 0.010921716690063477, "step": 1082}
{"info/global_step": 1083, "train_info/time_within_train_step": 25.302340269088745, "step": 1083}
{"train_info/time_between_train_steps": 0.006815433502197266, "step": 1083}
{"info/global_step": 1084, "train_info/time_within_train_step": 25.269686937332153, "step": 1084}
{"train_info/time_between_train_steps": 0.006607532501220703, "step": 1084}
{"info/global_step": 1085, "train_info/time_within_train_step": 25.12822914123535, "step": 1085}
{"train_info/time_between_train_steps": 0.016849517822265625, "step": 1085}
{"info/global_step": 1086, "train_info/time_within_train_step": 25.208937406539917, "step": 1086}
{"train_info/time_between_train_steps": 0.01130366325378418, "step": 1086}
{"info/global_step": 1087, "train_info/time_within_train_step": 25.050292253494263, "step": 1087}
{"train_info/time_between_train_steps": 0.015990018844604492, "step": 1087}
{"info/global_step": 1088, "train_info/time_within_train_step": 25.111268997192383, "step": 1088}
{"train_info/time_between_train_steps": 0.010406970977783203, "step": 1088}
{"info/global_step": 1089, "train_info/time_within_train_step": 25.027119874954224, "step": 1089}
{"train_info/time_between_train_steps": 0.006460666656494141, "step": 1089}
{"info/global_step": 1090, "train_info/time_within_train_step": 25.218413829803467, "step": 1090}
{"train_info/time_between_train_steps": 0.005415678024291992, "step": 1090}
{"info/global_step": 1091, "train_info/time_within_train_step": 24.97014570236206, "step": 1091}
{"train_info/time_between_train_steps": 0.010636329650878906, "step": 1091}
{"info/global_step": 1092, "train_info/time_within_train_step": 25.255555391311646, "step": 1092}
{"train_info/time_between_train_steps": 0.010962247848510742, "step": 1092}
{"info/global_step": 1093, "train_info/time_within_train_step": 25.02953577041626, "step": 1093}
{"train_info/time_between_train_steps": 0.006348371505737305, "step": 1093}
{"info/global_step": 1094, "train_info/time_within_train_step": 25.214500427246094, "step": 1094}
{"train_info/time_between_train_steps": 0.014543533325195312, "step": 1094}
{"info/global_step": 1095, "train_info/time_within_train_step": 25.015254020690918, "step": 1095}
{"train_info/time_between_train_steps": 0.01628899574279785, "step": 1095}
{"info/global_step": 1096, "train_info/time_within_train_step": 25.12826108932495, "step": 1096}
{"train_info/time_between_train_steps": 0.006868600845336914, "step": 1096}
{"info/global_step": 1097, "train_info/time_within_train_step": 25.11517071723938, "step": 1097}
{"train_info/time_between_train_steps": 0.009893178939819336, "step": 1097}
{"info/global_step": 1098, "train_info/time_within_train_step": 24.995494842529297, "step": 1098}
{"train_info/time_between_train_steps": 0.005620479583740234, "step": 1098}
{"info/global_step": 1099, "train_info/time_within_train_step": 24.995827436447144, "step": 1099}
{"train_info/time_between_train_steps": 0.0054018497467041016, "step": 1099}
{"info/global_step": 1100, "train_info/time_within_train_step": 25.01338768005371, "step": 1100}
{"train_info": {"train_info/memory_allocated": 1581.5546875, "train_info/memory_max_allocated": 18057.0224609375, "train_info/memory_reserved": 21960.0, "train_info/memory_max_reserved": 21960.0, "_timestamp": 1734234802, "_runtime": 27864}, "step": 1100}
{"logs": {"train/loss": 2.6071, "train/learning_rate": 5.5555555555555545e-05, "train/epoch": 30.02, "_timestamp": 1734234802, "_runtime": 27864}, "step": 1100}
{"train_info/time_between_train_steps": 2.0173261165618896, "step": 1100}
{"info/global_step": 1101, "train_info/time_within_train_step": 25.019257307052612, "step": 1101}
{"train_info/time_between_train_steps": 0.005467414855957031, "step": 1101}
{"info/global_step": 1102, "train_info/time_within_train_step": 24.99345898628235, "step": 1102}
{"train_info/time_between_train_steps": 0.01022195816040039, "step": 1102}
{"info/global_step": 1103, "train_info/time_within_train_step": 25.021325826644897, "step": 1103}
{"train_info/time_between_train_steps": 0.010655641555786133, "step": 1103}
{"info/global_step": 1104, "train_info/time_within_train_step": 24.934897661209106, "step": 1104}
{"train_info/time_between_train_steps": 0.005366086959838867, "step": 1104}
{"info/global_step": 1105, "train_info/time_within_train_step": 24.95122528076172, "step": 1105}
{"train_info/time_between_train_steps": 0.010321378707885742, "step": 1105}
{"info/global_step": 1106, "train_info/time_within_train_step": 24.990858554840088, "step": 1106}
{"train_info/time_between_train_steps": 0.005572795867919922, "step": 1106}
{"info/global_step": 1107, "train_info/time_within_train_step": 25.01461148262024, "step": 1107}
{"train_info/time_between_train_steps": 0.014860391616821289, "step": 1107}
{"info/global_step": 1108, "train_info/time_within_train_step": 25.010425806045532, "step": 1108}
{"train_info/time_between_train_steps": 0.010004043579101562, "step": 1108}
{"info/global_step": 1109, "train_info/time_within_train_step": 25.00536322593689, "step": 1109}
{"train_info/time_between_train_steps": 0.0053098201751708984, "step": 1109}
{"info/global_step": 1110, "train_info/time_within_train_step": 25.042315244674683, "step": 1110}
{"train_info/time_between_train_steps": 0.006187915802001953, "step": 1110}
{"info/global_step": 1111, "train_info/time_within_train_step": 25.15181875228882, "step": 1111}
{"train_info/time_between_train_steps": 0.01511240005493164, "step": 1111}
{"info/global_step": 1112, "train_info/time_within_train_step": 25.139058113098145, "step": 1112}
{"train_info/time_between_train_steps": 0.010045051574707031, "step": 1112}
{"info/global_step": 1113, "train_info/time_within_train_step": 25.036694765090942, "step": 1113}
{"train_info/time_between_train_steps": 0.005528450012207031, "step": 1113}
{"info/global_step": 1114, "train_info/time_within_train_step": 25.014702320098877, "step": 1114}
{"train_info/time_between_train_steps": 0.005644798278808594, "step": 1114}
{"info/global_step": 1115, "train_info/time_within_train_step": 25.0798602104187, "step": 1115}
{"train_info/time_between_train_steps": 0.006386756896972656, "step": 1115}
{"info/global_step": 1116, "train_info/time_within_train_step": 25.049476146697998, "step": 1116}
{"train_info/time_between_train_steps": 0.016310930252075195, "step": 1116}
{"train_info/time_between_train_steps": 13.242783069610596, "step": 1116}
{"info/global_step": 1117, "train_info/time_within_train_step": 25.487516403198242, "step": 1117}
{"train_info/time_between_train_steps": 0.014073848724365234, "step": 1117}
{"info/global_step": 1118, "train_info/time_within_train_step": 25.285876035690308, "step": 1118}
{"train_info/time_between_train_steps": 0.015307426452636719, "step": 1118}
{"info/global_step": 1119, "train_info/time_within_train_step": 25.096744537353516, "step": 1119}
{"train_info/time_between_train_steps": 0.005461454391479492, "step": 1119}
{"info/global_step": 1120, "train_info/time_within_train_step": 25.20404624938965, "step": 1120}
{"train_info/time_between_train_steps": 0.006623744964599609, "step": 1120}
{"info/global_step": 1121, "train_info/time_within_train_step": 25.025688648223877, "step": 1121}
{"train_info/time_between_train_steps": 0.010332345962524414, "step": 1121}
{"info/global_step": 1122, "train_info/time_within_train_step": 25.194417476654053, "step": 1122}
{"train_info/time_between_train_steps": 0.01036691665649414, "step": 1122}
{"info/global_step": 1123, "train_info/time_within_train_step": 25.064131021499634, "step": 1123}
{"train_info/time_between_train_steps": 0.010434627532958984, "step": 1123}
{"info/global_step": 1124, "train_info/time_within_train_step": 25.04735040664673, "step": 1124}
{"train_info/time_between_train_steps": 0.00997018814086914, "step": 1124}
{"info/global_step": 1125, "train_info/time_within_train_step": 25.014514923095703, "step": 1125}
{"train_info/time_between_train_steps": 0.010246992111206055, "step": 1125}
{"info/global_step": 1126, "train_info/time_within_train_step": 25.223379850387573, "step": 1126}
{"train_info/time_between_train_steps": 0.005545377731323242, "step": 1126}
{"info/global_step": 1127, "train_info/time_within_train_step": 25.034351348876953, "step": 1127}
{"train_info/time_between_train_steps": 0.0059468746185302734, "step": 1127}
{"info/global_step": 1128, "train_info/time_within_train_step": 25.094465255737305, "step": 1128}
{"train_info/time_between_train_steps": 0.010747671127319336, "step": 1128}
{"info/global_step": 1129, "train_info/time_within_train_step": 25.104392051696777, "step": 1129}
{"train_info/time_between_train_steps": 0.010514259338378906, "step": 1129}
{"info/global_step": 1130, "train_info/time_within_train_step": 25.307385444641113, "step": 1130}
{"train_info/time_between_train_steps": 0.0059719085693359375, "step": 1130}
{"info/global_step": 1131, "train_info/time_within_train_step": 24.998334884643555, "step": 1131}
{"train_info/time_between_train_steps": 0.005298614501953125, "step": 1131}
{"info/global_step": 1132, "train_info/time_within_train_step": 24.94709849357605, "step": 1132}
{"train_info/time_between_train_steps": 0.005861997604370117, "step": 1132}
{"info/global_step": 1133, "train_info/time_within_train_step": 25.00478219985962, "step": 1133}
{"train_info/time_between_train_steps": 0.009565591812133789, "step": 1133}
{"info/global_step": 1134, "train_info/time_within_train_step": 25.03484320640564, "step": 1134}
{"train_info/time_between_train_steps": 0.005216121673583984, "step": 1134}
{"info/global_step": 1135, "train_info/time_within_train_step": 25.111786603927612, "step": 1135}
{"train_info/time_between_train_steps": 0.00536656379699707, "step": 1135}
{"info/global_step": 1136, "train_info/time_within_train_step": 25.031759023666382, "step": 1136}
{"train_info/time_between_train_steps": 0.005671977996826172, "step": 1136}
{"info/global_step": 1137, "train_info/time_within_train_step": 24.857640266418457, "step": 1137}
{"train_info/time_between_train_steps": 0.005110502243041992, "step": 1137}
{"info/global_step": 1138, "train_info/time_within_train_step": 25.037914514541626, "step": 1138}
{"train_info/time_between_train_steps": 0.006674289703369141, "step": 1138}
{"info/global_step": 1139, "train_info/time_within_train_step": 24.884426832199097, "step": 1139}
{"train_info/time_between_train_steps": 0.010268211364746094, "step": 1139}
{"info/global_step": 1140, "train_info/time_within_train_step": 24.874329090118408, "step": 1140}
{"train_info/time_between_train_steps": 0.010199785232543945, "step": 1140}
{"info/global_step": 1141, "train_info/time_within_train_step": 25.002544164657593, "step": 1141}
{"train_info/time_between_train_steps": 0.010281801223754883, "step": 1141}
{"info/global_step": 1142, "train_info/time_within_train_step": 25.034414052963257, "step": 1142}
{"train_info/time_between_train_steps": 0.0052890777587890625, "step": 1142}
{"info/global_step": 1143, "train_info/time_within_train_step": 24.924615621566772, "step": 1143}
{"train_info/time_between_train_steps": 0.005250692367553711, "step": 1143}
{"info/global_step": 1144, "train_info/time_within_train_step": 24.896066665649414, "step": 1144}
{"train_info/time_between_train_steps": 0.0052490234375, "step": 1144}
{"info/global_step": 1145, "train_info/time_within_train_step": 25.12397861480713, "step": 1145}
{"train_info/time_between_train_steps": 0.005365848541259766, "step": 1145}
{"info/global_step": 1146, "train_info/time_within_train_step": 24.862194061279297, "step": 1146}
{"train_info/time_between_train_steps": 0.005199909210205078, "step": 1146}
{"info/global_step": 1147, "train_info/time_within_train_step": 24.93025827407837, "step": 1147}
{"train_info/time_between_train_steps": 0.005140781402587891, "step": 1147}
{"info/global_step": 1148, "train_info/time_within_train_step": 24.993709564208984, "step": 1148}
{"train_info/time_between_train_steps": 0.00558781623840332, "step": 1148}
{"info/global_step": 1149, "train_info/time_within_train_step": 24.96273684501648, "step": 1149}
{"train_info/time_between_train_steps": 0.0057718753814697266, "step": 1149}
{"info/global_step": 1150, "train_info/time_within_train_step": 25.064360857009888, "step": 1150}
{"train_info": {"train_info/memory_allocated": 1581.5546875, "train_info/memory_max_allocated": 18057.0224609375, "train_info/memory_reserved": 21960.0, "train_info/memory_max_reserved": 21960.0, "_timestamp": 1734236070, "_runtime": 29132}, "step": 1150}
{"logs": {"train/loss": 2.5836, "train/learning_rate": 2.7777777777777772e-05, "train/epoch": 31.03, "_timestamp": 1734236070, "_runtime": 29132}, "step": 1150}
{"train_info/time_between_train_steps": 0.013059377670288086, "step": 1150}
{"info/global_step": 1151, "train_info/time_within_train_step": 24.957296133041382, "step": 1151}
{"train_info/time_between_train_steps": 0.005991220474243164, "step": 1151}
{"info/global_step": 1152, "train_info/time_within_train_step": 24.946276903152466, "step": 1152}
{"train_info/time_between_train_steps": 0.010535240173339844, "step": 1152}
{"train_info/time_between_train_steps": 13.1576087474823, "step": 1152}
{"info/global_step": 1153, "train_info/time_within_train_step": 25.001699447631836, "step": 1153}
{"train_info/time_between_train_steps": 0.010315895080566406, "step": 1153}
{"info/global_step": 1154, "train_info/time_within_train_step": 25.482551097869873, "step": 1154}
{"train_info/time_between_train_steps": 0.007317781448364258, "step": 1154}
{"info/global_step": 1155, "train_info/time_within_train_step": 25.084977626800537, "step": 1155}
{"train_info/time_between_train_steps": 0.014554977416992188, "step": 1155}
{"info/global_step": 1156, "train_info/time_within_train_step": 25.380045413970947, "step": 1156}
{"train_info/time_between_train_steps": 0.006021976470947266, "step": 1156}
{"info/global_step": 1157, "train_info/time_within_train_step": 24.958987951278687, "step": 1157}
{"train_info/time_between_train_steps": 0.006484508514404297, "step": 1157}
{"info/global_step": 1158, "train_info/time_within_train_step": 25.230862855911255, "step": 1158}
{"train_info/time_between_train_steps": 0.006818294525146484, "step": 1158}
{"info/global_step": 1159, "train_info/time_within_train_step": 25.068286418914795, "step": 1159}
{"train_info/time_between_train_steps": 0.010784149169921875, "step": 1159}
{"info/global_step": 1160, "train_info/time_within_train_step": 25.189749717712402, "step": 1160}
{"train_info/time_between_train_steps": 0.01073002815246582, "step": 1160}
{"info/global_step": 1161, "train_info/time_within_train_step": 25.025173902511597, "step": 1161}
{"train_info/time_between_train_steps": 0.010904550552368164, "step": 1161}
{"info/global_step": 1162, "train_info/time_within_train_step": 25.069690704345703, "step": 1162}
{"train_info/time_between_train_steps": 0.006017446517944336, "step": 1162}
{"info/global_step": 1163, "train_info/time_within_train_step": 25.003974437713623, "step": 1163}
{"train_info/time_between_train_steps": 0.005854606628417969, "step": 1163}
{"info/global_step": 1164, "train_info/time_within_train_step": 25.181071043014526, "step": 1164}
{"train_info/time_between_train_steps": 0.010393381118774414, "step": 1164}
{"info/global_step": 1165, "train_info/time_within_train_step": 25.041306257247925, "step": 1165}
{"train_info/time_between_train_steps": 0.0055887699127197266, "step": 1165}
{"info/global_step": 1166, "train_info/time_within_train_step": 25.186166048049927, "step": 1166}
{"train_info/time_between_train_steps": 0.01028132438659668, "step": 1166}
{"info/global_step": 1167, "train_info/time_within_train_step": 25.09328818321228, "step": 1167}
{"train_info/time_between_train_steps": 0.006104707717895508, "step": 1167}
{"info/global_step": 1168, "train_info/time_within_train_step": 25.153541564941406, "step": 1168}
{"train_info/time_between_train_steps": 0.014923095703125, "step": 1168}
{"info/global_step": 1169, "train_info/time_within_train_step": 25.071670055389404, "step": 1169}
{"train_info/time_between_train_steps": 0.010282516479492188, "step": 1169}
{"info/global_step": 1170, "train_info/time_within_train_step": 25.03238010406494, "step": 1170}
{"train_info/time_between_train_steps": 0.01432490348815918, "step": 1170}
{"info/global_step": 1171, "train_info/time_within_train_step": 25.0759015083313, "step": 1171}
{"train_info/time_between_train_steps": 0.009580135345458984, "step": 1171}
{"info/global_step": 1172, "train_info/time_within_train_step": 25.176930904388428, "step": 1172}
{"train_info/time_between_train_steps": 0.01103973388671875, "step": 1172}
{"info/global_step": 1173, "train_info/time_within_train_step": 25.1403648853302, "step": 1173}
{"train_info/time_between_train_steps": 0.010315179824829102, "step": 1173}
{"info/global_step": 1174, "train_info/time_within_train_step": 24.993558883666992, "step": 1174}
{"train_info/time_between_train_steps": 0.005776643753051758, "step": 1174}
{"info/global_step": 1175, "train_info/time_within_train_step": 25.02325129508972, "step": 1175}
{"train_info/time_between_train_steps": 0.005548954010009766, "step": 1175}
{"info/global_step": 1176, "train_info/time_within_train_step": 25.177183866500854, "step": 1176}
{"train_info/time_between_train_steps": 0.007903575897216797, "step": 1176}
{"info/global_step": 1177, "train_info/time_within_train_step": 24.960387468338013, "step": 1177}
{"train_info/time_between_train_steps": 0.0067555904388427734, "step": 1177}
{"info/global_step": 1178, "train_info/time_within_train_step": 25.062332153320312, "step": 1178}
{"train_info/time_between_train_steps": 0.0077288150787353516, "step": 1178}
{"info/global_step": 1179, "train_info/time_within_train_step": 24.992783308029175, "step": 1179}
{"train_info/time_between_train_steps": 0.009744882583618164, "step": 1179}
{"info/global_step": 1180, "train_info/time_within_train_step": 24.97348117828369, "step": 1180}
{"train_info/time_between_train_steps": 0.005593061447143555, "step": 1180}
{"info/global_step": 1181, "train_info/time_within_train_step": 24.923481225967407, "step": 1181}
{"train_info/time_between_train_steps": 0.009724140167236328, "step": 1181}
{"info/global_step": 1182, "train_info/time_within_train_step": 25.06716275215149, "step": 1182}
{"train_info/time_between_train_steps": 0.006110668182373047, "step": 1182}
{"info/global_step": 1183, "train_info/time_within_train_step": 24.98671531677246, "step": 1183}
{"train_info/time_between_train_steps": 0.005563974380493164, "step": 1183}
{"info/global_step": 1184, "train_info/time_within_train_step": 24.990042686462402, "step": 1184}
{"train_info/time_between_train_steps": 0.010550260543823242, "step": 1184}
{"info/global_step": 1185, "train_info/time_within_train_step": 25.037740468978882, "step": 1185}
{"train_info/time_between_train_steps": 0.006591796875, "step": 1185}
{"info/global_step": 1186, "train_info/time_within_train_step": 24.998703002929688, "step": 1186}
{"train_info/time_between_train_steps": 0.00948333740234375, "step": 1186}
{"info/global_step": 1187, "train_info/time_within_train_step": 25.125373125076294, "step": 1187}
{"train_info/time_between_train_steps": 0.006422758102416992, "step": 1187}
{"info/global_step": 1188, "train_info/time_within_train_step": 25.085599660873413, "step": 1188}
{"train_info/time_between_train_steps": 0.006136178970336914, "step": 1188}
{"train_info/time_between_train_steps": 13.503971338272095, "step": 1188}
{"info/global_step": 1189, "train_info/time_within_train_step": 24.935739040374756, "step": 1189}
{"train_info/time_between_train_steps": 0.010036945343017578, "step": 1189}
{"info/global_step": 1190, "train_info/time_within_train_step": 25.036383152008057, "step": 1190}
{"train_info/time_between_train_steps": 0.005180835723876953, "step": 1190}
{"info/global_step": 1191, "train_info/time_within_train_step": 24.961068868637085, "step": 1191}
{"train_info/time_between_train_steps": 0.005414247512817383, "step": 1191}
{"info/global_step": 1192, "train_info/time_within_train_step": 25.122676610946655, "step": 1192}
{"train_info/time_between_train_steps": 0.005445957183837891, "step": 1192}
{"info/global_step": 1193, "train_info/time_within_train_step": 25.067089319229126, "step": 1193}
{"train_info/time_between_train_steps": 0.010284185409545898, "step": 1193}
{"info/global_step": 1194, "train_info/time_within_train_step": 25.116291046142578, "step": 1194}
{"train_info/time_between_train_steps": 0.0056226253509521484, "step": 1194}
{"info/global_step": 1195, "train_info/time_within_train_step": 25.074463367462158, "step": 1195}
{"train_info/time_between_train_steps": 0.010284662246704102, "step": 1195}
{"info/global_step": 1196, "train_info/time_within_train_step": 25.130858659744263, "step": 1196}
{"train_info/time_between_train_steps": 0.0058100223541259766, "step": 1196}
{"info/global_step": 1197, "train_info/time_within_train_step": 25.065150260925293, "step": 1197}
{"train_info/time_between_train_steps": 0.010676145553588867, "step": 1197}
{"info/global_step": 1198, "train_info/time_within_train_step": 25.178067922592163, "step": 1198}
{"train_info/time_between_train_steps": 0.016268491744995117, "step": 1198}
{"info/global_step": 1199, "train_info/time_within_train_step": 25.042709827423096, "step": 1199}
{"train_info/time_between_train_steps": 0.0056591033935546875, "step": 1199}
{"info/global_step": 1200, "train_info/time_within_train_step": 25.127809762954712, "step": 1200}
{"train_info": {"train_info/memory_allocated": 1581.5546875, "train_info/memory_max_allocated": 18057.0224609375, "train_info/memory_reserved": 21960.0, "train_info/memory_max_reserved": 21960.0, "_timestamp": 1734237351, "_runtime": 30413}, "step": 1200}
{"logs": {"train/loss": 2.5862, "train/learning_rate": 0.0, "train/epoch": 33.01, "_timestamp": 1734237351, "_runtime": 30413}, "step": 1200}
{"train_info": {"train_info/memory_allocated": 1581.5546875, "train_info/memory_max_allocated": 18057.0224609375, "train_info/memory_reserved": 21960.0, "train_info/memory_max_reserved": 21960.0, "_timestamp": 1734237354, "_runtime": 30416}, "step": 1200}
{"logs": {"train/train_runtime": 30416.2883, "train/train_samples_per_second": 20.2, "train/train_steps_per_second": 0.039, "train/total_flos": 3.24507458469888e+17, "train/train_loss": 3.356172176202138, "train/epoch": 33.01, "_timestamp": 1734237354, "_runtime": 30416}, "step": 1200}
{"train_info": {"train_info/memory_allocated": 1581.5537109375, "train_info/memory_max_allocated": 18057.0224609375, "train_info/memory_reserved": 21960.0, "train_info/memory_max_reserved": 21960.0, "_timestamp": 1734237357, "_runtime": 30419}, "step": 1200}
{"logs": {"eval/loss": 3.416703939437866, "eval/runtime": 2.254, "eval/samples_per_second": 58.118, "eval/steps_per_second": 3.993, "train/epoch": 33.01, "_timestamp": 1734237357, "_runtime": 30419}, "step": 1200}
{"train_info": {"train_info/memory_allocated": 1581.5537109375, "train_info/memory_max_allocated": 18057.0224609375, "train_info/memory_reserved": 21960.0, "train_info/memory_max_reserved": 21960.0, "_timestamp": 1734237357, "_runtime": 30419}, "step": 1200}
{"logs": {"eval//local/xiulyang/mission-impossible-language-models/training/babylm_dataset.py_loss": 3.416703939437866, "eval//local/xiulyang/mission-impossible-language-models/training/babylm_dataset.py_ppl": 30.46882224879666, "eval//local/xiulyang/mission-impossible-language-models/training/babylm_dataset.py_runtime": 2.254, "eval//local/xiulyang/mission-impossible-language-models/training/babylm_dataset.py_samples_per_second": 58.118, "train/epoch": 33.01, "_timestamp": 1734237357, "_runtime": 30419}, "step": 1200}