shuffle_control_EN53 / metrics.json
xiulinyang's picture
Adding model checkpoints and config files
b9a799a
{"num_parameters": 124439808, "trainable_parameters": 124439808, "step": 0}
{"train_info/time_between_train_steps": 3.681506872177124, "step": 0}
{"info/global_step": 1, "train_info/time_within_train_step": 33.22588038444519, "step": 1}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 19761.71484375, "train_info/memory_reserved": 22624.0, "train_info/memory_max_reserved": 22624.0, "_timestamp": 1733687534, "_runtime": 40}, "step": 1}
{"logs": {"train/loss": 11.0211, "train/learning_rate": 4.9999999999999996e-06, "train/epoch": 0.0, "_timestamp": 1733687533, "_runtime": 39}, "step": 1}
{"train_info/time_between_train_steps": 0.13153982162475586, "step": 1}
{"info/global_step": 2, "train_info/time_within_train_step": 32.72058963775635, "step": 2}
{"train_info/time_between_train_steps": 0.00590825080871582, "step": 2}
{"info/global_step": 3, "train_info/time_within_train_step": 32.39141607284546, "step": 3}
{"train_info/time_between_train_steps": 0.006356477737426758, "step": 3}
{"info/global_step": 4, "train_info/time_within_train_step": 32.636337995529175, "step": 4}
{"train_info/time_between_train_steps": 0.005725383758544922, "step": 4}
{"info/global_step": 5, "train_info/time_within_train_step": 32.430628538131714, "step": 5}
{"train_info/time_between_train_steps": 0.006144523620605469, "step": 5}
{"info/global_step": 6, "train_info/time_within_train_step": 32.658926010131836, "step": 6}
{"train_info/time_between_train_steps": 0.006003379821777344, "step": 6}
{"info/global_step": 7, "train_info/time_within_train_step": 32.36413836479187, "step": 7}
{"train_info/time_between_train_steps": 0.010534048080444336, "step": 7}
{"info/global_step": 8, "train_info/time_within_train_step": 32.44034552574158, "step": 8}
{"train_info/time_between_train_steps": 0.00601959228515625, "step": 8}
{"info/global_step": 9, "train_info/time_within_train_step": 32.39487171173096, "step": 9}
{"train_info/time_between_train_steps": 0.005428791046142578, "step": 9}
{"info/global_step": 10, "train_info/time_within_train_step": 32.517645835876465, "step": 10}
{"train_info/time_between_train_steps": 0.005632877349853516, "step": 10}
{"info/global_step": 11, "train_info/time_within_train_step": 32.37699794769287, "step": 11}
{"train_info/time_between_train_steps": 0.005662441253662109, "step": 11}
{"info/global_step": 12, "train_info/time_within_train_step": 32.46292209625244, "step": 12}
{"train_info/time_between_train_steps": 0.005791187286376953, "step": 12}
{"info/global_step": 13, "train_info/time_within_train_step": 32.49907851219177, "step": 13}
{"train_info/time_between_train_steps": 0.005543708801269531, "step": 13}
{"info/global_step": 14, "train_info/time_within_train_step": 32.252946615219116, "step": 14}
{"train_info/time_between_train_steps": 0.00616002082824707, "step": 14}
{"info/global_step": 15, "train_info/time_within_train_step": 32.621471881866455, "step": 15}
{"train_info/time_between_train_steps": 0.006241321563720703, "step": 15}
{"info/global_step": 16, "train_info/time_within_train_step": 32.598816871643066, "step": 16}
{"train_info/time_between_train_steps": 0.005595207214355469, "step": 16}
{"info/global_step": 17, "train_info/time_within_train_step": 32.5531108379364, "step": 17}
{"train_info/time_between_train_steps": 0.005505561828613281, "step": 17}
{"info/global_step": 18, "train_info/time_within_train_step": 32.55298733711243, "step": 18}
{"train_info/time_between_train_steps": 0.005753040313720703, "step": 18}
{"info/global_step": 19, "train_info/time_within_train_step": 32.35093402862549, "step": 19}
{"train_info/time_between_train_steps": 0.005387067794799805, "step": 19}
{"info/global_step": 20, "train_info/time_within_train_step": 32.461787939071655, "step": 20}
{"train_info/time_between_train_steps": 0.005430459976196289, "step": 20}
{"info/global_step": 21, "train_info/time_within_train_step": 32.358699560165405, "step": 21}
{"train_info/time_between_train_steps": 0.005429744720458984, "step": 21}
{"info/global_step": 22, "train_info/time_within_train_step": 32.40512204170227, "step": 22}
{"train_info/time_between_train_steps": 0.005663394927978516, "step": 22}
{"info/global_step": 23, "train_info/time_within_train_step": 32.56002354621887, "step": 23}
{"train_info/time_between_train_steps": 0.006043195724487305, "step": 23}
{"info/global_step": 24, "train_info/time_within_train_step": 32.43665409088135, "step": 24}
{"train_info/time_between_train_steps": 0.006052494049072266, "step": 24}
{"info/global_step": 25, "train_info/time_within_train_step": 32.565892934799194, "step": 25}
{"train_info/time_between_train_steps": 0.005631923675537109, "step": 25}
{"info/global_step": 26, "train_info/time_within_train_step": 32.302213191986084, "step": 26}
{"train_info/time_between_train_steps": 0.006437540054321289, "step": 26}
{"info/global_step": 27, "train_info/time_within_train_step": 32.55335092544556, "step": 27}
{"train_info/time_between_train_steps": 0.006242036819458008, "step": 27}
{"train_info/time_between_train_steps": 23.862852573394775, "step": 27}
{"info/global_step": 28, "train_info/time_within_train_step": 32.345072507858276, "step": 28}
{"train_info/time_between_train_steps": 0.005890607833862305, "step": 28}
{"info/global_step": 29, "train_info/time_within_train_step": 32.83443856239319, "step": 29}
{"train_info/time_between_train_steps": 0.005501747131347656, "step": 29}
{"info/global_step": 30, "train_info/time_within_train_step": 32.35546088218689, "step": 30}
{"train_info/time_between_train_steps": 0.005373239517211914, "step": 30}
{"info/global_step": 31, "train_info/time_within_train_step": 32.88064789772034, "step": 31}
{"train_info/time_between_train_steps": 0.005957603454589844, "step": 31}
{"info/global_step": 32, "train_info/time_within_train_step": 32.293885469436646, "step": 32}
{"train_info/time_between_train_steps": 0.00883173942565918, "step": 32}
{"info/global_step": 33, "train_info/time_within_train_step": 32.57368040084839, "step": 33}
{"train_info/time_between_train_steps": 0.005586862564086914, "step": 33}
{"info/global_step": 34, "train_info/time_within_train_step": 32.33747148513794, "step": 34}
{"train_info/time_between_train_steps": 0.005339384078979492, "step": 34}
{"info/global_step": 35, "train_info/time_within_train_step": 32.41392922401428, "step": 35}
{"train_info/time_between_train_steps": 0.005402326583862305, "step": 35}
{"info/global_step": 36, "train_info/time_within_train_step": 32.36069965362549, "step": 36}
{"train_info/time_between_train_steps": 0.01003122329711914, "step": 36}
{"info/global_step": 37, "train_info/time_within_train_step": 32.42470741271973, "step": 37}
{"train_info/time_between_train_steps": 0.005098104476928711, "step": 37}
{"info/global_step": 38, "train_info/time_within_train_step": 32.380805253982544, "step": 38}
{"train_info/time_between_train_steps": 0.011169195175170898, "step": 38}
{"info/global_step": 39, "train_info/time_within_train_step": 32.39061737060547, "step": 39}
{"train_info/time_between_train_steps": 0.010234594345092773, "step": 39}
{"info/global_step": 40, "train_info/time_within_train_step": 32.30612111091614, "step": 40}
{"train_info/time_between_train_steps": 0.005423069000244141, "step": 40}
{"info/global_step": 41, "train_info/time_within_train_step": 32.61903095245361, "step": 41}
{"train_info/time_between_train_steps": 0.010092735290527344, "step": 41}
{"info/global_step": 42, "train_info/time_within_train_step": 32.308091163635254, "step": 42}
{"train_info/time_between_train_steps": 0.005415916442871094, "step": 42}
{"info/global_step": 43, "train_info/time_within_train_step": 32.256468772888184, "step": 43}
{"train_info/time_between_train_steps": 0.011347293853759766, "step": 43}
{"info/global_step": 44, "train_info/time_within_train_step": 32.061687707901, "step": 44}
{"train_info/time_between_train_steps": 0.005226612091064453, "step": 44}
{"info/global_step": 45, "train_info/time_within_train_step": 32.240567684173584, "step": 45}
{"train_info/time_between_train_steps": 0.005194425582885742, "step": 45}
{"info/global_step": 46, "train_info/time_within_train_step": 32.567339181900024, "step": 46}
{"train_info/time_between_train_steps": 0.010123491287231445, "step": 46}
{"info/global_step": 47, "train_info/time_within_train_step": 32.51317834854126, "step": 47}
{"train_info/time_between_train_steps": 0.005365848541259766, "step": 47}
{"info/global_step": 48, "train_info/time_within_train_step": 32.58642864227295, "step": 48}
{"train_info/time_between_train_steps": 0.008160591125488281, "step": 48}
{"info/global_step": 49, "train_info/time_within_train_step": 32.60082817077637, "step": 49}
{"train_info/time_between_train_steps": 0.010134220123291016, "step": 49}
{"info/global_step": 50, "train_info/time_within_train_step": 32.61146378517151, "step": 50}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1733689149, "_runtime": 1655}, "step": 50}
{"logs": {"train/loss": 7.9711, "train/learning_rate": 0.00025, "train/epoch": 1.02, "_timestamp": 1733689149, "_runtime": 1655}, "step": 50}
{"train_info/time_between_train_steps": 0.0076160430908203125, "step": 50}
{"info/global_step": 51, "train_info/time_within_train_step": 32.46914315223694, "step": 51}
{"train_info/time_between_train_steps": 0.005556344985961914, "step": 51}
{"info/global_step": 52, "train_info/time_within_train_step": 32.438995122909546, "step": 52}
{"train_info/time_between_train_steps": 0.0054318904876708984, "step": 52}
{"info/global_step": 53, "train_info/time_within_train_step": 32.52835655212402, "step": 53}
{"train_info/time_between_train_steps": 0.00573277473449707, "step": 53}
{"info/global_step": 54, "train_info/time_within_train_step": 32.51054930686951, "step": 54}
{"train_info/time_between_train_steps": 0.005850553512573242, "step": 54}
{"train_info/time_between_train_steps": 23.461182594299316, "step": 54}
{"info/global_step": 55, "train_info/time_within_train_step": 32.57023000717163, "step": 55}
{"train_info/time_between_train_steps": 0.005537271499633789, "step": 55}
{"info/global_step": 56, "train_info/time_within_train_step": 32.4339120388031, "step": 56}
{"train_info/time_between_train_steps": 0.0054171085357666016, "step": 56}
{"info/global_step": 57, "train_info/time_within_train_step": 32.30394744873047, "step": 57}
{"train_info/time_between_train_steps": 0.010027647018432617, "step": 57}
{"info/global_step": 58, "train_info/time_within_train_step": 32.68250012397766, "step": 58}
{"train_info/time_between_train_steps": 0.01027059555053711, "step": 58}
{"info/global_step": 59, "train_info/time_within_train_step": 32.158254623413086, "step": 59}
{"train_info/time_between_train_steps": 0.005869626998901367, "step": 59}
{"info/global_step": 60, "train_info/time_within_train_step": 32.369914054870605, "step": 60}
{"train_info/time_between_train_steps": 0.00534510612487793, "step": 60}
{"info/global_step": 61, "train_info/time_within_train_step": 32.420798778533936, "step": 61}
{"train_info/time_between_train_steps": 0.005859851837158203, "step": 61}
{"info/global_step": 62, "train_info/time_within_train_step": 32.63410258293152, "step": 62}
{"train_info/time_between_train_steps": 0.005476236343383789, "step": 62}
{"info/global_step": 63, "train_info/time_within_train_step": 32.41828775405884, "step": 63}
{"train_info/time_between_train_steps": 0.010463714599609375, "step": 63}
{"info/global_step": 64, "train_info/time_within_train_step": 32.4257378578186, "step": 64}
{"train_info/time_between_train_steps": 0.005172252655029297, "step": 64}
{"info/global_step": 65, "train_info/time_within_train_step": 32.392709732055664, "step": 65}
{"train_info/time_between_train_steps": 0.005156278610229492, "step": 65}
{"info/global_step": 66, "train_info/time_within_train_step": 32.33672904968262, "step": 66}
{"train_info/time_between_train_steps": 0.010639190673828125, "step": 66}
{"info/global_step": 67, "train_info/time_within_train_step": 32.19670391082764, "step": 67}
{"train_info/time_between_train_steps": 0.005235910415649414, "step": 67}
{"info/global_step": 68, "train_info/time_within_train_step": 32.057944774627686, "step": 68}
{"train_info/time_between_train_steps": 0.00511932373046875, "step": 68}
{"info/global_step": 69, "train_info/time_within_train_step": 32.52954649925232, "step": 69}
{"train_info/time_between_train_steps": 0.008227348327636719, "step": 69}
{"info/global_step": 70, "train_info/time_within_train_step": 32.38155484199524, "step": 70}
{"train_info/time_between_train_steps": 0.008871316909790039, "step": 70}
{"info/global_step": 71, "train_info/time_within_train_step": 32.61561393737793, "step": 71}
{"train_info/time_between_train_steps": 0.005509853363037109, "step": 71}
{"info/global_step": 72, "train_info/time_within_train_step": 32.27597165107727, "step": 72}
{"train_info/time_between_train_steps": 0.005113124847412109, "step": 72}
{"info/global_step": 73, "train_info/time_within_train_step": 32.42532801628113, "step": 73}
{"train_info/time_between_train_steps": 0.005334615707397461, "step": 73}
{"info/global_step": 74, "train_info/time_within_train_step": 32.513357400894165, "step": 74}
{"train_info/time_between_train_steps": 0.007593393325805664, "step": 74}
{"info/global_step": 75, "train_info/time_within_train_step": 32.734588623046875, "step": 75}
{"train_info/time_between_train_steps": 0.005380153656005859, "step": 75}
{"info/global_step": 76, "train_info/time_within_train_step": 32.24607968330383, "step": 76}
{"train_info/time_between_train_steps": 0.005426883697509766, "step": 76}
{"info/global_step": 77, "train_info/time_within_train_step": 32.580296754837036, "step": 77}
{"train_info/time_between_train_steps": 0.005338430404663086, "step": 77}
{"info/global_step": 78, "train_info/time_within_train_step": 32.34770631790161, "step": 78}
{"train_info/time_between_train_steps": 0.008155345916748047, "step": 78}
{"info/global_step": 79, "train_info/time_within_train_step": 32.62880873680115, "step": 79}
{"train_info/time_between_train_steps": 0.0054361820220947266, "step": 79}
{"info/global_step": 80, "train_info/time_within_train_step": 32.75647330284119, "step": 80}
{"train_info/time_between_train_steps": 0.005555152893066406, "step": 80}
{"info/global_step": 81, "train_info/time_within_train_step": 32.34639072418213, "step": 81}
{"train_info/time_between_train_steps": 0.00612640380859375, "step": 81}
{"train_info/time_between_train_steps": 23.536869287490845, "step": 81}
{"info/global_step": 82, "train_info/time_within_train_step": 32.74170231819153, "step": 82}
{"train_info/time_between_train_steps": 0.005364894866943359, "step": 82}
{"info/global_step": 83, "train_info/time_within_train_step": 32.34957313537598, "step": 83}
{"train_info/time_between_train_steps": 0.007855653762817383, "step": 83}
{"info/global_step": 84, "train_info/time_within_train_step": 32.54166531562805, "step": 84}
{"train_info/time_between_train_steps": 0.006979227066040039, "step": 84}
{"info/global_step": 85, "train_info/time_within_train_step": 32.513529539108276, "step": 85}
{"train_info/time_between_train_steps": 0.0054569244384765625, "step": 85}
{"info/global_step": 86, "train_info/time_within_train_step": 32.48696041107178, "step": 86}
{"train_info/time_between_train_steps": 0.00868844985961914, "step": 86}
{"info/global_step": 87, "train_info/time_within_train_step": 32.65245079994202, "step": 87}
{"train_info/time_between_train_steps": 0.005691051483154297, "step": 87}
{"info/global_step": 88, "train_info/time_within_train_step": 32.47171425819397, "step": 88}
{"train_info/time_between_train_steps": 0.0072650909423828125, "step": 88}
{"info/global_step": 89, "train_info/time_within_train_step": 32.61938261985779, "step": 89}
{"train_info/time_between_train_steps": 0.005521535873413086, "step": 89}
{"info/global_step": 90, "train_info/time_within_train_step": 32.601402044296265, "step": 90}
{"train_info/time_between_train_steps": 0.005397796630859375, "step": 90}
{"info/global_step": 91, "train_info/time_within_train_step": 32.34563612937927, "step": 91}
{"train_info/time_between_train_steps": 0.005249738693237305, "step": 91}
{"info/global_step": 92, "train_info/time_within_train_step": 32.48661398887634, "step": 92}
{"train_info/time_between_train_steps": 0.008261442184448242, "step": 92}
{"info/global_step": 93, "train_info/time_within_train_step": 32.52534008026123, "step": 93}
{"train_info/time_between_train_steps": 0.00522613525390625, "step": 93}
{"info/global_step": 94, "train_info/time_within_train_step": 32.236693382263184, "step": 94}
{"train_info/time_between_train_steps": 0.005201101303100586, "step": 94}
{"info/global_step": 95, "train_info/time_within_train_step": 32.270127058029175, "step": 95}
{"train_info/time_between_train_steps": 0.008975744247436523, "step": 95}
{"info/global_step": 96, "train_info/time_within_train_step": 32.81215286254883, "step": 96}
{"train_info/time_between_train_steps": 0.0053980350494384766, "step": 96}
{"info/global_step": 97, "train_info/time_within_train_step": 32.3338098526001, "step": 97}
{"train_info/time_between_train_steps": 0.007978677749633789, "step": 97}
{"info/global_step": 98, "train_info/time_within_train_step": 32.3461709022522, "step": 98}
{"train_info/time_between_train_steps": 0.005184173583984375, "step": 98}
{"info/global_step": 99, "train_info/time_within_train_step": 32.64952850341797, "step": 99}
{"train_info/time_between_train_steps": 0.005248546600341797, "step": 99}
{"info/global_step": 100, "train_info/time_within_train_step": 32.43440246582031, "step": 100}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1733690819, "_runtime": 3325}, "step": 100}
{"logs": {"train/loss": 5.744, "train/learning_rate": 0.0005, "train/epoch": 3.02, "_timestamp": 1733690819, "_runtime": 3325}, "step": 100}
{"train_info/time_between_train_steps": 2.8307416439056396, "step": 100}
{"info/global_step": 101, "train_info/time_within_train_step": 32.478431701660156, "step": 101}
{"train_info/time_between_train_steps": 0.010165214538574219, "step": 101}
{"info/global_step": 102, "train_info/time_within_train_step": 32.743590354919434, "step": 102}
{"train_info/time_between_train_steps": 0.0053708553314208984, "step": 102}
{"info/global_step": 103, "train_info/time_within_train_step": 32.373923778533936, "step": 103}
{"train_info/time_between_train_steps": 0.0076296329498291016, "step": 103}
{"info/global_step": 104, "train_info/time_within_train_step": 32.4801881313324, "step": 104}
{"train_info/time_between_train_steps": 0.005274534225463867, "step": 104}
{"info/global_step": 105, "train_info/time_within_train_step": 32.4980149269104, "step": 105}
{"train_info/time_between_train_steps": 0.005313873291015625, "step": 105}
{"info/global_step": 106, "train_info/time_within_train_step": 32.40939927101135, "step": 106}
{"train_info/time_between_train_steps": 0.010514259338378906, "step": 106}
{"info/global_step": 107, "train_info/time_within_train_step": 32.730350732803345, "step": 107}
{"train_info/time_between_train_steps": 0.005681753158569336, "step": 107}
{"info/global_step": 108, "train_info/time_within_train_step": 32.27839517593384, "step": 108}
{"train_info/time_between_train_steps": 0.005709171295166016, "step": 108}
{"train_info/time_between_train_steps": 24.017690658569336, "step": 108}
{"info/global_step": 109, "train_info/time_within_train_step": 32.56250190734863, "step": 109}
{"train_info/time_between_train_steps": 0.0058252811431884766, "step": 109}
{"info/global_step": 110, "train_info/time_within_train_step": 32.50545859336853, "step": 110}
{"train_info/time_between_train_steps": 0.005808353424072266, "step": 110}
{"info/global_step": 111, "train_info/time_within_train_step": 32.42155432701111, "step": 111}
{"train_info/time_between_train_steps": 0.005364418029785156, "step": 111}
{"info/global_step": 112, "train_info/time_within_train_step": 32.83249831199646, "step": 112}
{"train_info/time_between_train_steps": 0.005339622497558594, "step": 112}
{"info/global_step": 113, "train_info/time_within_train_step": 32.30735397338867, "step": 113}
{"train_info/time_between_train_steps": 0.0074579715728759766, "step": 113}
{"info/global_step": 114, "train_info/time_within_train_step": 32.571003437042236, "step": 114}
{"train_info/time_between_train_steps": 0.0056760311126708984, "step": 114}
{"info/global_step": 115, "train_info/time_within_train_step": 32.483400106430054, "step": 115}
{"train_info/time_between_train_steps": 0.010178327560424805, "step": 115}
{"info/global_step": 116, "train_info/time_within_train_step": 32.41589689254761, "step": 116}
{"train_info/time_between_train_steps": 0.005427122116088867, "step": 116}
{"info/global_step": 117, "train_info/time_within_train_step": 32.2336266040802, "step": 117}
{"train_info/time_between_train_steps": 0.006546735763549805, "step": 117}
{"info/global_step": 118, "train_info/time_within_train_step": 32.67556881904602, "step": 118}
{"train_info/time_between_train_steps": 0.007224321365356445, "step": 118}
{"info/global_step": 119, "train_info/time_within_train_step": 32.375739336013794, "step": 119}
{"train_info/time_between_train_steps": 0.007554531097412109, "step": 119}
{"info/global_step": 120, "train_info/time_within_train_step": 32.36717867851257, "step": 120}
{"train_info/time_between_train_steps": 0.005281925201416016, "step": 120}
{"info/global_step": 121, "train_info/time_within_train_step": 32.74897646903992, "step": 121}
{"train_info/time_between_train_steps": 0.005589962005615234, "step": 121}
{"info/global_step": 122, "train_info/time_within_train_step": 32.0747344493866, "step": 122}
{"train_info/time_between_train_steps": 0.0055658817291259766, "step": 122}
{"info/global_step": 123, "train_info/time_within_train_step": 32.28490447998047, "step": 123}
{"train_info/time_between_train_steps": 0.0099945068359375, "step": 123}
{"info/global_step": 124, "train_info/time_within_train_step": 32.538254737854004, "step": 124}
{"train_info/time_between_train_steps": 0.005286216735839844, "step": 124}
{"info/global_step": 125, "train_info/time_within_train_step": 32.32377505302429, "step": 125}
{"train_info/time_between_train_steps": 0.005539655685424805, "step": 125}
{"info/global_step": 126, "train_info/time_within_train_step": 32.555620193481445, "step": 126}
{"train_info/time_between_train_steps": 0.005334138870239258, "step": 126}
{"info/global_step": 127, "train_info/time_within_train_step": 32.602896213531494, "step": 127}
{"train_info/time_between_train_steps": 0.005608081817626953, "step": 127}
{"info/global_step": 128, "train_info/time_within_train_step": 32.43479108810425, "step": 128}
{"train_info/time_between_train_steps": 0.005438327789306641, "step": 128}
{"info/global_step": 129, "train_info/time_within_train_step": 32.30211043357849, "step": 129}
{"train_info/time_between_train_steps": 0.010451316833496094, "step": 129}
{"info/global_step": 130, "train_info/time_within_train_step": 32.55166220664978, "step": 130}
{"train_info/time_between_train_steps": 0.0053920745849609375, "step": 130}
{"info/global_step": 131, "train_info/time_within_train_step": 32.40304660797119, "step": 131}
{"train_info/time_between_train_steps": 0.010200262069702148, "step": 131}
{"info/global_step": 132, "train_info/time_within_train_step": 32.149818658828735, "step": 132}
{"train_info/time_between_train_steps": 0.007139682769775391, "step": 132}
{"info/global_step": 133, "train_info/time_within_train_step": 32.59947967529297, "step": 133}
{"train_info/time_between_train_steps": 0.00653529167175293, "step": 133}
{"info/global_step": 134, "train_info/time_within_train_step": 32.322787046432495, "step": 134}
{"train_info/time_between_train_steps": 0.0058460235595703125, "step": 134}
{"info/global_step": 135, "train_info/time_within_train_step": 32.38719701766968, "step": 135}
{"train_info/time_between_train_steps": 0.011163711547851562, "step": 135}
{"train_info/time_between_train_steps": 23.615864038467407, "step": 135}
{"info/global_step": 136, "train_info/time_within_train_step": 32.92693567276001, "step": 136}
{"train_info/time_between_train_steps": 0.005370616912841797, "step": 136}
{"info/global_step": 137, "train_info/time_within_train_step": 32.30996561050415, "step": 137}
{"train_info/time_between_train_steps": 0.005300998687744141, "step": 137}
{"info/global_step": 138, "train_info/time_within_train_step": 32.4217004776001, "step": 138}
{"train_info/time_between_train_steps": 0.00520014762878418, "step": 138}
{"info/global_step": 139, "train_info/time_within_train_step": 32.727386236190796, "step": 139}
{"train_info/time_between_train_steps": 0.0055255889892578125, "step": 139}
{"info/global_step": 140, "train_info/time_within_train_step": 32.1287477016449, "step": 140}
{"train_info/time_between_train_steps": 0.010035276412963867, "step": 140}
{"info/global_step": 141, "train_info/time_within_train_step": 32.518765687942505, "step": 141}
{"train_info/time_between_train_steps": 0.005308389663696289, "step": 141}
{"info/global_step": 142, "train_info/time_within_train_step": 32.34349179267883, "step": 142}
{"train_info/time_between_train_steps": 0.005530595779418945, "step": 142}
{"info/global_step": 143, "train_info/time_within_train_step": 32.10921001434326, "step": 143}
{"train_info/time_between_train_steps": 0.008246183395385742, "step": 143}
{"info/global_step": 144, "train_info/time_within_train_step": 32.36915898323059, "step": 144}
{"train_info/time_between_train_steps": 0.005146026611328125, "step": 144}
{"info/global_step": 145, "train_info/time_within_train_step": 32.50912427902222, "step": 145}
{"train_info/time_between_train_steps": 0.010382652282714844, "step": 145}
{"info/global_step": 146, "train_info/time_within_train_step": 32.138211250305176, "step": 146}
{"train_info/time_between_train_steps": 0.005098581314086914, "step": 146}
{"info/global_step": 147, "train_info/time_within_train_step": 32.38246965408325, "step": 147}
{"train_info/time_between_train_steps": 0.0051114559173583984, "step": 147}
{"info/global_step": 148, "train_info/time_within_train_step": 32.640944957733154, "step": 148}
{"train_info/time_between_train_steps": 0.005298614501953125, "step": 148}
{"info/global_step": 149, "train_info/time_within_train_step": 32.39208436012268, "step": 149}
{"train_info/time_between_train_steps": 0.005362987518310547, "step": 149}
{"info/global_step": 150, "train_info/time_within_train_step": 32.50346851348877, "step": 150}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1733692492, "_runtime": 4998}, "step": 150}
{"logs": {"train/loss": 5.1901, "train/learning_rate": 0.0005833333333333333, "train/epoch": 5.01, "_timestamp": 1733692492, "_runtime": 4998}, "step": 150}
{"train_info/time_between_train_steps": 0.013803720474243164, "step": 150}
{"info/global_step": 151, "train_info/time_within_train_step": 32.5390567779541, "step": 151}
{"train_info/time_between_train_steps": 0.005182027816772461, "step": 151}
{"info/global_step": 152, "train_info/time_within_train_step": 32.51821565628052, "step": 152}
{"train_info/time_between_train_steps": 0.005606412887573242, "step": 152}
{"info/global_step": 153, "train_info/time_within_train_step": 32.02125430107117, "step": 153}
{"train_info/time_between_train_steps": 0.008603811264038086, "step": 153}
{"info/global_step": 154, "train_info/time_within_train_step": 32.53186082839966, "step": 154}
{"train_info/time_between_train_steps": 0.005334138870239258, "step": 154}
{"info/global_step": 155, "train_info/time_within_train_step": 32.50127410888672, "step": 155}
{"train_info/time_between_train_steps": 0.005150794982910156, "step": 155}
{"info/global_step": 156, "train_info/time_within_train_step": 32.34284687042236, "step": 156}
{"train_info/time_between_train_steps": 0.00766754150390625, "step": 156}
{"info/global_step": 157, "train_info/time_within_train_step": 32.525063037872314, "step": 157}
{"train_info/time_between_train_steps": 0.01051473617553711, "step": 157}
{"info/global_step": 158, "train_info/time_within_train_step": 32.51372575759888, "step": 158}
{"train_info/time_between_train_steps": 0.01083517074584961, "step": 158}
{"info/global_step": 159, "train_info/time_within_train_step": 32.391618728637695, "step": 159}
{"train_info/time_between_train_steps": 0.00554966926574707, "step": 159}
{"info/global_step": 160, "train_info/time_within_train_step": 32.29981732368469, "step": 160}
{"train_info/time_between_train_steps": 0.0054471492767333984, "step": 160}
{"info/global_step": 161, "train_info/time_within_train_step": 32.45966625213623, "step": 161}
{"train_info/time_between_train_steps": 0.0172119140625, "step": 161}
{"info/global_step": 162, "train_info/time_within_train_step": 32.35407781600952, "step": 162}
{"train_info/time_between_train_steps": 0.010923624038696289, "step": 162}
{"train_info/time_between_train_steps": 23.670746326446533, "step": 162}
{"info/global_step": 163, "train_info/time_within_train_step": 32.49798798561096, "step": 163}
{"train_info/time_between_train_steps": 0.005978107452392578, "step": 163}
{"info/global_step": 164, "train_info/time_within_train_step": 32.66934776306152, "step": 164}
{"train_info/time_between_train_steps": 0.00919795036315918, "step": 164}
{"info/global_step": 165, "train_info/time_within_train_step": 32.380778551101685, "step": 165}
{"train_info/time_between_train_steps": 0.008846521377563477, "step": 165}
{"info/global_step": 166, "train_info/time_within_train_step": 32.53283739089966, "step": 166}
{"train_info/time_between_train_steps": 0.0056416988372802734, "step": 166}
{"info/global_step": 167, "train_info/time_within_train_step": 32.4118378162384, "step": 167}
{"train_info/time_between_train_steps": 0.006047248840332031, "step": 167}
{"info/global_step": 168, "train_info/time_within_train_step": 32.40234327316284, "step": 168}
{"train_info/time_between_train_steps": 0.005459308624267578, "step": 168}
{"info/global_step": 169, "train_info/time_within_train_step": 32.781498432159424, "step": 169}
{"train_info/time_between_train_steps": 0.005761146545410156, "step": 169}
{"info/global_step": 170, "train_info/time_within_train_step": 32.497361183166504, "step": 170}
{"train_info/time_between_train_steps": 0.0056264400482177734, "step": 170}
{"info/global_step": 171, "train_info/time_within_train_step": 32.87142610549927, "step": 171}
{"train_info/time_between_train_steps": 0.0056362152099609375, "step": 171}
{"info/global_step": 172, "train_info/time_within_train_step": 32.49816298484802, "step": 172}
{"train_info/time_between_train_steps": 0.005283355712890625, "step": 172}
{"info/global_step": 173, "train_info/time_within_train_step": 32.57838678359985, "step": 173}
{"train_info/time_between_train_steps": 0.005427360534667969, "step": 173}
{"info/global_step": 174, "train_info/time_within_train_step": 32.45901417732239, "step": 174}
{"train_info/time_between_train_steps": 0.008009195327758789, "step": 174}
{"info/global_step": 175, "train_info/time_within_train_step": 32.41997408866882, "step": 175}
{"train_info/time_between_train_steps": 0.005824089050292969, "step": 175}
{"info/global_step": 176, "train_info/time_within_train_step": 32.353354692459106, "step": 176}
{"train_info/time_between_train_steps": 0.0055065155029296875, "step": 176}
{"info/global_step": 177, "train_info/time_within_train_step": 32.565218925476074, "step": 177}
{"train_info/time_between_train_steps": 0.010290384292602539, "step": 177}
{"info/global_step": 178, "train_info/time_within_train_step": 32.29863381385803, "step": 178}
{"train_info/time_between_train_steps": 0.005389213562011719, "step": 178}
{"info/global_step": 179, "train_info/time_within_train_step": 32.26189970970154, "step": 179}
{"train_info/time_between_train_steps": 0.010750055313110352, "step": 179}
{"info/global_step": 180, "train_info/time_within_train_step": 32.63847279548645, "step": 180}
{"train_info/time_between_train_steps": 0.011171579360961914, "step": 180}
{"info/global_step": 181, "train_info/time_within_train_step": 32.237446546554565, "step": 181}
{"train_info/time_between_train_steps": 0.010946035385131836, "step": 181}
{"info/global_step": 182, "train_info/time_within_train_step": 32.45562267303467, "step": 182}
{"train_info/time_between_train_steps": 0.005480051040649414, "step": 182}
{"info/global_step": 183, "train_info/time_within_train_step": 32.473384857177734, "step": 183}
{"train_info/time_between_train_steps": 0.011756420135498047, "step": 183}
{"info/global_step": 184, "train_info/time_within_train_step": 32.569047927856445, "step": 184}
{"train_info/time_between_train_steps": 0.005323886871337891, "step": 184}
{"info/global_step": 185, "train_info/time_within_train_step": 31.9078586101532, "step": 185}
{"train_info/time_between_train_steps": 0.005476236343383789, "step": 185}
{"info/global_step": 186, "train_info/time_within_train_step": 32.33596158027649, "step": 186}
{"train_info/time_between_train_steps": 0.005545139312744141, "step": 186}
{"info/global_step": 187, "train_info/time_within_train_step": 32.290727376937866, "step": 187}
{"train_info/time_between_train_steps": 0.0059206485748291016, "step": 187}
{"info/global_step": 188, "train_info/time_within_train_step": 32.642181396484375, "step": 188}
{"train_info/time_between_train_steps": 0.0057561397552490234, "step": 188}
{"info/global_step": 189, "train_info/time_within_train_step": 32.50485277175903, "step": 189}
{"train_info/time_between_train_steps": 0.00881195068359375, "step": 189}
{"train_info/time_between_train_steps": 24.419675827026367, "step": 189}
{"info/global_step": 190, "train_info/time_within_train_step": 32.577392578125, "step": 190}
{"train_info/time_between_train_steps": 0.0055773258209228516, "step": 190}
{"info/global_step": 191, "train_info/time_within_train_step": 32.401285886764526, "step": 191}
{"train_info/time_between_train_steps": 0.006231069564819336, "step": 191}
{"info/global_step": 192, "train_info/time_within_train_step": 32.3385112285614, "step": 192}
{"train_info/time_between_train_steps": 0.011219263076782227, "step": 192}
{"info/global_step": 193, "train_info/time_within_train_step": 32.450294971466064, "step": 193}
{"train_info/time_between_train_steps": 0.00623631477355957, "step": 193}
{"info/global_step": 194, "train_info/time_within_train_step": 32.467045307159424, "step": 194}
{"train_info/time_between_train_steps": 0.00757145881652832, "step": 194}
{"info/global_step": 195, "train_info/time_within_train_step": 32.38900399208069, "step": 195}
{"train_info/time_between_train_steps": 0.00587773323059082, "step": 195}
{"info/global_step": 196, "train_info/time_within_train_step": 32.37414884567261, "step": 196}
{"train_info/time_between_train_steps": 0.015440702438354492, "step": 196}
{"info/global_step": 197, "train_info/time_within_train_step": 32.627724409103394, "step": 197}
{"train_info/time_between_train_steps": 0.006155490875244141, "step": 197}
{"info/global_step": 198, "train_info/time_within_train_step": 32.42310857772827, "step": 198}
{"train_info/time_between_train_steps": 0.005555391311645508, "step": 198}
{"info/global_step": 199, "train_info/time_within_train_step": 32.3640456199646, "step": 199}
{"train_info/time_between_train_steps": 0.005375862121582031, "step": 199}
{"info/global_step": 200, "train_info/time_within_train_step": 32.40460276603699, "step": 200}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1733694163, "_runtime": 6669}, "step": 200}
{"logs": {"train/loss": 4.9219, "train/learning_rate": 0.0005555555555555556, "train/epoch": 7.01, "_timestamp": 1733694163, "_runtime": 6669}, "step": 200}
{"train_info/time_between_train_steps": 2.501081705093384, "step": 200}
{"info/global_step": 201, "train_info/time_within_train_step": 32.51926374435425, "step": 201}
{"train_info/time_between_train_steps": 0.005820512771606445, "step": 201}
{"info/global_step": 202, "train_info/time_within_train_step": 32.31741952896118, "step": 202}
{"train_info/time_between_train_steps": 0.005653858184814453, "step": 202}
{"info/global_step": 203, "train_info/time_within_train_step": 32.423625469207764, "step": 203}
{"train_info/time_between_train_steps": 0.005642414093017578, "step": 203}
{"info/global_step": 204, "train_info/time_within_train_step": 32.70672416687012, "step": 204}
{"train_info/time_between_train_steps": 0.01048588752746582, "step": 204}
{"info/global_step": 205, "train_info/time_within_train_step": 32.43717050552368, "step": 205}
{"train_info/time_between_train_steps": 0.0057239532470703125, "step": 205}
{"info/global_step": 206, "train_info/time_within_train_step": 32.15246343612671, "step": 206}
{"train_info/time_between_train_steps": 0.0059010982513427734, "step": 206}
{"info/global_step": 207, "train_info/time_within_train_step": 32.498090505599976, "step": 207}
{"train_info/time_between_train_steps": 0.005867481231689453, "step": 207}
{"info/global_step": 208, "train_info/time_within_train_step": 32.754719257354736, "step": 208}
{"train_info/time_between_train_steps": 0.005751371383666992, "step": 208}
{"info/global_step": 209, "train_info/time_within_train_step": 32.35574674606323, "step": 209}
{"train_info/time_between_train_steps": 0.0057299137115478516, "step": 209}
{"info/global_step": 210, "train_info/time_within_train_step": 32.56430697441101, "step": 210}
{"train_info/time_between_train_steps": 0.005669593811035156, "step": 210}
{"info/global_step": 211, "train_info/time_within_train_step": 32.781561613082886, "step": 211}
{"train_info/time_between_train_steps": 0.005735158920288086, "step": 211}
{"info/global_step": 212, "train_info/time_within_train_step": 32.66396617889404, "step": 212}
{"train_info/time_between_train_steps": 0.010883569717407227, "step": 212}
{"info/global_step": 213, "train_info/time_within_train_step": 32.24815082550049, "step": 213}
{"train_info/time_between_train_steps": 0.011667251586914062, "step": 213}
{"info/global_step": 214, "train_info/time_within_train_step": 32.4153413772583, "step": 214}
{"train_info/time_between_train_steps": 0.00606846809387207, "step": 214}
{"info/global_step": 215, "train_info/time_within_train_step": 32.62559747695923, "step": 215}
{"train_info/time_between_train_steps": 0.006456851959228516, "step": 215}
{"info/global_step": 216, "train_info/time_within_train_step": 32.145156383514404, "step": 216}
{"train_info/time_between_train_steps": 0.006157875061035156, "step": 216}
{"train_info/time_between_train_steps": 23.555867433547974, "step": 216}
{"info/global_step": 217, "train_info/time_within_train_step": 32.694085121154785, "step": 217}
{"train_info/time_between_train_steps": 0.0054476261138916016, "step": 217}
{"info/global_step": 218, "train_info/time_within_train_step": 32.64172315597534, "step": 218}
{"train_info/time_between_train_steps": 0.0053560733795166016, "step": 218}
{"info/global_step": 219, "train_info/time_within_train_step": 32.30480098724365, "step": 219}
{"train_info/time_between_train_steps": 0.008550167083740234, "step": 219}
{"info/global_step": 220, "train_info/time_within_train_step": 32.45453858375549, "step": 220}
{"train_info/time_between_train_steps": 0.010412454605102539, "step": 220}
{"info/global_step": 221, "train_info/time_within_train_step": 32.26173758506775, "step": 221}
{"train_info/time_between_train_steps": 0.009369373321533203, "step": 221}
{"info/global_step": 222, "train_info/time_within_train_step": 32.53485989570618, "step": 222}
{"train_info/time_between_train_steps": 0.005616903305053711, "step": 222}
{"info/global_step": 223, "train_info/time_within_train_step": 32.39740705490112, "step": 223}
{"train_info/time_between_train_steps": 0.0051517486572265625, "step": 223}
{"info/global_step": 224, "train_info/time_within_train_step": 32.55450940132141, "step": 224}
{"train_info/time_between_train_steps": 0.005318641662597656, "step": 224}
{"info/global_step": 225, "train_info/time_within_train_step": 32.42094564437866, "step": 225}
{"train_info/time_between_train_steps": 0.005766391754150391, "step": 225}
{"info/global_step": 226, "train_info/time_within_train_step": 32.45213341712952, "step": 226}
{"train_info/time_between_train_steps": 0.005146980285644531, "step": 226}
{"info/global_step": 227, "train_info/time_within_train_step": 32.276522397994995, "step": 227}
{"train_info/time_between_train_steps": 0.01004171371459961, "step": 227}
{"info/global_step": 228, "train_info/time_within_train_step": 32.63637661933899, "step": 228}
{"train_info/time_between_train_steps": 0.010256290435791016, "step": 228}
{"info/global_step": 229, "train_info/time_within_train_step": 32.591525077819824, "step": 229}
{"train_info/time_between_train_steps": 0.005024909973144531, "step": 229}
{"info/global_step": 230, "train_info/time_within_train_step": 32.632859230041504, "step": 230}
{"train_info/time_between_train_steps": 0.005188703536987305, "step": 230}
{"info/global_step": 231, "train_info/time_within_train_step": 32.167293548583984, "step": 231}
{"train_info/time_between_train_steps": 0.005347490310668945, "step": 231}
{"info/global_step": 232, "train_info/time_within_train_step": 32.04650592803955, "step": 232}
{"train_info/time_between_train_steps": 0.009997844696044922, "step": 232}
{"info/global_step": 233, "train_info/time_within_train_step": 32.33018350601196, "step": 233}
{"train_info/time_between_train_steps": 0.010453462600708008, "step": 233}
{"info/global_step": 234, "train_info/time_within_train_step": 32.10135817527771, "step": 234}
{"train_info/time_between_train_steps": 0.005101442337036133, "step": 234}
{"info/global_step": 235, "train_info/time_within_train_step": 32.27740120887756, "step": 235}
{"train_info/time_between_train_steps": 0.005235195159912109, "step": 235}
{"info/global_step": 236, "train_info/time_within_train_step": 32.37502121925354, "step": 236}
{"train_info/time_between_train_steps": 0.00535130500793457, "step": 236}
{"info/global_step": 237, "train_info/time_within_train_step": 32.39889979362488, "step": 237}
{"train_info/time_between_train_steps": 0.005326509475708008, "step": 237}
{"info/global_step": 238, "train_info/time_within_train_step": 32.399428844451904, "step": 238}
{"train_info/time_between_train_steps": 0.005362272262573242, "step": 238}
{"info/global_step": 239, "train_info/time_within_train_step": 32.551642656326294, "step": 239}
{"train_info/time_between_train_steps": 0.005224704742431641, "step": 239}
{"info/global_step": 240, "train_info/time_within_train_step": 32.39025163650513, "step": 240}
{"train_info/time_between_train_steps": 0.011473655700683594, "step": 240}
{"info/global_step": 241, "train_info/time_within_train_step": 32.64253282546997, "step": 241}
{"train_info/time_between_train_steps": 0.005532264709472656, "step": 241}
{"info/global_step": 242, "train_info/time_within_train_step": 31.981594800949097, "step": 242}
{"train_info/time_between_train_steps": 0.007395744323730469, "step": 242}
{"info/global_step": 243, "train_info/time_within_train_step": 32.469701528549194, "step": 243}
{"train_info/time_between_train_steps": 0.009227514266967773, "step": 243}
{"train_info/time_between_train_steps": 23.7015643119812, "step": 243}
{"info/global_step": 244, "train_info/time_within_train_step": 32.4140899181366, "step": 244}
{"train_info/time_between_train_steps": 0.005132436752319336, "step": 244}
{"info/global_step": 245, "train_info/time_within_train_step": 32.34044313430786, "step": 245}
{"train_info/time_between_train_steps": 0.00828242301940918, "step": 245}
{"info/global_step": 246, "train_info/time_within_train_step": 32.22316002845764, "step": 246}
{"train_info/time_between_train_steps": 0.0054776668548583984, "step": 246}
{"info/global_step": 247, "train_info/time_within_train_step": 32.748966217041016, "step": 247}
{"train_info/time_between_train_steps": 0.0054552555084228516, "step": 247}
{"info/global_step": 248, "train_info/time_within_train_step": 32.33254432678223, "step": 248}
{"train_info/time_between_train_steps": 0.005776166915893555, "step": 248}
{"info/global_step": 249, "train_info/time_within_train_step": 32.16154646873474, "step": 249}
{"train_info/time_between_train_steps": 0.009700775146484375, "step": 249}
{"info/global_step": 250, "train_info/time_within_train_step": 32.586970806121826, "step": 250}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1733695835, "_runtime": 8341}, "step": 250}
{"logs": {"train/loss": 4.7815, "train/learning_rate": 0.0005277777777777777, "train/epoch": 9.01, "_timestamp": 1733695835, "_runtime": 8341}, "step": 250}
{"train_info/time_between_train_steps": 0.007583141326904297, "step": 250}
{"info/global_step": 251, "train_info/time_within_train_step": 32.493483543395996, "step": 251}
{"train_info/time_between_train_steps": 0.005215644836425781, "step": 251}
{"info/global_step": 252, "train_info/time_within_train_step": 32.69473218917847, "step": 252}
{"train_info/time_between_train_steps": 0.005066633224487305, "step": 252}
{"info/global_step": 253, "train_info/time_within_train_step": 32.149529457092285, "step": 253}
{"train_info/time_between_train_steps": 0.005276918411254883, "step": 253}
{"info/global_step": 254, "train_info/time_within_train_step": 32.24671721458435, "step": 254}
{"train_info/time_between_train_steps": 0.0051822662353515625, "step": 254}
{"info/global_step": 255, "train_info/time_within_train_step": 32.539634704589844, "step": 255}
{"train_info/time_between_train_steps": 0.0051116943359375, "step": 255}
{"info/global_step": 256, "train_info/time_within_train_step": 32.50719618797302, "step": 256}
{"train_info/time_between_train_steps": 0.005310535430908203, "step": 256}
{"info/global_step": 257, "train_info/time_within_train_step": 32.17264461517334, "step": 257}
{"train_info/time_between_train_steps": 0.007485389709472656, "step": 257}
{"info/global_step": 258, "train_info/time_within_train_step": 32.29588747024536, "step": 258}
{"train_info/time_between_train_steps": 0.00526118278503418, "step": 258}
{"info/global_step": 259, "train_info/time_within_train_step": 32.55680704116821, "step": 259}
{"train_info/time_between_train_steps": 0.010158300399780273, "step": 259}
{"info/global_step": 260, "train_info/time_within_train_step": 32.506256103515625, "step": 260}
{"train_info/time_between_train_steps": 0.00542140007019043, "step": 260}
{"info/global_step": 261, "train_info/time_within_train_step": 32.13860368728638, "step": 261}
{"train_info/time_between_train_steps": 0.005172252655029297, "step": 261}
{"info/global_step": 262, "train_info/time_within_train_step": 32.34112811088562, "step": 262}
{"train_info/time_between_train_steps": 0.00523829460144043, "step": 262}
{"info/global_step": 263, "train_info/time_within_train_step": 32.575992822647095, "step": 263}
{"train_info/time_between_train_steps": 0.005141019821166992, "step": 263}
{"info/global_step": 264, "train_info/time_within_train_step": 32.405596017837524, "step": 264}
{"train_info/time_between_train_steps": 0.007681608200073242, "step": 264}
{"info/global_step": 265, "train_info/time_within_train_step": 32.305986642837524, "step": 265}
{"train_info/time_between_train_steps": 0.0066928863525390625, "step": 265}
{"info/global_step": 266, "train_info/time_within_train_step": 32.58982229232788, "step": 266}
{"train_info/time_between_train_steps": 0.005150556564331055, "step": 266}
{"info/global_step": 267, "train_info/time_within_train_step": 32.411648750305176, "step": 267}
{"train_info/time_between_train_steps": 0.005353689193725586, "step": 267}
{"info/global_step": 268, "train_info/time_within_train_step": 32.330849409103394, "step": 268}
{"train_info/time_between_train_steps": 0.005408763885498047, "step": 268}
{"info/global_step": 269, "train_info/time_within_train_step": 32.246145248413086, "step": 269}
{"train_info/time_between_train_steps": 0.010528087615966797, "step": 269}
{"info/global_step": 270, "train_info/time_within_train_step": 32.24973511695862, "step": 270}
{"train_info/time_between_train_steps": 0.0056612491607666016, "step": 270}
{"train_info/time_between_train_steps": 24.005107879638672, "step": 270}
{"info/global_step": 271, "train_info/time_within_train_step": 32.528809785842896, "step": 271}
{"train_info/time_between_train_steps": 0.0051097869873046875, "step": 271}
{"info/global_step": 272, "train_info/time_within_train_step": 32.77389717102051, "step": 272}
{"train_info/time_between_train_steps": 0.005402565002441406, "step": 272}
{"info/global_step": 273, "train_info/time_within_train_step": 32.254085540771484, "step": 273}
{"train_info/time_between_train_steps": 0.019589900970458984, "step": 273}
{"info/global_step": 274, "train_info/time_within_train_step": 32.80850863456726, "step": 274}
{"train_info/time_between_train_steps": 0.013438940048217773, "step": 274}
{"info/global_step": 275, "train_info/time_within_train_step": 32.62053155899048, "step": 275}
{"train_info/time_between_train_steps": 0.005974292755126953, "step": 275}
{"info/global_step": 276, "train_info/time_within_train_step": 32.6808876991272, "step": 276}
{"train_info/time_between_train_steps": 0.018045425415039062, "step": 276}
{"info/global_step": 277, "train_info/time_within_train_step": 32.134827852249146, "step": 277}
{"train_info/time_between_train_steps": 0.010959148406982422, "step": 277}
{"info/global_step": 278, "train_info/time_within_train_step": 32.39870500564575, "step": 278}
{"train_info/time_between_train_steps": 0.00542759895324707, "step": 278}
{"info/global_step": 279, "train_info/time_within_train_step": 32.57310652732849, "step": 279}
{"train_info/time_between_train_steps": 0.005521535873413086, "step": 279}
{"info/global_step": 280, "train_info/time_within_train_step": 32.49414277076721, "step": 280}
{"train_info/time_between_train_steps": 0.005219697952270508, "step": 280}
{"info/global_step": 281, "train_info/time_within_train_step": 32.08818078041077, "step": 281}
{"train_info/time_between_train_steps": 0.005254268646240234, "step": 281}
{"info/global_step": 282, "train_info/time_within_train_step": 32.37484836578369, "step": 282}
{"train_info/time_between_train_steps": 0.005243778228759766, "step": 282}
{"info/global_step": 283, "train_info/time_within_train_step": 32.420653104782104, "step": 283}
{"train_info/time_between_train_steps": 0.00768589973449707, "step": 283}
{"info/global_step": 284, "train_info/time_within_train_step": 32.282864570617676, "step": 284}
{"train_info/time_between_train_steps": 0.0054073333740234375, "step": 284}
{"info/global_step": 285, "train_info/time_within_train_step": 32.273990869522095, "step": 285}
{"train_info/time_between_train_steps": 0.009600162506103516, "step": 285}
{"info/global_step": 286, "train_info/time_within_train_step": 32.53428769111633, "step": 286}
{"train_info/time_between_train_steps": 0.010319232940673828, "step": 286}
{"info/global_step": 287, "train_info/time_within_train_step": 32.482757568359375, "step": 287}
{"train_info/time_between_train_steps": 0.010318279266357422, "step": 287}
{"info/global_step": 288, "train_info/time_within_train_step": 32.2037398815155, "step": 288}
{"train_info/time_between_train_steps": 0.005185365676879883, "step": 288}
{"info/global_step": 289, "train_info/time_within_train_step": 32.28483724594116, "step": 289}
{"train_info/time_between_train_steps": 0.005261421203613281, "step": 289}
{"info/global_step": 290, "train_info/time_within_train_step": 32.32819890975952, "step": 290}
{"train_info/time_between_train_steps": 0.0051920413970947266, "step": 290}
{"info/global_step": 291, "train_info/time_within_train_step": 32.33924579620361, "step": 291}
{"train_info/time_between_train_steps": 0.005350351333618164, "step": 291}
{"info/global_step": 292, "train_info/time_within_train_step": 32.35774207115173, "step": 292}
{"train_info/time_between_train_steps": 0.005487918853759766, "step": 292}
{"info/global_step": 293, "train_info/time_within_train_step": 32.59755825996399, "step": 293}
{"train_info/time_between_train_steps": 0.010126352310180664, "step": 293}
{"info/global_step": 294, "train_info/time_within_train_step": 32.09001803398132, "step": 294}
{"train_info/time_between_train_steps": 0.005410909652709961, "step": 294}
{"info/global_step": 295, "train_info/time_within_train_step": 32.48085856437683, "step": 295}
{"train_info/time_between_train_steps": 0.008847951889038086, "step": 295}
{"info/global_step": 296, "train_info/time_within_train_step": 32.70277762413025, "step": 296}
{"train_info/time_between_train_steps": 0.0057430267333984375, "step": 296}
{"info/global_step": 297, "train_info/time_within_train_step": 32.3166618347168, "step": 297}
{"train_info/time_between_train_steps": 0.01076054573059082, "step": 297}
{"train_info/time_between_train_steps": 23.450214624404907, "step": 297}
{"info/global_step": 298, "train_info/time_within_train_step": 32.43792366981506, "step": 298}
{"train_info/time_between_train_steps": 0.0057201385498046875, "step": 298}
{"info/global_step": 299, "train_info/time_within_train_step": 33.02242112159729, "step": 299}
{"train_info/time_between_train_steps": 0.0053119659423828125, "step": 299}
{"info/global_step": 300, "train_info/time_within_train_step": 32.35365891456604, "step": 300}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1733697504, "_runtime": 10010}, "step": 300}
{"logs": {"train/loss": 4.6493, "train/learning_rate": 0.0005, "train/epoch": 11.0, "_timestamp": 1733697504, "_runtime": 10010}, "step": 300}
{"train_info/time_between_train_steps": 2.443493604660034, "step": 300}
{"info/global_step": 301, "train_info/time_within_train_step": 32.437798261642456, "step": 301}
{"train_info/time_between_train_steps": 0.005480766296386719, "step": 301}
{"info/global_step": 302, "train_info/time_within_train_step": 32.60413122177124, "step": 302}
{"train_info/time_between_train_steps": 0.006064414978027344, "step": 302}
{"info/global_step": 303, "train_info/time_within_train_step": 32.586238622665405, "step": 303}
{"train_info/time_between_train_steps": 0.0054798126220703125, "step": 303}
{"info/global_step": 304, "train_info/time_within_train_step": 32.526628255844116, "step": 304}
{"train_info/time_between_train_steps": 0.010885000228881836, "step": 304}
{"info/global_step": 305, "train_info/time_within_train_step": 32.532477617263794, "step": 305}
{"train_info/time_between_train_steps": 0.005549430847167969, "step": 305}
{"info/global_step": 306, "train_info/time_within_train_step": 32.56254291534424, "step": 306}
{"train_info/time_between_train_steps": 0.015432596206665039, "step": 306}
{"info/global_step": 307, "train_info/time_within_train_step": 32.66433143615723, "step": 307}
{"train_info/time_between_train_steps": 0.005274534225463867, "step": 307}
{"info/global_step": 308, "train_info/time_within_train_step": 32.59117913246155, "step": 308}
{"train_info/time_between_train_steps": 0.005158662796020508, "step": 308}
{"info/global_step": 309, "train_info/time_within_train_step": 32.50848197937012, "step": 309}
{"train_info/time_between_train_steps": 0.0054187774658203125, "step": 309}
{"info/global_step": 310, "train_info/time_within_train_step": 32.38107872009277, "step": 310}
{"train_info/time_between_train_steps": 0.010169506072998047, "step": 310}
{"info/global_step": 311, "train_info/time_within_train_step": 32.66692042350769, "step": 311}
{"train_info/time_between_train_steps": 0.0054852962493896484, "step": 311}
{"info/global_step": 312, "train_info/time_within_train_step": 32.735755443573, "step": 312}
{"train_info/time_between_train_steps": 0.010424375534057617, "step": 312}
{"info/global_step": 313, "train_info/time_within_train_step": 32.73018527030945, "step": 313}
{"train_info/time_between_train_steps": 0.008273601531982422, "step": 313}
{"info/global_step": 314, "train_info/time_within_train_step": 32.29290199279785, "step": 314}
{"train_info/time_between_train_steps": 0.005400657653808594, "step": 314}
{"info/global_step": 315, "train_info/time_within_train_step": 32.48679184913635, "step": 315}
{"train_info/time_between_train_steps": 0.005323648452758789, "step": 315}
{"info/global_step": 316, "train_info/time_within_train_step": 32.630892515182495, "step": 316}
{"train_info/time_between_train_steps": 0.0080718994140625, "step": 316}
{"info/global_step": 317, "train_info/time_within_train_step": 32.54364776611328, "step": 317}
{"train_info/time_between_train_steps": 0.005285739898681641, "step": 317}
{"info/global_step": 318, "train_info/time_within_train_step": 32.550410747528076, "step": 318}
{"train_info/time_between_train_steps": 0.005470991134643555, "step": 318}
{"info/global_step": 319, "train_info/time_within_train_step": 32.4919593334198, "step": 319}
{"train_info/time_between_train_steps": 0.005407810211181641, "step": 319}
{"info/global_step": 320, "train_info/time_within_train_step": 32.57850527763367, "step": 320}
{"train_info/time_between_train_steps": 0.005412101745605469, "step": 320}
{"info/global_step": 321, "train_info/time_within_train_step": 32.68901348114014, "step": 321}
{"train_info/time_between_train_steps": 0.00783228874206543, "step": 321}
{"info/global_step": 322, "train_info/time_within_train_step": 32.68795871734619, "step": 322}
{"train_info/time_between_train_steps": 0.008895635604858398, "step": 322}
{"info/global_step": 323, "train_info/time_within_train_step": 32.434333086013794, "step": 323}
{"train_info/time_between_train_steps": 0.006007194519042969, "step": 323}
{"info/global_step": 324, "train_info/time_within_train_step": 32.47243690490723, "step": 324}
{"train_info/time_between_train_steps": 0.007821321487426758, "step": 324}
{"train_info/time_between_train_steps": 23.699759483337402, "step": 324}
{"info/global_step": 325, "train_info/time_within_train_step": 32.76911163330078, "step": 325}
{"train_info/time_between_train_steps": 0.016160964965820312, "step": 325}
{"info/global_step": 326, "train_info/time_within_train_step": 32.21050238609314, "step": 326}
{"train_info/time_between_train_steps": 0.0053975582122802734, "step": 326}
{"info/global_step": 327, "train_info/time_within_train_step": 32.398765563964844, "step": 327}
{"train_info/time_between_train_steps": 0.005372524261474609, "step": 327}
{"info/global_step": 328, "train_info/time_within_train_step": 32.592416286468506, "step": 328}
{"train_info/time_between_train_steps": 0.009860992431640625, "step": 328}
{"info/global_step": 329, "train_info/time_within_train_step": 32.48257565498352, "step": 329}
{"train_info/time_between_train_steps": 0.008361577987670898, "step": 329}
{"info/global_step": 330, "train_info/time_within_train_step": 32.36395525932312, "step": 330}
{"train_info/time_between_train_steps": 0.012162446975708008, "step": 330}
{"info/global_step": 331, "train_info/time_within_train_step": 32.479568004608154, "step": 331}
{"train_info/time_between_train_steps": 0.005822181701660156, "step": 331}
{"info/global_step": 332, "train_info/time_within_train_step": 32.587780237197876, "step": 332}
{"train_info/time_between_train_steps": 0.008799076080322266, "step": 332}
{"info/global_step": 333, "train_info/time_within_train_step": 32.78673458099365, "step": 333}
{"train_info/time_between_train_steps": 0.010161876678466797, "step": 333}
{"info/global_step": 334, "train_info/time_within_train_step": 32.75552797317505, "step": 334}
{"train_info/time_between_train_steps": 0.005127429962158203, "step": 334}
{"info/global_step": 335, "train_info/time_within_train_step": 32.33199429512024, "step": 335}
{"train_info/time_between_train_steps": 0.005248308181762695, "step": 335}
{"info/global_step": 336, "train_info/time_within_train_step": 32.50639843940735, "step": 336}
{"train_info/time_between_train_steps": 0.005275726318359375, "step": 336}
{"info/global_step": 337, "train_info/time_within_train_step": 32.70723032951355, "step": 337}
{"train_info/time_between_train_steps": 0.005279541015625, "step": 337}
{"info/global_step": 338, "train_info/time_within_train_step": 32.33006477355957, "step": 338}
{"train_info/time_between_train_steps": 0.0070111751556396484, "step": 338}
{"info/global_step": 339, "train_info/time_within_train_step": 32.172741413116455, "step": 339}
{"train_info/time_between_train_steps": 0.005442380905151367, "step": 339}
{"info/global_step": 340, "train_info/time_within_train_step": 32.387470722198486, "step": 340}
{"train_info/time_between_train_steps": 0.005304813385009766, "step": 340}
{"info/global_step": 341, "train_info/time_within_train_step": 32.38851356506348, "step": 341}
{"train_info/time_between_train_steps": 0.005470991134643555, "step": 341}
{"info/global_step": 342, "train_info/time_within_train_step": 32.59941482543945, "step": 342}
{"train_info/time_between_train_steps": 0.0052754878997802734, "step": 342}
{"info/global_step": 343, "train_info/time_within_train_step": 32.411309242248535, "step": 343}
{"train_info/time_between_train_steps": 0.005178689956665039, "step": 343}
{"info/global_step": 344, "train_info/time_within_train_step": 32.127031564712524, "step": 344}
{"train_info/time_between_train_steps": 0.0065670013427734375, "step": 344}
{"info/global_step": 345, "train_info/time_within_train_step": 32.33880400657654, "step": 345}
{"train_info/time_between_train_steps": 0.005088090896606445, "step": 345}
{"info/global_step": 346, "train_info/time_within_train_step": 32.2820348739624, "step": 346}
{"train_info/time_between_train_steps": 0.005359649658203125, "step": 346}
{"info/global_step": 347, "train_info/time_within_train_step": 32.610384464263916, "step": 347}
{"train_info/time_between_train_steps": 0.005284786224365234, "step": 347}
{"info/global_step": 348, "train_info/time_within_train_step": 32.30148148536682, "step": 348}
{"train_info/time_between_train_steps": 0.005778789520263672, "step": 348}
{"info/global_step": 349, "train_info/time_within_train_step": 32.38583707809448, "step": 349}
{"train_info/time_between_train_steps": 0.01064157485961914, "step": 349}
{"info/global_step": 350, "train_info/time_within_train_step": 32.25187349319458, "step": 350}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1733699155, "_runtime": 11661}, "step": 350}
{"logs": {"train/loss": 4.4128, "train/learning_rate": 0.00047222222222222224, "train/epoch": 12.02, "_timestamp": 1733699155, "_runtime": 11661}, "step": 350}
{"train_info/time_between_train_steps": 0.012549161911010742, "step": 350}
{"info/global_step": 351, "train_info/time_within_train_step": 32.71546292304993, "step": 351}
{"train_info/time_between_train_steps": 0.005639314651489258, "step": 351}
{"train_info/time_between_train_steps": 23.599206924438477, "step": 351}
{"info/global_step": 352, "train_info/time_within_train_step": 32.44250464439392, "step": 352}
{"train_info/time_between_train_steps": 0.0056896209716796875, "step": 352}
{"info/global_step": 353, "train_info/time_within_train_step": 32.57051062583923, "step": 353}
{"train_info/time_between_train_steps": 0.005604743957519531, "step": 353}
{"info/global_step": 354, "train_info/time_within_train_step": 32.573174715042114, "step": 354}
{"train_info/time_between_train_steps": 0.005310535430908203, "step": 354}
{"info/global_step": 355, "train_info/time_within_train_step": 32.664777755737305, "step": 355}
{"train_info/time_between_train_steps": 0.01047205924987793, "step": 355}
{"info/global_step": 356, "train_info/time_within_train_step": 32.55393362045288, "step": 356}
{"train_info/time_between_train_steps": 0.005239248275756836, "step": 356}
{"info/global_step": 357, "train_info/time_within_train_step": 32.28160214424133, "step": 357}
{"train_info/time_between_train_steps": 0.0055789947509765625, "step": 357}
{"info/global_step": 358, "train_info/time_within_train_step": 32.47785186767578, "step": 358}
{"train_info/time_between_train_steps": 0.0057718753814697266, "step": 358}
{"info/global_step": 359, "train_info/time_within_train_step": 32.74133539199829, "step": 359}
{"train_info/time_between_train_steps": 0.005470991134643555, "step": 359}
{"info/global_step": 360, "train_info/time_within_train_step": 32.55565071105957, "step": 360}
{"train_info/time_between_train_steps": 0.005366802215576172, "step": 360}
{"info/global_step": 361, "train_info/time_within_train_step": 32.7644157409668, "step": 361}
{"train_info/time_between_train_steps": 0.005482912063598633, "step": 361}
{"info/global_step": 362, "train_info/time_within_train_step": 32.40821170806885, "step": 362}
{"train_info/time_between_train_steps": 0.0054132938385009766, "step": 362}
{"info/global_step": 363, "train_info/time_within_train_step": 32.481738328933716, "step": 363}
{"train_info/time_between_train_steps": 0.005352973937988281, "step": 363}
{"info/global_step": 364, "train_info/time_within_train_step": 32.472020387649536, "step": 364}
{"train_info/time_between_train_steps": 0.010319709777832031, "step": 364}
{"info/global_step": 365, "train_info/time_within_train_step": 32.579925775527954, "step": 365}
{"train_info/time_between_train_steps": 0.005471467971801758, "step": 365}
{"info/global_step": 366, "train_info/time_within_train_step": 32.2835111618042, "step": 366}
{"train_info/time_between_train_steps": 0.0052759647369384766, "step": 366}
{"info/global_step": 367, "train_info/time_within_train_step": 32.28908920288086, "step": 367}
{"train_info/time_between_train_steps": 0.005265474319458008, "step": 367}
{"info/global_step": 368, "train_info/time_within_train_step": 32.27126622200012, "step": 368}
{"train_info/time_between_train_steps": 0.0053174495697021484, "step": 368}
{"info/global_step": 369, "train_info/time_within_train_step": 32.52360939979553, "step": 369}
{"train_info/time_between_train_steps": 0.005132913589477539, "step": 369}
{"info/global_step": 370, "train_info/time_within_train_step": 32.7398362159729, "step": 370}
{"train_info/time_between_train_steps": 0.005318641662597656, "step": 370}
{"info/global_step": 371, "train_info/time_within_train_step": 32.317169189453125, "step": 371}
{"train_info/time_between_train_steps": 0.010139703750610352, "step": 371}
{"info/global_step": 372, "train_info/time_within_train_step": 32.54671359062195, "step": 372}
{"train_info/time_between_train_steps": 0.010082483291625977, "step": 372}
{"info/global_step": 373, "train_info/time_within_train_step": 32.50788760185242, "step": 373}
{"train_info/time_between_train_steps": 0.007486104965209961, "step": 373}
{"info/global_step": 374, "train_info/time_within_train_step": 32.490031719207764, "step": 374}
{"train_info/time_between_train_steps": 0.005684375762939453, "step": 374}
{"info/global_step": 375, "train_info/time_within_train_step": 32.7070791721344, "step": 375}
{"train_info/time_between_train_steps": 0.005922794342041016, "step": 375}
{"info/global_step": 376, "train_info/time_within_train_step": 32.401795864105225, "step": 376}
{"train_info/time_between_train_steps": 0.005727291107177734, "step": 376}
{"info/global_step": 377, "train_info/time_within_train_step": 32.7458176612854, "step": 377}
{"train_info/time_between_train_steps": 0.005722522735595703, "step": 377}
{"info/global_step": 378, "train_info/time_within_train_step": 32.693368911743164, "step": 378}
{"train_info/time_between_train_steps": 0.005852699279785156, "step": 378}
{"train_info/time_between_train_steps": 23.50010323524475, "step": 378}
{"info/global_step": 379, "train_info/time_within_train_step": 32.699424505233765, "step": 379}
{"train_info/time_between_train_steps": 0.011150360107421875, "step": 379}
{"info/global_step": 380, "train_info/time_within_train_step": 32.78534007072449, "step": 380}
{"train_info/time_between_train_steps": 0.005563497543334961, "step": 380}
{"info/global_step": 381, "train_info/time_within_train_step": 32.4865403175354, "step": 381}
{"train_info/time_between_train_steps": 0.00531005859375, "step": 381}
{"info/global_step": 382, "train_info/time_within_train_step": 32.676581382751465, "step": 382}
{"train_info/time_between_train_steps": 0.00547480583190918, "step": 382}
{"info/global_step": 383, "train_info/time_within_train_step": 32.69442558288574, "step": 383}
{"train_info/time_between_train_steps": 0.005573272705078125, "step": 383}
{"info/global_step": 384, "train_info/time_within_train_step": 32.775251388549805, "step": 384}
{"train_info/time_between_train_steps": 0.005351066589355469, "step": 384}
{"info/global_step": 385, "train_info/time_within_train_step": 32.50159239768982, "step": 385}
{"train_info/time_between_train_steps": 0.007616996765136719, "step": 385}
{"info/global_step": 386, "train_info/time_within_train_step": 32.71977400779724, "step": 386}
{"train_info/time_between_train_steps": 0.005327939987182617, "step": 386}
{"info/global_step": 387, "train_info/time_within_train_step": 32.65986251831055, "step": 387}
{"train_info/time_between_train_steps": 0.007458686828613281, "step": 387}
{"info/global_step": 388, "train_info/time_within_train_step": 32.563969135284424, "step": 388}
{"train_info/time_between_train_steps": 0.007226228713989258, "step": 388}
{"info/global_step": 389, "train_info/time_within_train_step": 32.445627212524414, "step": 389}
{"train_info/time_between_train_steps": 0.005164146423339844, "step": 389}
{"info/global_step": 390, "train_info/time_within_train_step": 32.27331066131592, "step": 390}
{"train_info/time_between_train_steps": 0.00512385368347168, "step": 390}
{"info/global_step": 391, "train_info/time_within_train_step": 32.449904441833496, "step": 391}
{"train_info/time_between_train_steps": 0.00863337516784668, "step": 391}
{"info/global_step": 392, "train_info/time_within_train_step": 32.22465777397156, "step": 392}
{"train_info/time_between_train_steps": 0.005341529846191406, "step": 392}
{"info/global_step": 393, "train_info/time_within_train_step": 32.29384398460388, "step": 393}
{"train_info/time_between_train_steps": 0.005263566970825195, "step": 393}
{"info/global_step": 394, "train_info/time_within_train_step": 31.914151191711426, "step": 394}
{"train_info/time_between_train_steps": 0.005298137664794922, "step": 394}
{"info/global_step": 395, "train_info/time_within_train_step": 32.13217258453369, "step": 395}
{"train_info/time_between_train_steps": 0.005208730697631836, "step": 395}
{"info/global_step": 396, "train_info/time_within_train_step": 32.39009690284729, "step": 396}
{"train_info/time_between_train_steps": 0.005285978317260742, "step": 396}
{"info/global_step": 397, "train_info/time_within_train_step": 32.56088185310364, "step": 397}
{"train_info/time_between_train_steps": 0.005259275436401367, "step": 397}
{"info/global_step": 398, "train_info/time_within_train_step": 32.6872832775116, "step": 398}
{"train_info/time_between_train_steps": 0.010202169418334961, "step": 398}
{"info/global_step": 399, "train_info/time_within_train_step": 32.07564401626587, "step": 399}
{"train_info/time_between_train_steps": 0.00559544563293457, "step": 399}
{"info/global_step": 400, "train_info/time_within_train_step": 32.422640800476074, "step": 400}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1733700828, "_runtime": 13334}, "step": 400}
{"logs": {"train/loss": 4.2741, "train/learning_rate": 0.00044444444444444436, "train/epoch": 14.02, "_timestamp": 1733700828, "_runtime": 13334}, "step": 400}
{"train_info/time_between_train_steps": 2.582751750946045, "step": 400}
{"info/global_step": 401, "train_info/time_within_train_step": 32.392059564590454, "step": 401}
{"train_info/time_between_train_steps": 0.005143880844116211, "step": 401}
{"info/global_step": 402, "train_info/time_within_train_step": 32.22800350189209, "step": 402}
{"train_info/time_between_train_steps": 0.005624055862426758, "step": 402}
{"info/global_step": 403, "train_info/time_within_train_step": 32.02459192276001, "step": 403}
{"train_info/time_between_train_steps": 0.0052378177642822266, "step": 403}
{"info/global_step": 404, "train_info/time_within_train_step": 32.58956503868103, "step": 404}
{"train_info/time_between_train_steps": 0.005676984786987305, "step": 404}
{"info/global_step": 405, "train_info/time_within_train_step": 32.24957895278931, "step": 405}
{"train_info/time_between_train_steps": 0.0056073665618896484, "step": 405}
{"train_info/time_between_train_steps": 23.350337982177734, "step": 405}
{"info/global_step": 406, "train_info/time_within_train_step": 32.68146085739136, "step": 406}
{"train_info/time_between_train_steps": 0.010431051254272461, "step": 406}
{"info/global_step": 407, "train_info/time_within_train_step": 32.50228524208069, "step": 407}
{"train_info/time_between_train_steps": 0.0054547786712646484, "step": 407}
{"info/global_step": 408, "train_info/time_within_train_step": 31.976628303527832, "step": 408}
{"train_info/time_between_train_steps": 0.007567405700683594, "step": 408}
{"info/global_step": 409, "train_info/time_within_train_step": 32.40708804130554, "step": 409}
{"train_info/time_between_train_steps": 0.011082649230957031, "step": 409}
{"info/global_step": 410, "train_info/time_within_train_step": 32.28608679771423, "step": 410}
{"train_info/time_between_train_steps": 0.005501985549926758, "step": 410}
{"info/global_step": 411, "train_info/time_within_train_step": 32.52357792854309, "step": 411}
{"train_info/time_between_train_steps": 0.00522303581237793, "step": 411}
{"info/global_step": 412, "train_info/time_within_train_step": 32.30158591270447, "step": 412}
{"train_info/time_between_train_steps": 0.0051462650299072266, "step": 412}
{"info/global_step": 413, "train_info/time_within_train_step": 32.17716884613037, "step": 413}
{"train_info/time_between_train_steps": 0.005304574966430664, "step": 413}
{"info/global_step": 414, "train_info/time_within_train_step": 32.520946979522705, "step": 414}
{"train_info/time_between_train_steps": 0.004912614822387695, "step": 414}
{"info/global_step": 415, "train_info/time_within_train_step": 32.356844425201416, "step": 415}
{"train_info/time_between_train_steps": 0.0049707889556884766, "step": 415}
{"info/global_step": 416, "train_info/time_within_train_step": 32.27116298675537, "step": 416}
{"train_info/time_between_train_steps": 0.005084514617919922, "step": 416}
{"info/global_step": 417, "train_info/time_within_train_step": 32.18281054496765, "step": 417}
{"train_info/time_between_train_steps": 0.005231142044067383, "step": 417}
{"info/global_step": 418, "train_info/time_within_train_step": 32.29518914222717, "step": 418}
{"train_info/time_between_train_steps": 0.005072116851806641, "step": 418}
{"info/global_step": 419, "train_info/time_within_train_step": 32.0013267993927, "step": 419}
{"train_info/time_between_train_steps": 0.005061149597167969, "step": 419}
{"info/global_step": 420, "train_info/time_within_train_step": 32.14422559738159, "step": 420}
{"train_info/time_between_train_steps": 0.005170106887817383, "step": 420}
{"info/global_step": 421, "train_info/time_within_train_step": 32.190518856048584, "step": 421}
{"train_info/time_between_train_steps": 0.006226539611816406, "step": 421}
{"info/global_step": 422, "train_info/time_within_train_step": 32.47921586036682, "step": 422}
{"train_info/time_between_train_steps": 0.004945516586303711, "step": 422}
{"info/global_step": 423, "train_info/time_within_train_step": 32.126333713531494, "step": 423}
{"train_info/time_between_train_steps": 0.005091667175292969, "step": 423}
{"info/global_step": 424, "train_info/time_within_train_step": 32.50057673454285, "step": 424}
{"train_info/time_between_train_steps": 0.006413936614990234, "step": 424}
{"info/global_step": 425, "train_info/time_within_train_step": 32.28959679603577, "step": 425}
{"train_info/time_between_train_steps": 0.006974935531616211, "step": 425}
{"info/global_step": 426, "train_info/time_within_train_step": 32.33735680580139, "step": 426}
{"train_info/time_between_train_steps": 0.005476951599121094, "step": 426}
{"info/global_step": 427, "train_info/time_within_train_step": 32.45458936691284, "step": 427}
{"train_info/time_between_train_steps": 0.0051975250244140625, "step": 427}
{"info/global_step": 428, "train_info/time_within_train_step": 32.24913930892944, "step": 428}
{"train_info/time_between_train_steps": 0.010238409042358398, "step": 428}
{"info/global_step": 429, "train_info/time_within_train_step": 32.5591459274292, "step": 429}
{"train_info/time_between_train_steps": 0.008646488189697266, "step": 429}
{"info/global_step": 430, "train_info/time_within_train_step": 32.388643741607666, "step": 430}
{"train_info/time_between_train_steps": 0.010329961776733398, "step": 430}
{"info/global_step": 431, "train_info/time_within_train_step": 31.91805386543274, "step": 431}
{"train_info/time_between_train_steps": 0.005397796630859375, "step": 431}
{"info/global_step": 432, "train_info/time_within_train_step": 32.683690786361694, "step": 432}
{"train_info/time_between_train_steps": 0.010359525680541992, "step": 432}
{"train_info/time_between_train_steps": 23.645903825759888, "step": 432}
{"info/global_step": 433, "train_info/time_within_train_step": 32.044883012771606, "step": 433}
{"train_info/time_between_train_steps": 0.00971531867980957, "step": 433}
{"info/global_step": 434, "train_info/time_within_train_step": 32.50393533706665, "step": 434}
{"train_info/time_between_train_steps": 0.005284786224365234, "step": 434}
{"info/global_step": 435, "train_info/time_within_train_step": 32.490694999694824, "step": 435}
{"train_info/time_between_train_steps": 0.010900020599365234, "step": 435}
{"info/global_step": 436, "train_info/time_within_train_step": 32.84360218048096, "step": 436}
{"train_info/time_between_train_steps": 0.010262012481689453, "step": 436}
{"info/global_step": 437, "train_info/time_within_train_step": 32.23982834815979, "step": 437}
{"train_info/time_between_train_steps": 0.005406618118286133, "step": 437}
{"info/global_step": 438, "train_info/time_within_train_step": 32.290995836257935, "step": 438}
{"train_info/time_between_train_steps": 0.0053975582122802734, "step": 438}
{"info/global_step": 439, "train_info/time_within_train_step": 32.24326467514038, "step": 439}
{"train_info/time_between_train_steps": 0.005160331726074219, "step": 439}
{"info/global_step": 440, "train_info/time_within_train_step": 32.61563968658447, "step": 440}
{"train_info/time_between_train_steps": 0.010445356369018555, "step": 440}
{"info/global_step": 441, "train_info/time_within_train_step": 32.40563344955444, "step": 441}
{"train_info/time_between_train_steps": 0.0074727535247802734, "step": 441}
{"info/global_step": 442, "train_info/time_within_train_step": 32.6476149559021, "step": 442}
{"train_info/time_between_train_steps": 0.005095720291137695, "step": 442}
{"info/global_step": 443, "train_info/time_within_train_step": 32.46728706359863, "step": 443}
{"train_info/time_between_train_steps": 0.005160808563232422, "step": 443}
{"info/global_step": 444, "train_info/time_within_train_step": 32.03106451034546, "step": 444}
{"train_info/time_between_train_steps": 0.005196571350097656, "step": 444}
{"info/global_step": 445, "train_info/time_within_train_step": 32.593945264816284, "step": 445}
{"train_info/time_between_train_steps": 0.005112171173095703, "step": 445}
{"info/global_step": 446, "train_info/time_within_train_step": 32.60211491584778, "step": 446}
{"train_info/time_between_train_steps": 0.005048990249633789, "step": 446}
{"info/global_step": 447, "train_info/time_within_train_step": 32.51781725883484, "step": 447}
{"train_info/time_between_train_steps": 0.005120515823364258, "step": 447}
{"info/global_step": 448, "train_info/time_within_train_step": 32.27174782752991, "step": 448}
{"train_info/time_between_train_steps": 0.005041599273681641, "step": 448}
{"info/global_step": 449, "train_info/time_within_train_step": 32.18263554573059, "step": 449}
{"train_info/time_between_train_steps": 0.005173206329345703, "step": 449}
{"info/global_step": 450, "train_info/time_within_train_step": 32.237810134887695, "step": 450}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1733702495, "_runtime": 15001}, "step": 450}
{"logs": {"train/loss": 4.0952, "train/learning_rate": 0.00041666666666666664, "train/epoch": 16.02, "_timestamp": 1733702495, "_runtime": 15001}, "step": 450}
{"train_info/time_between_train_steps": 0.012176752090454102, "step": 450}
{"info/global_step": 451, "train_info/time_within_train_step": 32.34288263320923, "step": 451}
{"train_info/time_between_train_steps": 0.0051310062408447266, "step": 451}
{"info/global_step": 452, "train_info/time_within_train_step": 32.33256006240845, "step": 452}
{"train_info/time_between_train_steps": 0.008018016815185547, "step": 452}
{"info/global_step": 453, "train_info/time_within_train_step": 32.402868032455444, "step": 453}
{"train_info/time_between_train_steps": 0.0053005218505859375, "step": 453}
{"info/global_step": 454, "train_info/time_within_train_step": 32.237977743148804, "step": 454}
{"train_info/time_between_train_steps": 0.005115509033203125, "step": 454}
{"info/global_step": 455, "train_info/time_within_train_step": 32.48766565322876, "step": 455}
{"train_info/time_between_train_steps": 0.0051059722900390625, "step": 455}
{"info/global_step": 456, "train_info/time_within_train_step": 32.46036696434021, "step": 456}
{"train_info/time_between_train_steps": 0.010562896728515625, "step": 456}
{"info/global_step": 457, "train_info/time_within_train_step": 32.57489228248596, "step": 457}
{"train_info/time_between_train_steps": 0.01000523567199707, "step": 457}
{"info/global_step": 458, "train_info/time_within_train_step": 32.50670289993286, "step": 458}
{"train_info/time_between_train_steps": 0.005827188491821289, "step": 458}
{"info/global_step": 459, "train_info/time_within_train_step": 32.38246297836304, "step": 459}
{"train_info/time_between_train_steps": 0.0058438777923583984, "step": 459}
{"train_info/time_between_train_steps": 23.20939064025879, "step": 459}
{"info/global_step": 460, "train_info/time_within_train_step": 32.45942258834839, "step": 460}
{"train_info/time_between_train_steps": 0.005711793899536133, "step": 460}
{"info/global_step": 461, "train_info/time_within_train_step": 32.38285994529724, "step": 461}
{"train_info/time_between_train_steps": 0.005269289016723633, "step": 461}
{"info/global_step": 462, "train_info/time_within_train_step": 32.206071853637695, "step": 462}
{"train_info/time_between_train_steps": 0.005174398422241211, "step": 462}
{"info/global_step": 463, "train_info/time_within_train_step": 32.87330603599548, "step": 463}
{"train_info/time_between_train_steps": 0.005399465560913086, "step": 463}
{"info/global_step": 464, "train_info/time_within_train_step": 32.378777265548706, "step": 464}
{"train_info/time_between_train_steps": 0.005547285079956055, "step": 464}
{"info/global_step": 465, "train_info/time_within_train_step": 32.60457468032837, "step": 465}
{"train_info/time_between_train_steps": 0.0053424835205078125, "step": 465}
{"info/global_step": 466, "train_info/time_within_train_step": 32.202648639678955, "step": 466}
{"train_info/time_between_train_steps": 0.005384683609008789, "step": 466}
{"info/global_step": 467, "train_info/time_within_train_step": 32.386587619781494, "step": 467}
{"train_info/time_between_train_steps": 0.005347251892089844, "step": 467}
{"info/global_step": 468, "train_info/time_within_train_step": 32.460891008377075, "step": 468}
{"train_info/time_between_train_steps": 0.004942178726196289, "step": 468}
{"info/global_step": 469, "train_info/time_within_train_step": 32.59860944747925, "step": 469}
{"train_info/time_between_train_steps": 0.005020618438720703, "step": 469}
{"info/global_step": 470, "train_info/time_within_train_step": 31.986740350723267, "step": 470}
{"train_info/time_between_train_steps": 0.004984855651855469, "step": 470}
{"info/global_step": 471, "train_info/time_within_train_step": 32.62618350982666, "step": 471}
{"train_info/time_between_train_steps": 0.0049991607666015625, "step": 471}
{"info/global_step": 472, "train_info/time_within_train_step": 32.25279092788696, "step": 472}
{"train_info/time_between_train_steps": 0.0051500797271728516, "step": 472}
{"info/global_step": 473, "train_info/time_within_train_step": 32.32240891456604, "step": 473}
{"train_info/time_between_train_steps": 0.005159616470336914, "step": 473}
{"info/global_step": 474, "train_info/time_within_train_step": 32.696871757507324, "step": 474}
{"train_info/time_between_train_steps": 0.010191917419433594, "step": 474}
{"info/global_step": 475, "train_info/time_within_train_step": 32.04537653923035, "step": 475}
{"train_info/time_between_train_steps": 0.009853839874267578, "step": 475}
{"info/global_step": 476, "train_info/time_within_train_step": 32.59878659248352, "step": 476}
{"train_info/time_between_train_steps": 0.005199432373046875, "step": 476}
{"info/global_step": 477, "train_info/time_within_train_step": 32.60195970535278, "step": 477}
{"train_info/time_between_train_steps": 0.0052297115325927734, "step": 477}
{"info/global_step": 478, "train_info/time_within_train_step": 32.2260639667511, "step": 478}
{"train_info/time_between_train_steps": 0.007733583450317383, "step": 478}
{"info/global_step": 479, "train_info/time_within_train_step": 32.5276939868927, "step": 479}
{"train_info/time_between_train_steps": 0.00543522834777832, "step": 479}
{"info/global_step": 480, "train_info/time_within_train_step": 32.5105996131897, "step": 480}
{"train_info/time_between_train_steps": 0.005089282989501953, "step": 480}
{"info/global_step": 481, "train_info/time_within_train_step": 32.15965223312378, "step": 481}
{"train_info/time_between_train_steps": 0.008137702941894531, "step": 481}
{"info/global_step": 482, "train_info/time_within_train_step": 32.235591173172, "step": 482}
{"train_info/time_between_train_steps": 0.005106449127197266, "step": 482}
{"info/global_step": 483, "train_info/time_within_train_step": 32.36649799346924, "step": 483}
{"train_info/time_between_train_steps": 0.005560398101806641, "step": 483}
{"info/global_step": 484, "train_info/time_within_train_step": 32.629080057144165, "step": 484}
{"train_info/time_between_train_steps": 0.010206222534179688, "step": 484}
{"info/global_step": 485, "train_info/time_within_train_step": 32.371201038360596, "step": 485}
{"train_info/time_between_train_steps": 0.005312919616699219, "step": 485}
{"info/global_step": 486, "train_info/time_within_train_step": 32.08652472496033, "step": 486}
{"train_info/time_between_train_steps": 0.005599498748779297, "step": 486}
{"train_info/time_between_train_steps": 22.953566312789917, "step": 486}
{"info/global_step": 487, "train_info/time_within_train_step": 32.486432790756226, "step": 487}
{"train_info/time_between_train_steps": 0.0077550411224365234, "step": 487}
{"info/global_step": 488, "train_info/time_within_train_step": 32.613595962524414, "step": 488}
{"train_info/time_between_train_steps": 0.005322933197021484, "step": 488}
{"info/global_step": 489, "train_info/time_within_train_step": 32.63090634346008, "step": 489}
{"train_info/time_between_train_steps": 0.006173372268676758, "step": 489}
{"info/global_step": 490, "train_info/time_within_train_step": 32.35687327384949, "step": 490}
{"train_info/time_between_train_steps": 0.005272865295410156, "step": 490}
{"info/global_step": 491, "train_info/time_within_train_step": 32.330843687057495, "step": 491}
{"train_info/time_between_train_steps": 0.005606651306152344, "step": 491}
{"info/global_step": 492, "train_info/time_within_train_step": 32.572702169418335, "step": 492}
{"train_info/time_between_train_steps": 0.005259275436401367, "step": 492}
{"info/global_step": 493, "train_info/time_within_train_step": 32.26805019378662, "step": 493}
{"train_info/time_between_train_steps": 0.005368709564208984, "step": 493}
{"info/global_step": 494, "train_info/time_within_train_step": 32.473021268844604, "step": 494}
{"train_info/time_between_train_steps": 0.005229473114013672, "step": 494}
{"info/global_step": 495, "train_info/time_within_train_step": 32.367849826812744, "step": 495}
{"train_info/time_between_train_steps": 0.005038022994995117, "step": 495}
{"info/global_step": 496, "train_info/time_within_train_step": 32.253403425216675, "step": 496}
{"train_info/time_between_train_steps": 0.009874582290649414, "step": 496}
{"info/global_step": 497, "train_info/time_within_train_step": 32.0666024684906, "step": 497}
{"train_info/time_between_train_steps": 0.005224943161010742, "step": 497}
{"info/global_step": 498, "train_info/time_within_train_step": 32.2917582988739, "step": 498}
{"train_info/time_between_train_steps": 0.007465839385986328, "step": 498}
{"info/global_step": 499, "train_info/time_within_train_step": 32.646570444107056, "step": 499}
{"train_info/time_between_train_steps": 0.005058765411376953, "step": 499}
{"info/global_step": 500, "train_info/time_within_train_step": 32.318936824798584, "step": 500}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1733704162, "_runtime": 16668}, "step": 500}
{"logs": {"train/loss": 3.9534, "train/learning_rate": 0.00038888888888888887, "train/epoch": 18.01, "_timestamp": 1733704162, "_runtime": 16668}, "step": 500}
{"train_info/time_between_train_steps": 2.857863426208496, "step": 500}
{"info/global_step": 501, "train_info/time_within_train_step": 32.23446297645569, "step": 501}
{"train_info/time_between_train_steps": 0.004934072494506836, "step": 501}
{"info/global_step": 502, "train_info/time_within_train_step": 32.12629413604736, "step": 502}
{"train_info/time_between_train_steps": 0.0051860809326171875, "step": 502}
{"info/global_step": 503, "train_info/time_within_train_step": 32.3449547290802, "step": 503}
{"train_info/time_between_train_steps": 0.005079984664916992, "step": 503}
{"info/global_step": 504, "train_info/time_within_train_step": 32.52473068237305, "step": 504}
{"train_info/time_between_train_steps": 0.00513768196105957, "step": 504}
{"info/global_step": 505, "train_info/time_within_train_step": 32.55833673477173, "step": 505}
{"train_info/time_between_train_steps": 0.004988670349121094, "step": 505}
{"info/global_step": 506, "train_info/time_within_train_step": 32.52776575088501, "step": 506}
{"train_info/time_between_train_steps": 0.0050432682037353516, "step": 506}
{"info/global_step": 507, "train_info/time_within_train_step": 32.33571910858154, "step": 507}
{"train_info/time_between_train_steps": 0.005129098892211914, "step": 507}
{"info/global_step": 508, "train_info/time_within_train_step": 31.8094482421875, "step": 508}
{"train_info/time_between_train_steps": 0.00704646110534668, "step": 508}
{"info/global_step": 509, "train_info/time_within_train_step": 32.31798219680786, "step": 509}
{"train_info/time_between_train_steps": 0.00516819953918457, "step": 509}
{"info/global_step": 510, "train_info/time_within_train_step": 32.48737573623657, "step": 510}
{"train_info/time_between_train_steps": 0.005533456802368164, "step": 510}
{"info/global_step": 511, "train_info/time_within_train_step": 32.593042850494385, "step": 511}
{"train_info/time_between_train_steps": 0.00542902946472168, "step": 511}
{"info/global_step": 512, "train_info/time_within_train_step": 32.482524156570435, "step": 512}
{"train_info/time_between_train_steps": 0.00788116455078125, "step": 512}
{"info/global_step": 513, "train_info/time_within_train_step": 32.20320463180542, "step": 513}
{"train_info/time_between_train_steps": 0.005594491958618164, "step": 513}
{"train_info/time_between_train_steps": 23.44024896621704, "step": 513}
{"info/global_step": 514, "train_info/time_within_train_step": 32.72263288497925, "step": 514}
{"train_info/time_between_train_steps": 0.010937929153442383, "step": 514}
{"info/global_step": 515, "train_info/time_within_train_step": 32.67105460166931, "step": 515}
{"train_info/time_between_train_steps": 0.00545191764831543, "step": 515}
{"info/global_step": 516, "train_info/time_within_train_step": 32.591267347335815, "step": 516}
{"train_info/time_between_train_steps": 0.005200386047363281, "step": 516}
{"info/global_step": 517, "train_info/time_within_train_step": 32.701611280441284, "step": 517}
{"train_info/time_between_train_steps": 0.005385637283325195, "step": 517}
{"info/global_step": 518, "train_info/time_within_train_step": 32.28336572647095, "step": 518}
{"train_info/time_between_train_steps": 0.005570173263549805, "step": 518}
{"info/global_step": 519, "train_info/time_within_train_step": 32.48777103424072, "step": 519}
{"train_info/time_between_train_steps": 0.0053081512451171875, "step": 519}
{"info/global_step": 520, "train_info/time_within_train_step": 32.82217502593994, "step": 520}
{"train_info/time_between_train_steps": 0.005515575408935547, "step": 520}
{"info/global_step": 521, "train_info/time_within_train_step": 32.54741358757019, "step": 521}
{"train_info/time_between_train_steps": 0.005791187286376953, "step": 521}
{"info/global_step": 522, "train_info/time_within_train_step": 32.22557973861694, "step": 522}
{"train_info/time_between_train_steps": 0.005134105682373047, "step": 522}
{"info/global_step": 523, "train_info/time_within_train_step": 32.47010111808777, "step": 523}
{"train_info/time_between_train_steps": 0.007131338119506836, "step": 523}
{"info/global_step": 524, "train_info/time_within_train_step": 32.21182060241699, "step": 524}
{"train_info/time_between_train_steps": 0.0052030086517333984, "step": 524}
{"info/global_step": 525, "train_info/time_within_train_step": 32.242151498794556, "step": 525}
{"train_info/time_between_train_steps": 0.00510096549987793, "step": 525}
{"info/global_step": 526, "train_info/time_within_train_step": 32.56828331947327, "step": 526}
{"train_info/time_between_train_steps": 0.005396366119384766, "step": 526}
{"info/global_step": 527, "train_info/time_within_train_step": 32.63383102416992, "step": 527}
{"train_info/time_between_train_steps": 0.005172014236450195, "step": 527}
{"info/global_step": 528, "train_info/time_within_train_step": 32.373942613601685, "step": 528}
{"train_info/time_between_train_steps": 0.010289669036865234, "step": 528}
{"info/global_step": 529, "train_info/time_within_train_step": 32.22522759437561, "step": 529}
{"train_info/time_between_train_steps": 0.005270719528198242, "step": 529}
{"info/global_step": 530, "train_info/time_within_train_step": 31.677039623260498, "step": 530}
{"train_info/time_between_train_steps": 0.007168292999267578, "step": 530}
{"info/global_step": 531, "train_info/time_within_train_step": 32.35060453414917, "step": 531}
{"train_info/time_between_train_steps": 0.005204439163208008, "step": 531}
{"info/global_step": 532, "train_info/time_within_train_step": 32.36952543258667, "step": 532}
{"train_info/time_between_train_steps": 0.0051670074462890625, "step": 532}
{"info/global_step": 533, "train_info/time_within_train_step": 32.278552532196045, "step": 533}
{"train_info/time_between_train_steps": 0.010301828384399414, "step": 533}
{"info/global_step": 534, "train_info/time_within_train_step": 32.50726628303528, "step": 534}
{"train_info/time_between_train_steps": 0.005191326141357422, "step": 534}
{"info/global_step": 535, "train_info/time_within_train_step": 32.62401580810547, "step": 535}
{"train_info/time_between_train_steps": 0.009580612182617188, "step": 535}
{"info/global_step": 536, "train_info/time_within_train_step": 32.10844111442566, "step": 536}
{"train_info/time_between_train_steps": 0.005093097686767578, "step": 536}
{"info/global_step": 537, "train_info/time_within_train_step": 32.296642541885376, "step": 537}
{"train_info/time_between_train_steps": 0.005263090133666992, "step": 537}
{"info/global_step": 538, "train_info/time_within_train_step": 32.5011351108551, "step": 538}
{"train_info/time_between_train_steps": 0.010338306427001953, "step": 538}
{"info/global_step": 539, "train_info/time_within_train_step": 32.66003680229187, "step": 539}
{"train_info/time_between_train_steps": 0.005749702453613281, "step": 539}
{"info/global_step": 540, "train_info/time_within_train_step": 32.58250331878662, "step": 540}
{"train_info/time_between_train_steps": 0.0058441162109375, "step": 540}
{"train_info/time_between_train_steps": 23.906949758529663, "step": 540}
{"info/global_step": 541, "train_info/time_within_train_step": 32.00331950187683, "step": 541}
{"train_info/time_between_train_steps": 0.008070230484008789, "step": 541}
{"info/global_step": 542, "train_info/time_within_train_step": 32.71259164810181, "step": 542}
{"train_info/time_between_train_steps": 0.005349874496459961, "step": 542}
{"info/global_step": 543, "train_info/time_within_train_step": 32.49238610267639, "step": 543}
{"train_info/time_between_train_steps": 0.005117893218994141, "step": 543}
{"info/global_step": 544, "train_info/time_within_train_step": 32.67269492149353, "step": 544}
{"train_info/time_between_train_steps": 0.007421016693115234, "step": 544}
{"info/global_step": 545, "train_info/time_within_train_step": 32.58752965927124, "step": 545}
{"train_info/time_between_train_steps": 0.005208015441894531, "step": 545}
{"info/global_step": 546, "train_info/time_within_train_step": 32.91587710380554, "step": 546}
{"train_info/time_between_train_steps": 0.01092839241027832, "step": 546}
{"info/global_step": 547, "train_info/time_within_train_step": 32.07707500457764, "step": 547}
{"train_info/time_between_train_steps": 0.0071985721588134766, "step": 547}
{"info/global_step": 548, "train_info/time_within_train_step": 32.425986766815186, "step": 548}
{"train_info/time_between_train_steps": 0.00555419921875, "step": 548}
{"info/global_step": 549, "train_info/time_within_train_step": 32.513680934906006, "step": 549}
{"train_info/time_between_train_steps": 0.00859522819519043, "step": 549}
{"info/global_step": 550, "train_info/time_within_train_step": 32.39877486228943, "step": 550}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1733705834, "_runtime": 18340}, "step": 550}
{"logs": {"train/loss": 3.831, "train/learning_rate": 0.0003611111111111111, "train/epoch": 20.01, "_timestamp": 1733705834, "_runtime": 18340}, "step": 550}
{"train_info/time_between_train_steps": 0.006832599639892578, "step": 550}
{"info/global_step": 551, "train_info/time_within_train_step": 32.64228892326355, "step": 551}
{"train_info/time_between_train_steps": 0.0051517486572265625, "step": 551}
{"info/global_step": 552, "train_info/time_within_train_step": 32.44235873222351, "step": 552}
{"train_info/time_between_train_steps": 0.00983428955078125, "step": 552}
{"info/global_step": 553, "train_info/time_within_train_step": 32.221405267715454, "step": 553}
{"train_info/time_between_train_steps": 0.005076169967651367, "step": 553}
{"info/global_step": 554, "train_info/time_within_train_step": 32.22242760658264, "step": 554}
{"train_info/time_between_train_steps": 0.005255937576293945, "step": 554}
{"info/global_step": 555, "train_info/time_within_train_step": 32.38246464729309, "step": 555}
{"train_info/time_between_train_steps": 0.005045890808105469, "step": 555}
{"info/global_step": 556, "train_info/time_within_train_step": 32.48442482948303, "step": 556}
{"train_info/time_between_train_steps": 0.005091667175292969, "step": 556}
{"info/global_step": 557, "train_info/time_within_train_step": 32.26198148727417, "step": 557}
{"train_info/time_between_train_steps": 0.007915735244750977, "step": 557}
{"info/global_step": 558, "train_info/time_within_train_step": 32.66205930709839, "step": 558}
{"train_info/time_between_train_steps": 0.005150794982910156, "step": 558}
{"info/global_step": 559, "train_info/time_within_train_step": 32.137126207351685, "step": 559}
{"train_info/time_between_train_steps": 0.006383180618286133, "step": 559}
{"info/global_step": 560, "train_info/time_within_train_step": 32.31962728500366, "step": 560}
{"train_info/time_between_train_steps": 0.00512385368347168, "step": 560}
{"info/global_step": 561, "train_info/time_within_train_step": 32.2489652633667, "step": 561}
{"train_info/time_between_train_steps": 0.0052874088287353516, "step": 561}
{"info/global_step": 562, "train_info/time_within_train_step": 32.35722255706787, "step": 562}
{"train_info/time_between_train_steps": 0.0050885677337646484, "step": 562}
{"info/global_step": 563, "train_info/time_within_train_step": 32.83889937400818, "step": 563}
{"train_info/time_between_train_steps": 0.005156755447387695, "step": 563}
{"info/global_step": 564, "train_info/time_within_train_step": 32.405197620391846, "step": 564}
{"train_info/time_between_train_steps": 0.0054166316986083984, "step": 564}
{"info/global_step": 565, "train_info/time_within_train_step": 31.971935033798218, "step": 565}
{"train_info/time_between_train_steps": 0.005162715911865234, "step": 565}
{"info/global_step": 566, "train_info/time_within_train_step": 32.392829179763794, "step": 566}
{"train_info/time_between_train_steps": 0.005387544631958008, "step": 566}
{"info/global_step": 567, "train_info/time_within_train_step": 32.510549545288086, "step": 567}
{"train_info/time_between_train_steps": 0.0054111480712890625, "step": 567}
{"train_info/time_between_train_steps": 23.338230848312378, "step": 567}
{"info/global_step": 568, "train_info/time_within_train_step": 32.07943058013916, "step": 568}
{"train_info/time_between_train_steps": 0.005002021789550781, "step": 568}
{"info/global_step": 569, "train_info/time_within_train_step": 32.425623416900635, "step": 569}
{"train_info/time_between_train_steps": 0.007276296615600586, "step": 569}
{"info/global_step": 570, "train_info/time_within_train_step": 32.02962255477905, "step": 570}
{"train_info/time_between_train_steps": 0.008228540420532227, "step": 570}
{"info/global_step": 571, "train_info/time_within_train_step": 32.538822174072266, "step": 571}
{"train_info/time_between_train_steps": 0.008112907409667969, "step": 571}
{"info/global_step": 572, "train_info/time_within_train_step": 32.49236989021301, "step": 572}
{"train_info/time_between_train_steps": 0.011657238006591797, "step": 572}
{"info/global_step": 573, "train_info/time_within_train_step": 32.87103486061096, "step": 573}
{"train_info/time_between_train_steps": 0.005408287048339844, "step": 573}
{"info/global_step": 574, "train_info/time_within_train_step": 32.53813600540161, "step": 574}
{"train_info/time_between_train_steps": 0.005410432815551758, "step": 574}
{"info/global_step": 575, "train_info/time_within_train_step": 32.5726683139801, "step": 575}
{"train_info/time_between_train_steps": 0.00557708740234375, "step": 575}
{"info/global_step": 576, "train_info/time_within_train_step": 32.04811978340149, "step": 576}
{"train_info/time_between_train_steps": 0.005273342132568359, "step": 576}
{"info/global_step": 577, "train_info/time_within_train_step": 32.52315855026245, "step": 577}
{"train_info/time_between_train_steps": 0.004969120025634766, "step": 577}
{"info/global_step": 578, "train_info/time_within_train_step": 32.4273407459259, "step": 578}
{"train_info/time_between_train_steps": 0.00982809066772461, "step": 578}
{"info/global_step": 579, "train_info/time_within_train_step": 32.657390117645264, "step": 579}
{"train_info/time_between_train_steps": 0.010014772415161133, "step": 579}
{"info/global_step": 580, "train_info/time_within_train_step": 32.38017725944519, "step": 580}
{"train_info/time_between_train_steps": 0.007009983062744141, "step": 580}
{"info/global_step": 581, "train_info/time_within_train_step": 32.570059299468994, "step": 581}
{"train_info/time_between_train_steps": 0.005475044250488281, "step": 581}
{"info/global_step": 582, "train_info/time_within_train_step": 32.02998089790344, "step": 582}
{"train_info/time_between_train_steps": 0.005202531814575195, "step": 582}
{"info/global_step": 583, "train_info/time_within_train_step": 32.138160705566406, "step": 583}
{"train_info/time_between_train_steps": 0.005211830139160156, "step": 583}
{"info/global_step": 584, "train_info/time_within_train_step": 32.20316004753113, "step": 584}
{"train_info/time_between_train_steps": 0.00528407096862793, "step": 584}
{"info/global_step": 585, "train_info/time_within_train_step": 32.28374767303467, "step": 585}
{"train_info/time_between_train_steps": 0.0052258968353271484, "step": 585}
{"info/global_step": 586, "train_info/time_within_train_step": 32.58183979988098, "step": 586}
{"train_info/time_between_train_steps": 0.005175590515136719, "step": 586}
{"info/global_step": 587, "train_info/time_within_train_step": 32.448155879974365, "step": 587}
{"train_info/time_between_train_steps": 0.008850336074829102, "step": 587}
{"info/global_step": 588, "train_info/time_within_train_step": 32.233038902282715, "step": 588}
{"train_info/time_between_train_steps": 0.005258083343505859, "step": 588}
{"info/global_step": 589, "train_info/time_within_train_step": 32.22959589958191, "step": 589}
{"train_info/time_between_train_steps": 0.005126476287841797, "step": 589}
{"info/global_step": 590, "train_info/time_within_train_step": 32.38295030593872, "step": 590}
{"train_info/time_between_train_steps": 0.0050656795501708984, "step": 590}
{"info/global_step": 591, "train_info/time_within_train_step": 32.57872748374939, "step": 591}
{"train_info/time_between_train_steps": 0.005434513092041016, "step": 591}
{"info/global_step": 592, "train_info/time_within_train_step": 32.378926277160645, "step": 592}
{"train_info/time_between_train_steps": 0.005382537841796875, "step": 592}
{"info/global_step": 593, "train_info/time_within_train_step": 32.46468687057495, "step": 593}
{"train_info/time_between_train_steps": 0.005644083023071289, "step": 593}
{"info/global_step": 594, "train_info/time_within_train_step": 32.74580383300781, "step": 594}
{"train_info/time_between_train_steps": 0.005932807922363281, "step": 594}
{"train_info/time_between_train_steps": 23.062691926956177, "step": 594}
{"info/global_step": 595, "train_info/time_within_train_step": 32.32486414909363, "step": 595}
{"train_info/time_between_train_steps": 0.005522727966308594, "step": 595}
{"info/global_step": 596, "train_info/time_within_train_step": 32.51100420951843, "step": 596}
{"train_info/time_between_train_steps": 0.005440950393676758, "step": 596}
{"info/global_step": 597, "train_info/time_within_train_step": 32.45440912246704, "step": 597}
{"train_info/time_between_train_steps": 0.005420684814453125, "step": 597}
{"info/global_step": 598, "train_info/time_within_train_step": 32.78125596046448, "step": 598}
{"train_info/time_between_train_steps": 0.010076284408569336, "step": 598}
{"info/global_step": 599, "train_info/time_within_train_step": 32.52008247375488, "step": 599}
{"train_info/time_between_train_steps": 0.005438327789306641, "step": 599}
{"info/global_step": 600, "train_info/time_within_train_step": 32.13923907279968, "step": 600}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1733707500, "_runtime": 20006}, "step": 600}
{"logs": {"train/loss": 3.7313, "train/learning_rate": 0.0003333333333333333, "train/epoch": 22.0, "_timestamp": 1733707500, "_runtime": 20006}, "step": 600}
{"train_info/time_between_train_steps": 2.8862409591674805, "step": 600}
{"info/global_step": 601, "train_info/time_within_train_step": 32.34042310714722, "step": 601}
{"train_info/time_between_train_steps": 0.005231142044067383, "step": 601}
{"info/global_step": 602, "train_info/time_within_train_step": 32.33927297592163, "step": 602}
{"train_info/time_between_train_steps": 0.006749391555786133, "step": 602}
{"info/global_step": 603, "train_info/time_within_train_step": 32.37821888923645, "step": 603}
{"train_info/time_between_train_steps": 0.00511622428894043, "step": 603}
{"info/global_step": 604, "train_info/time_within_train_step": 32.56428408622742, "step": 604}
{"train_info/time_between_train_steps": 0.005078792572021484, "step": 604}
{"info/global_step": 605, "train_info/time_within_train_step": 32.28351092338562, "step": 605}
{"train_info/time_between_train_steps": 0.010796308517456055, "step": 605}
{"info/global_step": 606, "train_info/time_within_train_step": 32.43317008018494, "step": 606}
{"train_info/time_between_train_steps": 0.00728297233581543, "step": 606}
{"info/global_step": 607, "train_info/time_within_train_step": 32.21800184249878, "step": 607}
{"train_info/time_between_train_steps": 0.005626201629638672, "step": 607}
{"info/global_step": 608, "train_info/time_within_train_step": 32.38512563705444, "step": 608}
{"train_info/time_between_train_steps": 0.005095005035400391, "step": 608}
{"info/global_step": 609, "train_info/time_within_train_step": 32.51882886886597, "step": 609}
{"train_info/time_between_train_steps": 0.00513768196105957, "step": 609}
{"info/global_step": 610, "train_info/time_within_train_step": 32.523839712142944, "step": 610}
{"train_info/time_between_train_steps": 0.005158185958862305, "step": 610}
{"info/global_step": 611, "train_info/time_within_train_step": 32.87521004676819, "step": 611}
{"train_info/time_between_train_steps": 0.014261007308959961, "step": 611}
{"info/global_step": 612, "train_info/time_within_train_step": 32.613526582717896, "step": 612}
{"train_info/time_between_train_steps": 0.005113124847412109, "step": 612}
{"info/global_step": 613, "train_info/time_within_train_step": 32.395880937576294, "step": 613}
{"train_info/time_between_train_steps": 0.006127357482910156, "step": 613}
{"info/global_step": 614, "train_info/time_within_train_step": 32.26653456687927, "step": 614}
{"train_info/time_between_train_steps": 0.00513911247253418, "step": 614}
{"info/global_step": 615, "train_info/time_within_train_step": 32.57195782661438, "step": 615}
{"train_info/time_between_train_steps": 0.005316495895385742, "step": 615}
{"info/global_step": 616, "train_info/time_within_train_step": 32.65190601348877, "step": 616}
{"train_info/time_between_train_steps": 0.005394697189331055, "step": 616}
{"info/global_step": 617, "train_info/time_within_train_step": 32.506019592285156, "step": 617}
{"train_info/time_between_train_steps": 0.005110025405883789, "step": 617}
{"info/global_step": 618, "train_info/time_within_train_step": 32.777992725372314, "step": 618}
{"train_info/time_between_train_steps": 0.00567936897277832, "step": 618}
{"info/global_step": 619, "train_info/time_within_train_step": 32.285125970840454, "step": 619}
{"train_info/time_between_train_steps": 0.005319833755493164, "step": 619}
{"info/global_step": 620, "train_info/time_within_train_step": 32.52779245376587, "step": 620}
{"train_info/time_between_train_steps": 0.0056192874908447266, "step": 620}
{"info/global_step": 621, "train_info/time_within_train_step": 32.534090995788574, "step": 621}
{"train_info/time_between_train_steps": 0.005799770355224609, "step": 621}
{"train_info/time_between_train_steps": 23.749394416809082, "step": 621}
{"info/global_step": 622, "train_info/time_within_train_step": 32.44508194923401, "step": 622}
{"train_info/time_between_train_steps": 0.005541086196899414, "step": 622}
{"info/global_step": 623, "train_info/time_within_train_step": 32.664265871047974, "step": 623}
{"train_info/time_between_train_steps": 0.0053501129150390625, "step": 623}
{"info/global_step": 624, "train_info/time_within_train_step": 32.27399730682373, "step": 624}
{"train_info/time_between_train_steps": 0.009855508804321289, "step": 624}
{"info/global_step": 625, "train_info/time_within_train_step": 32.23417544364929, "step": 625}
{"train_info/time_between_train_steps": 0.005563497543334961, "step": 625}
{"info/global_step": 626, "train_info/time_within_train_step": 32.60963296890259, "step": 626}
{"train_info/time_between_train_steps": 0.0056073665618896484, "step": 626}
{"info/global_step": 627, "train_info/time_within_train_step": 32.69018626213074, "step": 627}
{"train_info/time_between_train_steps": 0.008092164993286133, "step": 627}
{"info/global_step": 628, "train_info/time_within_train_step": 32.49269080162048, "step": 628}
{"train_info/time_between_train_steps": 0.005171298980712891, "step": 628}
{"info/global_step": 629, "train_info/time_within_train_step": 32.52678871154785, "step": 629}
{"train_info/time_between_train_steps": 0.007508277893066406, "step": 629}
{"info/global_step": 630, "train_info/time_within_train_step": 32.70770239830017, "step": 630}
{"train_info/time_between_train_steps": 0.005202770233154297, "step": 630}
{"info/global_step": 631, "train_info/time_within_train_step": 32.08567667007446, "step": 631}
{"train_info/time_between_train_steps": 0.009239673614501953, "step": 631}
{"info/global_step": 632, "train_info/time_within_train_step": 32.69443321228027, "step": 632}
{"train_info/time_between_train_steps": 0.005322933197021484, "step": 632}
{"info/global_step": 633, "train_info/time_within_train_step": 32.4986298084259, "step": 633}
{"train_info/time_between_train_steps": 0.008731365203857422, "step": 633}
{"info/global_step": 634, "train_info/time_within_train_step": 32.44006276130676, "step": 634}
{"train_info/time_between_train_steps": 0.007971525192260742, "step": 634}
{"info/global_step": 635, "train_info/time_within_train_step": 32.64633536338806, "step": 635}
{"train_info/time_between_train_steps": 0.009912967681884766, "step": 635}
{"info/global_step": 636, "train_info/time_within_train_step": 32.80328106880188, "step": 636}
{"train_info/time_between_train_steps": 0.009974956512451172, "step": 636}
{"info/global_step": 637, "train_info/time_within_train_step": 32.061989545822144, "step": 637}
{"train_info/time_between_train_steps": 0.004996538162231445, "step": 637}
{"info/global_step": 638, "train_info/time_within_train_step": 32.396159648895264, "step": 638}
{"train_info/time_between_train_steps": 0.0070040225982666016, "step": 638}
{"info/global_step": 639, "train_info/time_within_train_step": 32.44412851333618, "step": 639}
{"train_info/time_between_train_steps": 0.005128145217895508, "step": 639}
{"info/global_step": 640, "train_info/time_within_train_step": 32.52452492713928, "step": 640}
{"train_info/time_between_train_steps": 0.010030031204223633, "step": 640}
{"info/global_step": 641, "train_info/time_within_train_step": 32.57741689682007, "step": 641}
{"train_info/time_between_train_steps": 0.00836801528930664, "step": 641}
{"info/global_step": 642, "train_info/time_within_train_step": 32.69069766998291, "step": 642}
{"train_info/time_between_train_steps": 0.0070285797119140625, "step": 642}
{"info/global_step": 643, "train_info/time_within_train_step": 32.27258634567261, "step": 643}
{"train_info/time_between_train_steps": 0.00496983528137207, "step": 643}
{"info/global_step": 644, "train_info/time_within_train_step": 32.45308327674866, "step": 644}
{"train_info/time_between_train_steps": 0.0051364898681640625, "step": 644}
{"info/global_step": 645, "train_info/time_within_train_step": 32.315003395080566, "step": 645}
{"train_info/time_between_train_steps": 0.010029792785644531, "step": 645}
{"info/global_step": 646, "train_info/time_within_train_step": 32.55570960044861, "step": 646}
{"train_info/time_between_train_steps": 0.0068302154541015625, "step": 646}
{"info/global_step": 647, "train_info/time_within_train_step": 32.78330135345459, "step": 647}
{"train_info/time_between_train_steps": 0.011020898818969727, "step": 647}
{"info/global_step": 648, "train_info/time_within_train_step": 32.486608028411865, "step": 648}
{"train_info/time_between_train_steps": 0.012178421020507812, "step": 648}
{"train_info/time_between_train_steps": 23.926551342010498, "step": 648}
{"info/global_step": 649, "train_info/time_within_train_step": 32.15944981575012, "step": 649}
{"train_info/time_between_train_steps": 0.0077972412109375, "step": 649}
{"info/global_step": 650, "train_info/time_within_train_step": 32.92580246925354, "step": 650}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1733709176, "_runtime": 21682}, "step": 650}
{"logs": {"train/loss": 3.6388, "train/learning_rate": 0.00030555555555555555, "train/epoch": 24.0, "_timestamp": 1733709176, "_runtime": 21682}, "step": 650}
{"train_info/time_between_train_steps": 0.007627010345458984, "step": 650}
{"info/global_step": 651, "train_info/time_within_train_step": 32.25647187232971, "step": 651}
{"train_info/time_between_train_steps": 0.005355119705200195, "step": 651}
{"info/global_step": 652, "train_info/time_within_train_step": 32.53202939033508, "step": 652}
{"train_info/time_between_train_steps": 0.00538945198059082, "step": 652}
{"info/global_step": 653, "train_info/time_within_train_step": 32.655407667160034, "step": 653}
{"train_info/time_between_train_steps": 0.00519251823425293, "step": 653}
{"info/global_step": 654, "train_info/time_within_train_step": 32.8899359703064, "step": 654}
{"train_info/time_between_train_steps": 0.009895801544189453, "step": 654}
{"info/global_step": 655, "train_info/time_within_train_step": 32.3553512096405, "step": 655}
{"train_info/time_between_train_steps": 0.005316257476806641, "step": 655}
{"info/global_step": 656, "train_info/time_within_train_step": 32.15269207954407, "step": 656}
{"train_info/time_between_train_steps": 0.005190372467041016, "step": 656}
{"info/global_step": 657, "train_info/time_within_train_step": 32.46886157989502, "step": 657}
{"train_info/time_between_train_steps": 0.0048258304595947266, "step": 657}
{"info/global_step": 658, "train_info/time_within_train_step": 32.47311973571777, "step": 658}
{"train_info/time_between_train_steps": 0.004900932312011719, "step": 658}
{"info/global_step": 659, "train_info/time_within_train_step": 32.52952551841736, "step": 659}
{"train_info/time_between_train_steps": 0.0051801204681396484, "step": 659}
{"info/global_step": 660, "train_info/time_within_train_step": 32.63337850570679, "step": 660}
{"train_info/time_between_train_steps": 0.010025978088378906, "step": 660}
{"info/global_step": 661, "train_info/time_within_train_step": 32.7012083530426, "step": 661}
{"train_info/time_between_train_steps": 0.005114555358886719, "step": 661}
{"info/global_step": 662, "train_info/time_within_train_step": 31.81190514564514, "step": 662}
{"train_info/time_between_train_steps": 0.005192756652832031, "step": 662}
{"info/global_step": 663, "train_info/time_within_train_step": 32.308501958847046, "step": 663}
{"train_info/time_between_train_steps": 0.005316257476806641, "step": 663}
{"info/global_step": 664, "train_info/time_within_train_step": 32.773677825927734, "step": 664}
{"train_info/time_between_train_steps": 0.005333900451660156, "step": 664}
{"info/global_step": 665, "train_info/time_within_train_step": 32.485291719436646, "step": 665}
{"train_info/time_between_train_steps": 0.005234479904174805, "step": 665}
{"info/global_step": 666, "train_info/time_within_train_step": 32.317065715789795, "step": 666}
{"train_info/time_between_train_steps": 0.007977485656738281, "step": 666}
{"info/global_step": 667, "train_info/time_within_train_step": 32.53290104866028, "step": 667}
{"train_info/time_between_train_steps": 0.005135297775268555, "step": 667}
{"info/global_step": 668, "train_info/time_within_train_step": 32.45036435127258, "step": 668}
{"train_info/time_between_train_steps": 0.005007266998291016, "step": 668}
{"info/global_step": 669, "train_info/time_within_train_step": 32.247780561447144, "step": 669}
{"train_info/time_between_train_steps": 0.0051441192626953125, "step": 669}
{"info/global_step": 670, "train_info/time_within_train_step": 32.48869013786316, "step": 670}
{"train_info/time_between_train_steps": 0.005280017852783203, "step": 670}
{"info/global_step": 671, "train_info/time_within_train_step": 32.389084577560425, "step": 671}
{"train_info/time_between_train_steps": 0.005228519439697266, "step": 671}
{"info/global_step": 672, "train_info/time_within_train_step": 32.37579917907715, "step": 672}
{"train_info/time_between_train_steps": 0.0055692195892333984, "step": 672}
{"info/global_step": 673, "train_info/time_within_train_step": 32.49195408821106, "step": 673}
{"train_info/time_between_train_steps": 0.005297660827636719, "step": 673}
{"info/global_step": 674, "train_info/time_within_train_step": 32.57997536659241, "step": 674}
{"train_info/time_between_train_steps": 0.0054569244384765625, "step": 674}
{"info/global_step": 675, "train_info/time_within_train_step": 32.52033495903015, "step": 675}
{"train_info/time_between_train_steps": 0.0055501461029052734, "step": 675}
{"train_info/time_between_train_steps": 23.24444317817688, "step": 675}
{"info/global_step": 676, "train_info/time_within_train_step": 32.381990909576416, "step": 676}
{"train_info/time_between_train_steps": 0.006124973297119141, "step": 676}
{"info/global_step": 677, "train_info/time_within_train_step": 32.541271686553955, "step": 677}
{"train_info/time_between_train_steps": 0.005452156066894531, "step": 677}
{"info/global_step": 678, "train_info/time_within_train_step": 32.63214612007141, "step": 678}
{"train_info/time_between_train_steps": 0.005189657211303711, "step": 678}
{"info/global_step": 679, "train_info/time_within_train_step": 32.7324275970459, "step": 679}
{"train_info/time_between_train_steps": 0.005388498306274414, "step": 679}
{"info/global_step": 680, "train_info/time_within_train_step": 32.71208310127258, "step": 680}
{"train_info/time_between_train_steps": 0.005609273910522461, "step": 680}
{"info/global_step": 681, "train_info/time_within_train_step": 32.02036905288696, "step": 681}
{"train_info/time_between_train_steps": 0.010075092315673828, "step": 681}
{"info/global_step": 682, "train_info/time_within_train_step": 32.46235799789429, "step": 682}
{"train_info/time_between_train_steps": 0.005627155303955078, "step": 682}
{"info/global_step": 683, "train_info/time_within_train_step": 32.37650990486145, "step": 683}
{"train_info/time_between_train_steps": 0.005242586135864258, "step": 683}
{"info/global_step": 684, "train_info/time_within_train_step": 32.54866337776184, "step": 684}
{"train_info/time_between_train_steps": 0.005141735076904297, "step": 684}
{"info/global_step": 685, "train_info/time_within_train_step": 32.612756967544556, "step": 685}
{"train_info/time_between_train_steps": 0.005100727081298828, "step": 685}
{"info/global_step": 686, "train_info/time_within_train_step": 32.78991651535034, "step": 686}
{"train_info/time_between_train_steps": 0.005105733871459961, "step": 686}
{"info/global_step": 687, "train_info/time_within_train_step": 32.3804452419281, "step": 687}
{"train_info/time_between_train_steps": 0.005049943923950195, "step": 687}
{"info/global_step": 688, "train_info/time_within_train_step": 32.155338287353516, "step": 688}
{"train_info/time_between_train_steps": 0.00515294075012207, "step": 688}
{"info/global_step": 689, "train_info/time_within_train_step": 32.43709754943848, "step": 689}
{"train_info/time_between_train_steps": 0.0051975250244140625, "step": 689}
{"info/global_step": 690, "train_info/time_within_train_step": 32.24974751472473, "step": 690}
{"train_info/time_between_train_steps": 0.005144834518432617, "step": 690}
{"info/global_step": 691, "train_info/time_within_train_step": 32.491522550582886, "step": 691}
{"train_info/time_between_train_steps": 0.005042552947998047, "step": 691}
{"info/global_step": 692, "train_info/time_within_train_step": 32.59416937828064, "step": 692}
{"train_info/time_between_train_steps": 0.010141849517822266, "step": 692}
{"info/global_step": 693, "train_info/time_within_train_step": 32.59670066833496, "step": 693}
{"train_info/time_between_train_steps": 0.009829044342041016, "step": 693}
{"info/global_step": 694, "train_info/time_within_train_step": 32.47878623008728, "step": 694}
{"train_info/time_between_train_steps": 0.010074377059936523, "step": 694}
{"info/global_step": 695, "train_info/time_within_train_step": 32.11550831794739, "step": 695}
{"train_info/time_between_train_steps": 0.005396366119384766, "step": 695}
{"info/global_step": 696, "train_info/time_within_train_step": 32.39174199104309, "step": 696}
{"train_info/time_between_train_steps": 0.005144596099853516, "step": 696}
{"info/global_step": 697, "train_info/time_within_train_step": 32.2558491230011, "step": 697}
{"train_info/time_between_train_steps": 0.005137920379638672, "step": 697}
{"info/global_step": 698, "train_info/time_within_train_step": 32.430216789245605, "step": 698}
{"train_info/time_between_train_steps": 0.005187034606933594, "step": 698}
{"info/global_step": 699, "train_info/time_within_train_step": 32.678308725357056, "step": 699}
{"train_info/time_between_train_steps": 0.005424022674560547, "step": 699}
{"info/global_step": 700, "train_info/time_within_train_step": 32.408344984054565, "step": 700}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1733710822, "_runtime": 23328}, "step": 700}
{"logs": {"train/loss": 3.512, "train/learning_rate": 0.0002777777777777778, "train/epoch": 25.02, "_timestamp": 1733710822, "_runtime": 23328}, "step": 700}
{"train_info/time_between_train_steps": 2.3045246601104736, "step": 700}
{"info/global_step": 701, "train_info/time_within_train_step": 32.43240928649902, "step": 701}
{"train_info/time_between_train_steps": 0.005550861358642578, "step": 701}
{"info/global_step": 702, "train_info/time_within_train_step": 32.114853382110596, "step": 702}
{"train_info/time_between_train_steps": 0.005888223648071289, "step": 702}
{"train_info/time_between_train_steps": 23.59015965461731, "step": 702}
{"info/global_step": 703, "train_info/time_within_train_step": 32.274251222610474, "step": 703}
{"train_info/time_between_train_steps": 0.005498409271240234, "step": 703}
{"info/global_step": 704, "train_info/time_within_train_step": 32.533220529556274, "step": 704}
{"train_info/time_between_train_steps": 0.005459785461425781, "step": 704}
{"info/global_step": 705, "train_info/time_within_train_step": 32.46354627609253, "step": 705}
{"train_info/time_between_train_steps": 0.005366325378417969, "step": 705}
{"info/global_step": 706, "train_info/time_within_train_step": 32.362138509750366, "step": 706}
{"train_info/time_between_train_steps": 0.005179882049560547, "step": 706}
{"info/global_step": 707, "train_info/time_within_train_step": 32.377501487731934, "step": 707}
{"train_info/time_between_train_steps": 0.0070362091064453125, "step": 707}
{"info/global_step": 708, "train_info/time_within_train_step": 32.546868324279785, "step": 708}
{"train_info/time_between_train_steps": 0.0050966739654541016, "step": 708}
{"info/global_step": 709, "train_info/time_within_train_step": 32.169944286346436, "step": 709}
{"train_info/time_between_train_steps": 0.006556987762451172, "step": 709}
{"info/global_step": 710, "train_info/time_within_train_step": 32.36545181274414, "step": 710}
{"train_info/time_between_train_steps": 0.00534510612487793, "step": 710}
{"info/global_step": 711, "train_info/time_within_train_step": 31.98538064956665, "step": 711}
{"train_info/time_between_train_steps": 0.005104780197143555, "step": 711}
{"info/global_step": 712, "train_info/time_within_train_step": 32.452841997146606, "step": 712}
{"train_info/time_between_train_steps": 0.005023956298828125, "step": 712}
{"info/global_step": 713, "train_info/time_within_train_step": 32.464693784713745, "step": 713}
{"train_info/time_between_train_steps": 0.007283210754394531, "step": 713}
{"info/global_step": 714, "train_info/time_within_train_step": 32.44520378112793, "step": 714}
{"train_info/time_between_train_steps": 0.01456451416015625, "step": 714}
{"info/global_step": 715, "train_info/time_within_train_step": 32.48294425010681, "step": 715}
{"train_info/time_between_train_steps": 0.0050466060638427734, "step": 715}
{"info/global_step": 716, "train_info/time_within_train_step": 32.187999963760376, "step": 716}
{"train_info/time_between_train_steps": 0.005181074142456055, "step": 716}
{"info/global_step": 717, "train_info/time_within_train_step": 32.25134205818176, "step": 717}
{"train_info/time_between_train_steps": 0.00503230094909668, "step": 717}
{"info/global_step": 718, "train_info/time_within_train_step": 32.15797305107117, "step": 718}
{"train_info/time_between_train_steps": 0.005236148834228516, "step": 718}
{"info/global_step": 719, "train_info/time_within_train_step": 32.81424331665039, "step": 719}
{"train_info/time_between_train_steps": 0.005382061004638672, "step": 719}
{"info/global_step": 720, "train_info/time_within_train_step": 32.2372989654541, "step": 720}
{"train_info/time_between_train_steps": 0.005415201187133789, "step": 720}
{"info/global_step": 721, "train_info/time_within_train_step": 32.352516174316406, "step": 721}
{"train_info/time_between_train_steps": 0.005135774612426758, "step": 721}
{"info/global_step": 722, "train_info/time_within_train_step": 32.598347425460815, "step": 722}
{"train_info/time_between_train_steps": 0.010986089706420898, "step": 722}
{"info/global_step": 723, "train_info/time_within_train_step": 32.38159394264221, "step": 723}
{"train_info/time_between_train_steps": 0.005204200744628906, "step": 723}
{"info/global_step": 724, "train_info/time_within_train_step": 32.63857817649841, "step": 724}
{"train_info/time_between_train_steps": 0.005103111267089844, "step": 724}
{"info/global_step": 725, "train_info/time_within_train_step": 32.4076144695282, "step": 725}
{"train_info/time_between_train_steps": 0.005383491516113281, "step": 725}
{"info/global_step": 726, "train_info/time_within_train_step": 32.39732336997986, "step": 726}
{"train_info/time_between_train_steps": 0.0103912353515625, "step": 726}
{"info/global_step": 727, "train_info/time_within_train_step": 32.29981565475464, "step": 727}
{"train_info/time_between_train_steps": 0.0088653564453125, "step": 727}
{"info/global_step": 728, "train_info/time_within_train_step": 32.70540261268616, "step": 728}
{"train_info/time_between_train_steps": 0.005751371383666992, "step": 728}
{"info/global_step": 729, "train_info/time_within_train_step": 32.225844383239746, "step": 729}
{"train_info/time_between_train_steps": 0.0057337284088134766, "step": 729}
{"train_info/time_between_train_steps": 23.315000772476196, "step": 729}
{"info/global_step": 730, "train_info/time_within_train_step": 32.413360357284546, "step": 730}
{"train_info/time_between_train_steps": 0.00561070442199707, "step": 730}
{"info/global_step": 731, "train_info/time_within_train_step": 32.71511363983154, "step": 731}
{"train_info/time_between_train_steps": 0.00531005859375, "step": 731}
{"info/global_step": 732, "train_info/time_within_train_step": 32.48707389831543, "step": 732}
{"train_info/time_between_train_steps": 0.010630369186401367, "step": 732}
{"info/global_step": 733, "train_info/time_within_train_step": 32.7985463142395, "step": 733}
{"train_info/time_between_train_steps": 0.010855436325073242, "step": 733}
{"info/global_step": 734, "train_info/time_within_train_step": 32.64852333068848, "step": 734}
{"train_info/time_between_train_steps": 0.005318641662597656, "step": 734}
{"info/global_step": 735, "train_info/time_within_train_step": 32.794827699661255, "step": 735}
{"train_info/time_between_train_steps": 0.005472660064697266, "step": 735}
{"info/global_step": 736, "train_info/time_within_train_step": 31.964749336242676, "step": 736}
{"train_info/time_between_train_steps": 0.010501384735107422, "step": 736}
{"info/global_step": 737, "train_info/time_within_train_step": 32.60079503059387, "step": 737}
{"train_info/time_between_train_steps": 0.005327701568603516, "step": 737}
{"info/global_step": 738, "train_info/time_within_train_step": 32.382102727890015, "step": 738}
{"train_info/time_between_train_steps": 0.0051805973052978516, "step": 738}
{"info/global_step": 739, "train_info/time_within_train_step": 32.473018646240234, "step": 739}
{"train_info/time_between_train_steps": 0.0049686431884765625, "step": 739}
{"info/global_step": 740, "train_info/time_within_train_step": 32.407307863235474, "step": 740}
{"train_info/time_between_train_steps": 0.005136013031005859, "step": 740}
{"info/global_step": 741, "train_info/time_within_train_step": 32.41839003562927, "step": 741}
{"train_info/time_between_train_steps": 0.010098457336425781, "step": 741}
{"info/global_step": 742, "train_info/time_within_train_step": 32.6395845413208, "step": 742}
{"train_info/time_between_train_steps": 0.005303382873535156, "step": 742}
{"info/global_step": 743, "train_info/time_within_train_step": 31.946213245391846, "step": 743}
{"train_info/time_between_train_steps": 0.005181074142456055, "step": 743}
{"info/global_step": 744, "train_info/time_within_train_step": 32.40825009346008, "step": 744}
{"train_info/time_between_train_steps": 0.0051727294921875, "step": 744}
{"info/global_step": 745, "train_info/time_within_train_step": 32.53759956359863, "step": 745}
{"train_info/time_between_train_steps": 0.005342006683349609, "step": 745}
{"info/global_step": 746, "train_info/time_within_train_step": 32.364909410476685, "step": 746}
{"train_info/time_between_train_steps": 0.007602691650390625, "step": 746}
{"info/global_step": 747, "train_info/time_within_train_step": 32.49809646606445, "step": 747}
{"train_info/time_between_train_steps": 0.010286331176757812, "step": 747}
{"info/global_step": 748, "train_info/time_within_train_step": 32.49128484725952, "step": 748}
{"train_info/time_between_train_steps": 0.0052564144134521484, "step": 748}
{"info/global_step": 749, "train_info/time_within_train_step": 32.935436487197876, "step": 749}
{"train_info/time_between_train_steps": 0.015002965927124023, "step": 749}
{"info/global_step": 750, "train_info/time_within_train_step": 32.27275037765503, "step": 750}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1733712493, "_runtime": 24999}, "step": 750}
{"logs": {"train/loss": 3.4848, "train/learning_rate": 0.00025, "train/epoch": 27.02, "_timestamp": 1733712493, "_runtime": 24999}, "step": 750}
{"train_info/time_between_train_steps": 0.006837129592895508, "step": 750}
{"info/global_step": 751, "train_info/time_within_train_step": 32.14133930206299, "step": 751}
{"train_info/time_between_train_steps": 0.005226850509643555, "step": 751}
{"info/global_step": 752, "train_info/time_within_train_step": 32.41930103302002, "step": 752}
{"train_info/time_between_train_steps": 0.007897377014160156, "step": 752}
{"info/global_step": 753, "train_info/time_within_train_step": 32.36186337471008, "step": 753}
{"train_info/time_between_train_steps": 0.008090734481811523, "step": 753}
{"info/global_step": 754, "train_info/time_within_train_step": 32.51436161994934, "step": 754}
{"train_info/time_between_train_steps": 0.005448579788208008, "step": 754}
{"info/global_step": 755, "train_info/time_within_train_step": 32.72221851348877, "step": 755}
{"train_info/time_between_train_steps": 0.005722999572753906, "step": 755}
{"info/global_step": 756, "train_info/time_within_train_step": 32.492804527282715, "step": 756}
{"train_info/time_between_train_steps": 0.005878448486328125, "step": 756}
{"train_info/time_between_train_steps": 24.146040201187134, "step": 756}
{"info/global_step": 757, "train_info/time_within_train_step": 32.211318254470825, "step": 757}
{"train_info/time_between_train_steps": 0.006867170333862305, "step": 757}
{"info/global_step": 758, "train_info/time_within_train_step": 32.57872128486633, "step": 758}
{"train_info/time_between_train_steps": 0.007745027542114258, "step": 758}
{"info/global_step": 759, "train_info/time_within_train_step": 32.48437023162842, "step": 759}
{"train_info/time_between_train_steps": 0.005853414535522461, "step": 759}
{"info/global_step": 760, "train_info/time_within_train_step": 32.74918842315674, "step": 760}
{"train_info/time_between_train_steps": 0.006460428237915039, "step": 760}
{"info/global_step": 761, "train_info/time_within_train_step": 32.48019886016846, "step": 761}
{"train_info/time_between_train_steps": 0.007110595703125, "step": 761}
{"info/global_step": 762, "train_info/time_within_train_step": 32.82930850982666, "step": 762}
{"train_info/time_between_train_steps": 0.010886669158935547, "step": 762}
{"info/global_step": 763, "train_info/time_within_train_step": 32.20129156112671, "step": 763}
{"train_info/time_between_train_steps": 0.008211851119995117, "step": 763}
{"info/global_step": 764, "train_info/time_within_train_step": 32.32586455345154, "step": 764}
{"train_info/time_between_train_steps": 0.0110931396484375, "step": 764}
{"info/global_step": 765, "train_info/time_within_train_step": 32.26052713394165, "step": 765}
{"train_info/time_between_train_steps": 0.005487918853759766, "step": 765}
{"info/global_step": 766, "train_info/time_within_train_step": 32.34680771827698, "step": 766}
{"train_info/time_between_train_steps": 0.005541563034057617, "step": 766}
{"info/global_step": 767, "train_info/time_within_train_step": 32.548335790634155, "step": 767}
{"train_info/time_between_train_steps": 0.005511760711669922, "step": 767}
{"info/global_step": 768, "train_info/time_within_train_step": 32.27015423774719, "step": 768}
{"train_info/time_between_train_steps": 0.0055904388427734375, "step": 768}
{"info/global_step": 769, "train_info/time_within_train_step": 32.5438277721405, "step": 769}
{"train_info/time_between_train_steps": 0.005470752716064453, "step": 769}
{"info/global_step": 770, "train_info/time_within_train_step": 32.504576444625854, "step": 770}
{"train_info/time_between_train_steps": 0.005542755126953125, "step": 770}
{"info/global_step": 771, "train_info/time_within_train_step": 32.239322662353516, "step": 771}
{"train_info/time_between_train_steps": 0.005377769470214844, "step": 771}
{"info/global_step": 772, "train_info/time_within_train_step": 32.65068745613098, "step": 772}
{"train_info/time_between_train_steps": 0.005631923675537109, "step": 772}
{"info/global_step": 773, "train_info/time_within_train_step": 32.51042366027832, "step": 773}
{"train_info/time_between_train_steps": 0.005625486373901367, "step": 773}
{"info/global_step": 774, "train_info/time_within_train_step": 32.46188497543335, "step": 774}
{"train_info/time_between_train_steps": 0.0057485103607177734, "step": 774}
{"info/global_step": 775, "train_info/time_within_train_step": 32.40325999259949, "step": 775}
{"train_info/time_between_train_steps": 0.005670309066772461, "step": 775}
{"info/global_step": 776, "train_info/time_within_train_step": 32.71456861495972, "step": 776}
{"train_info/time_between_train_steps": 0.0055980682373046875, "step": 776}
{"info/global_step": 777, "train_info/time_within_train_step": 32.636120080947876, "step": 777}
{"train_info/time_between_train_steps": 0.010567426681518555, "step": 777}
{"info/global_step": 778, "train_info/time_within_train_step": 32.60882258415222, "step": 778}
{"train_info/time_between_train_steps": 0.005349874496459961, "step": 778}
{"info/global_step": 779, "train_info/time_within_train_step": 31.84713864326477, "step": 779}
{"train_info/time_between_train_steps": 0.005542755126953125, "step": 779}
{"info/global_step": 780, "train_info/time_within_train_step": 32.728596448898315, "step": 780}
{"train_info/time_between_train_steps": 0.005808353424072266, "step": 780}
{"info/global_step": 781, "train_info/time_within_train_step": 32.5321786403656, "step": 781}
{"train_info/time_between_train_steps": 0.005647897720336914, "step": 781}
{"info/global_step": 782, "train_info/time_within_train_step": 32.50989556312561, "step": 782}
{"train_info/time_between_train_steps": 0.006132364273071289, "step": 782}
{"info/global_step": 783, "train_info/time_within_train_step": 32.615535736083984, "step": 783}
{"train_info/time_between_train_steps": 0.006143808364868164, "step": 783}
{"train_info/time_between_train_steps": 23.646003007888794, "step": 783}
{"info/global_step": 784, "train_info/time_within_train_step": 32.543455600738525, "step": 784}
{"train_info/time_between_train_steps": 0.004987001419067383, "step": 784}
{"info/global_step": 785, "train_info/time_within_train_step": 32.16252541542053, "step": 785}
{"train_info/time_between_train_steps": 0.005273342132568359, "step": 785}
{"info/global_step": 786, "train_info/time_within_train_step": 32.39443349838257, "step": 786}
{"train_info/time_between_train_steps": 0.005320310592651367, "step": 786}
{"info/global_step": 787, "train_info/time_within_train_step": 32.58642506599426, "step": 787}
{"train_info/time_between_train_steps": 0.005274057388305664, "step": 787}
{"info/global_step": 788, "train_info/time_within_train_step": 32.6928985118866, "step": 788}
{"train_info/time_between_train_steps": 0.005068778991699219, "step": 788}
{"info/global_step": 789, "train_info/time_within_train_step": 32.651238441467285, "step": 789}
{"train_info/time_between_train_steps": 0.0050487518310546875, "step": 789}
{"info/global_step": 790, "train_info/time_within_train_step": 32.64600968360901, "step": 790}
{"train_info/time_between_train_steps": 0.005198001861572266, "step": 790}
{"info/global_step": 791, "train_info/time_within_train_step": 32.224194288253784, "step": 791}
{"train_info/time_between_train_steps": 0.007956504821777344, "step": 791}
{"info/global_step": 792, "train_info/time_within_train_step": 32.77102780342102, "step": 792}
{"train_info/time_between_train_steps": 0.005070686340332031, "step": 792}
{"info/global_step": 793, "train_info/time_within_train_step": 31.80497097969055, "step": 793}
{"train_info/time_between_train_steps": 0.004897594451904297, "step": 793}
{"info/global_step": 794, "train_info/time_within_train_step": 32.33507061004639, "step": 794}
{"train_info/time_between_train_steps": 0.0051615238189697266, "step": 794}
{"info/global_step": 795, "train_info/time_within_train_step": 32.40431308746338, "step": 795}
{"train_info/time_between_train_steps": 0.005110502243041992, "step": 795}
{"info/global_step": 796, "train_info/time_within_train_step": 32.3048574924469, "step": 796}
{"train_info/time_between_train_steps": 0.010992288589477539, "step": 796}
{"info/global_step": 797, "train_info/time_within_train_step": 32.43628549575806, "step": 797}
{"train_info/time_between_train_steps": 0.006363391876220703, "step": 797}
{"info/global_step": 798, "train_info/time_within_train_step": 32.599406003952026, "step": 798}
{"train_info/time_between_train_steps": 0.005022525787353516, "step": 798}
{"info/global_step": 799, "train_info/time_within_train_step": 32.35516977310181, "step": 799}
{"train_info/time_between_train_steps": 0.0051152706146240234, "step": 799}
{"info/global_step": 800, "train_info/time_within_train_step": 32.189016819000244, "step": 800}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1733714164, "_runtime": 26670}, "step": 800}
{"logs": {"train/loss": 3.4156, "train/learning_rate": 0.00022222222222222218, "train/epoch": 29.01, "_timestamp": 1733714164, "_runtime": 26670}, "step": 800}
{"train_info/time_between_train_steps": 2.268095016479492, "step": 800}
{"info/global_step": 801, "train_info/time_within_train_step": 32.41162610054016, "step": 801}
{"train_info/time_between_train_steps": 0.005146503448486328, "step": 801}
{"info/global_step": 802, "train_info/time_within_train_step": 32.48994970321655, "step": 802}
{"train_info/time_between_train_steps": 0.004967212677001953, "step": 802}
{"info/global_step": 803, "train_info/time_within_train_step": 32.47915291786194, "step": 803}
{"train_info/time_between_train_steps": 0.005116462707519531, "step": 803}
{"info/global_step": 804, "train_info/time_within_train_step": 32.49193024635315, "step": 804}
{"train_info/time_between_train_steps": 0.005156278610229492, "step": 804}
{"info/global_step": 805, "train_info/time_within_train_step": 32.61993670463562, "step": 805}
{"train_info/time_between_train_steps": 0.010245323181152344, "step": 805}
{"info/global_step": 806, "train_info/time_within_train_step": 32.546905517578125, "step": 806}
{"train_info/time_between_train_steps": 0.004994630813598633, "step": 806}
{"info/global_step": 807, "train_info/time_within_train_step": 32.66219162940979, "step": 807}
{"train_info/time_between_train_steps": 0.005543947219848633, "step": 807}
{"info/global_step": 808, "train_info/time_within_train_step": 32.1696891784668, "step": 808}
{"train_info/time_between_train_steps": 0.0051648616790771484, "step": 808}
{"info/global_step": 809, "train_info/time_within_train_step": 32.17286992073059, "step": 809}
{"train_info/time_between_train_steps": 0.0054547786712646484, "step": 809}
{"info/global_step": 810, "train_info/time_within_train_step": 32.44469213485718, "step": 810}
{"train_info/time_between_train_steps": 0.00579833984375, "step": 810}
{"train_info/time_between_train_steps": 23.672747373580933, "step": 810}
{"info/global_step": 811, "train_info/time_within_train_step": 32.48373985290527, "step": 811}
{"train_info/time_between_train_steps": 0.005694866180419922, "step": 811}
{"info/global_step": 812, "train_info/time_within_train_step": 32.93838596343994, "step": 812}
{"train_info/time_between_train_steps": 0.0053653717041015625, "step": 812}
{"info/global_step": 813, "train_info/time_within_train_step": 32.58504629135132, "step": 813}
{"train_info/time_between_train_steps": 0.005524635314941406, "step": 813}
{"info/global_step": 814, "train_info/time_within_train_step": 32.71716380119324, "step": 814}
{"train_info/time_between_train_steps": 0.005417346954345703, "step": 814}
{"info/global_step": 815, "train_info/time_within_train_step": 31.931135654449463, "step": 815}
{"train_info/time_between_train_steps": 0.010546445846557617, "step": 815}
{"info/global_step": 816, "train_info/time_within_train_step": 32.42357635498047, "step": 816}
{"train_info/time_between_train_steps": 0.010437965393066406, "step": 816}
{"info/global_step": 817, "train_info/time_within_train_step": 32.51816654205322, "step": 817}
{"train_info/time_between_train_steps": 0.005338430404663086, "step": 817}
{"info/global_step": 818, "train_info/time_within_train_step": 32.570895195007324, "step": 818}
{"train_info/time_between_train_steps": 0.007853031158447266, "step": 818}
{"info/global_step": 819, "train_info/time_within_train_step": 32.42621088027954, "step": 819}
{"train_info/time_between_train_steps": 0.005198240280151367, "step": 819}
{"info/global_step": 820, "train_info/time_within_train_step": 32.27071762084961, "step": 820}
{"train_info/time_between_train_steps": 0.007775783538818359, "step": 820}
{"info/global_step": 821, "train_info/time_within_train_step": 32.587419509887695, "step": 821}
{"train_info/time_between_train_steps": 0.005063056945800781, "step": 821}
{"info/global_step": 822, "train_info/time_within_train_step": 32.17259669303894, "step": 822}
{"train_info/time_between_train_steps": 0.005149126052856445, "step": 822}
{"info/global_step": 823, "train_info/time_within_train_step": 32.11752486228943, "step": 823}
{"train_info/time_between_train_steps": 0.004948139190673828, "step": 823}
{"info/global_step": 824, "train_info/time_within_train_step": 32.449918031692505, "step": 824}
{"train_info/time_between_train_steps": 0.005199909210205078, "step": 824}
{"info/global_step": 825, "train_info/time_within_train_step": 32.78828549385071, "step": 825}
{"train_info/time_between_train_steps": 0.005175113677978516, "step": 825}
{"info/global_step": 826, "train_info/time_within_train_step": 32.4407320022583, "step": 826}
{"train_info/time_between_train_steps": 0.00698399543762207, "step": 826}
{"info/global_step": 827, "train_info/time_within_train_step": 32.65528345108032, "step": 827}
{"train_info/time_between_train_steps": 0.007183551788330078, "step": 827}
{"info/global_step": 828, "train_info/time_within_train_step": 32.40084958076477, "step": 828}
{"train_info/time_between_train_steps": 0.0051419734954833984, "step": 828}
{"info/global_step": 829, "train_info/time_within_train_step": 32.89570927619934, "step": 829}
{"train_info/time_between_train_steps": 0.005194902420043945, "step": 829}
{"info/global_step": 830, "train_info/time_within_train_step": 32.106022119522095, "step": 830}
{"train_info/time_between_train_steps": 0.005157470703125, "step": 830}
{"info/global_step": 831, "train_info/time_within_train_step": 32.58066511154175, "step": 831}
{"train_info/time_between_train_steps": 0.005244731903076172, "step": 831}
{"info/global_step": 832, "train_info/time_within_train_step": 32.32497596740723, "step": 832}
{"train_info/time_between_train_steps": 0.0052242279052734375, "step": 832}
{"info/global_step": 833, "train_info/time_within_train_step": 32.559855461120605, "step": 833}
{"train_info/time_between_train_steps": 0.005136013031005859, "step": 833}
{"info/global_step": 834, "train_info/time_within_train_step": 32.48972129821777, "step": 834}
{"train_info/time_between_train_steps": 0.01064920425415039, "step": 834}
{"info/global_step": 835, "train_info/time_within_train_step": 32.521597385406494, "step": 835}
{"train_info/time_between_train_steps": 0.005265235900878906, "step": 835}
{"info/global_step": 836, "train_info/time_within_train_step": 32.828386306762695, "step": 836}
{"train_info/time_between_train_steps": 0.005460977554321289, "step": 836}
{"info/global_step": 837, "train_info/time_within_train_step": 32.43342995643616, "step": 837}
{"train_info/time_between_train_steps": 0.007695198059082031, "step": 837}
{"train_info/time_between_train_steps": 23.204593896865845, "step": 837}
{"info/global_step": 838, "train_info/time_within_train_step": 32.31437635421753, "step": 838}
{"train_info/time_between_train_steps": 0.005432844161987305, "step": 838}
{"info/global_step": 839, "train_info/time_within_train_step": 32.95900774002075, "step": 839}
{"train_info/time_between_train_steps": 0.0053675174713134766, "step": 839}
{"info/global_step": 840, "train_info/time_within_train_step": 32.74088430404663, "step": 840}
{"train_info/time_between_train_steps": 0.005291461944580078, "step": 840}
{"info/global_step": 841, "train_info/time_within_train_step": 32.74388289451599, "step": 841}
{"train_info/time_between_train_steps": 0.005780458450317383, "step": 841}
{"info/global_step": 842, "train_info/time_within_train_step": 32.64457368850708, "step": 842}
{"train_info/time_between_train_steps": 0.010757684707641602, "step": 842}
{"info/global_step": 843, "train_info/time_within_train_step": 32.68096685409546, "step": 843}
{"train_info/time_between_train_steps": 0.0072858333587646484, "step": 843}
{"info/global_step": 844, "train_info/time_within_train_step": 32.568809509277344, "step": 844}
{"train_info/time_between_train_steps": 0.010593652725219727, "step": 844}
{"info/global_step": 845, "train_info/time_within_train_step": 31.97560167312622, "step": 845}
{"train_info/time_between_train_steps": 0.005311489105224609, "step": 845}
{"info/global_step": 846, "train_info/time_within_train_step": 32.70095467567444, "step": 846}
{"train_info/time_between_train_steps": 0.005233287811279297, "step": 846}
{"info/global_step": 847, "train_info/time_within_train_step": 32.304877519607544, "step": 847}
{"train_info/time_between_train_steps": 0.008440017700195312, "step": 847}
{"info/global_step": 848, "train_info/time_within_train_step": 32.425047159194946, "step": 848}
{"train_info/time_between_train_steps": 0.005095005035400391, "step": 848}
{"info/global_step": 849, "train_info/time_within_train_step": 32.45704197883606, "step": 849}
{"train_info/time_between_train_steps": 0.0061037540435791016, "step": 849}
{"info/global_step": 850, "train_info/time_within_train_step": 32.46825170516968, "step": 850}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1733715838, "_runtime": 28344}, "step": 850}
{"logs": {"train/loss": 3.3545, "train/learning_rate": 0.00019444444444444443, "train/epoch": 31.01, "_timestamp": 1733715838, "_runtime": 28344}, "step": 850}
{"train_info/time_between_train_steps": 0.007602691650390625, "step": 850}
{"info/global_step": 851, "train_info/time_within_train_step": 32.64733266830444, "step": 851}
{"train_info/time_between_train_steps": 0.00509953498840332, "step": 851}
{"info/global_step": 852, "train_info/time_within_train_step": 31.948456048965454, "step": 852}
{"train_info/time_between_train_steps": 0.005088329315185547, "step": 852}
{"info/global_step": 853, "train_info/time_within_train_step": 32.55630445480347, "step": 853}
{"train_info/time_between_train_steps": 0.005186796188354492, "step": 853}
{"info/global_step": 854, "train_info/time_within_train_step": 32.44357109069824, "step": 854}
{"train_info/time_between_train_steps": 0.007970333099365234, "step": 854}
{"info/global_step": 855, "train_info/time_within_train_step": 32.45625185966492, "step": 855}
{"train_info/time_between_train_steps": 0.006945133209228516, "step": 855}
{"info/global_step": 856, "train_info/time_within_train_step": 32.69664120674133, "step": 856}
{"train_info/time_between_train_steps": 0.014968156814575195, "step": 856}
{"info/global_step": 857, "train_info/time_within_train_step": 32.57198929786682, "step": 857}
{"train_info/time_between_train_steps": 0.0050737857818603516, "step": 857}
{"info/global_step": 858, "train_info/time_within_train_step": 32.53890514373779, "step": 858}
{"train_info/time_between_train_steps": 0.005248069763183594, "step": 858}
{"info/global_step": 859, "train_info/time_within_train_step": 32.59367322921753, "step": 859}
{"train_info/time_between_train_steps": 0.005057811737060547, "step": 859}
{"info/global_step": 860, "train_info/time_within_train_step": 32.25776934623718, "step": 860}
{"train_info/time_between_train_steps": 0.005410432815551758, "step": 860}
{"info/global_step": 861, "train_info/time_within_train_step": 32.48209881782532, "step": 861}
{"train_info/time_between_train_steps": 0.005389690399169922, "step": 861}
{"info/global_step": 862, "train_info/time_within_train_step": 32.46128726005554, "step": 862}
{"train_info/time_between_train_steps": 0.005288124084472656, "step": 862}
{"info/global_step": 863, "train_info/time_within_train_step": 32.65105843544006, "step": 863}
{"train_info/time_between_train_steps": 0.005806922912597656, "step": 863}
{"info/global_step": 864, "train_info/time_within_train_step": 32.52425956726074, "step": 864}
{"train_info/time_between_train_steps": 0.005732059478759766, "step": 864}
{"train_info/time_between_train_steps": 23.791876792907715, "step": 864}
{"info/global_step": 865, "train_info/time_within_train_step": 32.86532139778137, "step": 865}
{"train_info/time_between_train_steps": 0.005631685256958008, "step": 865}
{"info/global_step": 866, "train_info/time_within_train_step": 32.80469751358032, "step": 866}
{"train_info/time_between_train_steps": 0.005388021469116211, "step": 866}
{"info/global_step": 867, "train_info/time_within_train_step": 31.885228157043457, "step": 867}
{"train_info/time_between_train_steps": 0.005275726318359375, "step": 867}
{"info/global_step": 868, "train_info/time_within_train_step": 32.573830366134644, "step": 868}
{"train_info/time_between_train_steps": 0.0057201385498046875, "step": 868}
{"info/global_step": 869, "train_info/time_within_train_step": 32.480900287628174, "step": 869}
{"train_info/time_between_train_steps": 0.015213966369628906, "step": 869}
{"info/global_step": 870, "train_info/time_within_train_step": 32.41304039955139, "step": 870}
{"train_info/time_between_train_steps": 0.005285024642944336, "step": 870}
{"info/global_step": 871, "train_info/time_within_train_step": 32.671127796173096, "step": 871}
{"train_info/time_between_train_steps": 0.0055425167083740234, "step": 871}
{"info/global_step": 872, "train_info/time_within_train_step": 32.50855541229248, "step": 872}
{"train_info/time_between_train_steps": 0.005263805389404297, "step": 872}
{"info/global_step": 873, "train_info/time_within_train_step": 32.986161947250366, "step": 873}
{"train_info/time_between_train_steps": 0.005110025405883789, "step": 873}
{"info/global_step": 874, "train_info/time_within_train_step": 32.44510221481323, "step": 874}
{"train_info/time_between_train_steps": 0.00502777099609375, "step": 874}
{"info/global_step": 875, "train_info/time_within_train_step": 32.18052840232849, "step": 875}
{"train_info/time_between_train_steps": 0.0051343441009521484, "step": 875}
{"info/global_step": 876, "train_info/time_within_train_step": 32.39034342765808, "step": 876}
{"train_info/time_between_train_steps": 0.006602764129638672, "step": 876}
{"info/global_step": 877, "train_info/time_within_train_step": 32.245473861694336, "step": 877}
{"train_info/time_between_train_steps": 0.00514984130859375, "step": 877}
{"info/global_step": 878, "train_info/time_within_train_step": 32.364757776260376, "step": 878}
{"train_info/time_between_train_steps": 0.005101442337036133, "step": 878}
{"info/global_step": 879, "train_info/time_within_train_step": 32.7714364528656, "step": 879}
{"train_info/time_between_train_steps": 0.010118246078491211, "step": 879}
{"info/global_step": 880, "train_info/time_within_train_step": 32.49197483062744, "step": 880}
{"train_info/time_between_train_steps": 0.005464315414428711, "step": 880}
{"info/global_step": 881, "train_info/time_within_train_step": 32.47060585021973, "step": 881}
{"train_info/time_between_train_steps": 0.005196571350097656, "step": 881}
{"info/global_step": 882, "train_info/time_within_train_step": 32.53708457946777, "step": 882}
{"train_info/time_between_train_steps": 0.00510859489440918, "step": 882}
{"info/global_step": 883, "train_info/time_within_train_step": 32.5540771484375, "step": 883}
{"train_info/time_between_train_steps": 0.005009174346923828, "step": 883}
{"info/global_step": 884, "train_info/time_within_train_step": 31.995529174804688, "step": 884}
{"train_info/time_between_train_steps": 0.007208824157714844, "step": 884}
{"info/global_step": 885, "train_info/time_within_train_step": 32.44480872154236, "step": 885}
{"train_info/time_between_train_steps": 0.005410909652709961, "step": 885}
{"info/global_step": 886, "train_info/time_within_train_step": 32.55380415916443, "step": 886}
{"train_info/time_between_train_steps": 0.005126237869262695, "step": 886}
{"info/global_step": 887, "train_info/time_within_train_step": 32.58128643035889, "step": 887}
{"train_info/time_between_train_steps": 0.00525355339050293, "step": 887}
{"info/global_step": 888, "train_info/time_within_train_step": 32.62696814537048, "step": 888}
{"train_info/time_between_train_steps": 0.005379438400268555, "step": 888}
{"info/global_step": 889, "train_info/time_within_train_step": 32.51409435272217, "step": 889}
{"train_info/time_between_train_steps": 0.006944894790649414, "step": 889}
{"info/global_step": 890, "train_info/time_within_train_step": 32.346240758895874, "step": 890}
{"train_info/time_between_train_steps": 0.011051416397094727, "step": 890}
{"info/global_step": 891, "train_info/time_within_train_step": 32.76000356674194, "step": 891}
{"train_info/time_between_train_steps": 0.005516529083251953, "step": 891}
{"train_info/time_between_train_steps": 22.998522996902466, "step": 891}
{"info/global_step": 892, "train_info/time_within_train_step": 32.21951222419739, "step": 892}
{"train_info/time_between_train_steps": 0.005073070526123047, "step": 892}
{"info/global_step": 893, "train_info/time_within_train_step": 32.87835097312927, "step": 893}
{"train_info/time_between_train_steps": 0.005246400833129883, "step": 893}
{"info/global_step": 894, "train_info/time_within_train_step": 32.59360074996948, "step": 894}
{"train_info/time_between_train_steps": 0.005251407623291016, "step": 894}
{"info/global_step": 895, "train_info/time_within_train_step": 32.69844961166382, "step": 895}
{"train_info/time_between_train_steps": 0.005433559417724609, "step": 895}
{"info/global_step": 896, "train_info/time_within_train_step": 32.501606702804565, "step": 896}
{"train_info/time_between_train_steps": 0.005624532699584961, "step": 896}
{"info/global_step": 897, "train_info/time_within_train_step": 32.70530557632446, "step": 897}
{"train_info/time_between_train_steps": 0.005372285842895508, "step": 897}
{"info/global_step": 898, "train_info/time_within_train_step": 32.56519174575806, "step": 898}
{"train_info/time_between_train_steps": 0.005522727966308594, "step": 898}
{"info/global_step": 899, "train_info/time_within_train_step": 32.183783531188965, "step": 899}
{"train_info/time_between_train_steps": 0.005433320999145508, "step": 899}
{"info/global_step": 900, "train_info/time_within_train_step": 32.42416071891785, "step": 900}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1733717510, "_runtime": 30016}, "step": 900}
{"logs": {"train/loss": 3.2965, "train/learning_rate": 0.00016666666666666666, "train/epoch": 33.01, "_timestamp": 1733717510, "_runtime": 30016}, "step": 900}
{"train_info/time_between_train_steps": 2.2783498764038086, "step": 900}
{"info/global_step": 901, "train_info/time_within_train_step": 32.523646116256714, "step": 901}
{"train_info/time_between_train_steps": 0.005196571350097656, "step": 901}
{"info/global_step": 902, "train_info/time_within_train_step": 32.703144788742065, "step": 902}
{"train_info/time_between_train_steps": 0.005123615264892578, "step": 902}
{"info/global_step": 903, "train_info/time_within_train_step": 32.284706592559814, "step": 903}
{"train_info/time_between_train_steps": 0.005118846893310547, "step": 903}
{"info/global_step": 904, "train_info/time_within_train_step": 32.639381408691406, "step": 904}
{"train_info/time_between_train_steps": 0.0050182342529296875, "step": 904}
{"info/global_step": 905, "train_info/time_within_train_step": 32.54836082458496, "step": 905}
{"train_info/time_between_train_steps": 0.01007533073425293, "step": 905}
{"info/global_step": 906, "train_info/time_within_train_step": 32.55677509307861, "step": 906}
{"train_info/time_between_train_steps": 0.0050199031829833984, "step": 906}
{"info/global_step": 907, "train_info/time_within_train_step": 32.18478727340698, "step": 907}
{"train_info/time_between_train_steps": 0.009745597839355469, "step": 907}
{"info/global_step": 908, "train_info/time_within_train_step": 32.291752099990845, "step": 908}
{"train_info/time_between_train_steps": 0.005086660385131836, "step": 908}
{"info/global_step": 909, "train_info/time_within_train_step": 32.21616816520691, "step": 909}
{"train_info/time_between_train_steps": 0.010016679763793945, "step": 909}
{"info/global_step": 910, "train_info/time_within_train_step": 32.202855587005615, "step": 910}
{"train_info/time_between_train_steps": 0.0053327083587646484, "step": 910}
{"info/global_step": 911, "train_info/time_within_train_step": 32.361475467681885, "step": 911}
{"train_info/time_between_train_steps": 0.005307912826538086, "step": 911}
{"info/global_step": 912, "train_info/time_within_train_step": 32.70781970024109, "step": 912}
{"train_info/time_between_train_steps": 0.007096767425537109, "step": 912}
{"info/global_step": 913, "train_info/time_within_train_step": 32.66788458824158, "step": 913}
{"train_info/time_between_train_steps": 0.005056619644165039, "step": 913}
{"info/global_step": 914, "train_info/time_within_train_step": 32.610586166381836, "step": 914}
{"train_info/time_between_train_steps": 0.0050966739654541016, "step": 914}
{"info/global_step": 915, "train_info/time_within_train_step": 32.26998567581177, "step": 915}
{"train_info/time_between_train_steps": 0.00560307502746582, "step": 915}
{"info/global_step": 916, "train_info/time_within_train_step": 32.422643423080444, "step": 916}
{"train_info/time_between_train_steps": 0.00534510612487793, "step": 916}
{"info/global_step": 917, "train_info/time_within_train_step": 32.61089301109314, "step": 917}
{"train_info/time_between_train_steps": 0.005887269973754883, "step": 917}
{"info/global_step": 918, "train_info/time_within_train_step": 32.33305025100708, "step": 918}
{"train_info/time_between_train_steps": 0.005669832229614258, "step": 918}
{"train_info/time_between_train_steps": 23.26143217086792, "step": 918}
{"info/global_step": 919, "train_info/time_within_train_step": 32.40241003036499, "step": 919}
{"train_info/time_between_train_steps": 0.0055997371673583984, "step": 919}
{"info/global_step": 920, "train_info/time_within_train_step": 32.70798087120056, "step": 920}
{"train_info/time_between_train_steps": 0.005505800247192383, "step": 920}
{"info/global_step": 921, "train_info/time_within_train_step": 32.531848192214966, "step": 921}
{"train_info/time_between_train_steps": 0.005646944046020508, "step": 921}
{"info/global_step": 922, "train_info/time_within_train_step": 32.82938504219055, "step": 922}
{"train_info/time_between_train_steps": 0.005193948745727539, "step": 922}
{"info/global_step": 923, "train_info/time_within_train_step": 32.26529812812805, "step": 923}
{"train_info/time_between_train_steps": 0.01078486442565918, "step": 923}
{"info/global_step": 924, "train_info/time_within_train_step": 32.48995614051819, "step": 924}
{"train_info/time_between_train_steps": 0.007321834564208984, "step": 924}
{"info/global_step": 925, "train_info/time_within_train_step": 32.893611669540405, "step": 925}
{"train_info/time_between_train_steps": 0.005606651306152344, "step": 925}
{"info/global_step": 926, "train_info/time_within_train_step": 32.38892388343811, "step": 926}
{"train_info/time_between_train_steps": 0.014448881149291992, "step": 926}
{"info/global_step": 927, "train_info/time_within_train_step": 32.633195877075195, "step": 927}
{"train_info/time_between_train_steps": 0.0052068233489990234, "step": 927}
{"info/global_step": 928, "train_info/time_within_train_step": 32.690566539764404, "step": 928}
{"train_info/time_between_train_steps": 0.014949560165405273, "step": 928}
{"info/global_step": 929, "train_info/time_within_train_step": 32.66166830062866, "step": 929}
{"train_info/time_between_train_steps": 0.005108833312988281, "step": 929}
{"info/global_step": 930, "train_info/time_within_train_step": 32.630017042160034, "step": 930}
{"train_info/time_between_train_steps": 0.005137205123901367, "step": 930}
{"info/global_step": 931, "train_info/time_within_train_step": 32.172731161117554, "step": 931}
{"train_info/time_between_train_steps": 0.004987239837646484, "step": 931}
{"info/global_step": 932, "train_info/time_within_train_step": 32.58189606666565, "step": 932}
{"train_info/time_between_train_steps": 0.006976127624511719, "step": 932}
{"info/global_step": 933, "train_info/time_within_train_step": 32.52791953086853, "step": 933}
{"train_info/time_between_train_steps": 0.005226612091064453, "step": 933}
{"info/global_step": 934, "train_info/time_within_train_step": 32.41498327255249, "step": 934}
{"train_info/time_between_train_steps": 0.007987022399902344, "step": 934}
{"info/global_step": 935, "train_info/time_within_train_step": 32.52536725997925, "step": 935}
{"train_info/time_between_train_steps": 0.00635838508605957, "step": 935}
{"info/global_step": 936, "train_info/time_within_train_step": 32.378475189208984, "step": 936}
{"train_info/time_between_train_steps": 0.007546186447143555, "step": 936}
{"info/global_step": 937, "train_info/time_within_train_step": 32.74300932884216, "step": 937}
{"train_info/time_between_train_steps": 0.015531778335571289, "step": 937}
{"info/global_step": 938, "train_info/time_within_train_step": 32.44277596473694, "step": 938}
{"train_info/time_between_train_steps": 0.005238533020019531, "step": 938}
{"info/global_step": 939, "train_info/time_within_train_step": 32.69988536834717, "step": 939}
{"train_info/time_between_train_steps": 0.014899253845214844, "step": 939}
{"info/global_step": 940, "train_info/time_within_train_step": 32.1705048084259, "step": 940}
{"train_info/time_between_train_steps": 0.005118131637573242, "step": 940}
{"info/global_step": 941, "train_info/time_within_train_step": 32.47202754020691, "step": 941}
{"train_info/time_between_train_steps": 0.005076885223388672, "step": 941}
{"info/global_step": 942, "train_info/time_within_train_step": 32.5032262802124, "step": 942}
{"train_info/time_between_train_steps": 0.005333900451660156, "step": 942}
{"info/global_step": 943, "train_info/time_within_train_step": 32.52987456321716, "step": 943}
{"train_info/time_between_train_steps": 0.005446434020996094, "step": 943}
{"info/global_step": 944, "train_info/time_within_train_step": 32.434932470321655, "step": 944}
{"train_info/time_between_train_steps": 0.010574102401733398, "step": 944}
{"info/global_step": 945, "train_info/time_within_train_step": 32.51602864265442, "step": 945}
{"train_info/time_between_train_steps": 0.005877494812011719, "step": 945}
{"train_info/time_between_train_steps": 23.639437198638916, "step": 945}
{"info/global_step": 946, "train_info/time_within_train_step": 32.33186984062195, "step": 946}
{"train_info/time_between_train_steps": 0.007529020309448242, "step": 946}
{"info/global_step": 947, "train_info/time_within_train_step": 32.933197021484375, "step": 947}
{"train_info/time_between_train_steps": 0.010409832000732422, "step": 947}
{"info/global_step": 948, "train_info/time_within_train_step": 32.08270525932312, "step": 948}
{"train_info/time_between_train_steps": 0.005202770233154297, "step": 948}
{"info/global_step": 949, "train_info/time_within_train_step": 32.679861068725586, "step": 949}
{"train_info/time_between_train_steps": 0.005407810211181641, "step": 949}
{"info/global_step": 950, "train_info/time_within_train_step": 32.64832067489624, "step": 950}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1733719185, "_runtime": 31691}, "step": 950}
{"logs": {"train/loss": 3.245, "train/learning_rate": 0.0001388888888888889, "train/epoch": 35.0, "_timestamp": 1733719185, "_runtime": 31691}, "step": 950}
{"train_info/time_between_train_steps": 0.012748241424560547, "step": 950}
{"info/global_step": 951, "train_info/time_within_train_step": 32.521620988845825, "step": 951}
{"train_info/time_between_train_steps": 0.005429267883300781, "step": 951}
{"info/global_step": 952, "train_info/time_within_train_step": 32.96587157249451, "step": 952}
{"train_info/time_between_train_steps": 0.010576725006103516, "step": 952}
{"info/global_step": 953, "train_info/time_within_train_step": 32.7435040473938, "step": 953}
{"train_info/time_between_train_steps": 0.005886077880859375, "step": 953}
{"info/global_step": 954, "train_info/time_within_train_step": 32.688068866729736, "step": 954}
{"train_info/time_between_train_steps": 0.00533604621887207, "step": 954}
{"info/global_step": 955, "train_info/time_within_train_step": 32.62245225906372, "step": 955}
{"train_info/time_between_train_steps": 0.005070686340332031, "step": 955}
{"info/global_step": 956, "train_info/time_within_train_step": 32.167235374450684, "step": 956}
{"train_info/time_between_train_steps": 0.010013103485107422, "step": 956}
{"info/global_step": 957, "train_info/time_within_train_step": 32.50064039230347, "step": 957}
{"train_info/time_between_train_steps": 0.007584810256958008, "step": 957}
{"info/global_step": 958, "train_info/time_within_train_step": 32.428173780441284, "step": 958}
{"train_info/time_between_train_steps": 0.004981279373168945, "step": 958}
{"info/global_step": 959, "train_info/time_within_train_step": 32.75093221664429, "step": 959}
{"train_info/time_between_train_steps": 0.010187864303588867, "step": 959}
{"info/global_step": 960, "train_info/time_within_train_step": 32.6838595867157, "step": 960}
{"train_info/time_between_train_steps": 0.00495457649230957, "step": 960}
{"info/global_step": 961, "train_info/time_within_train_step": 32.5560941696167, "step": 961}
{"train_info/time_between_train_steps": 0.0049784183502197266, "step": 961}
{"info/global_step": 962, "train_info/time_within_train_step": 32.3573739528656, "step": 962}
{"train_info/time_between_train_steps": 0.00519561767578125, "step": 962}
{"info/global_step": 963, "train_info/time_within_train_step": 32.56954526901245, "step": 963}
{"train_info/time_between_train_steps": 0.004982709884643555, "step": 963}
{"info/global_step": 964, "train_info/time_within_train_step": 32.39994525909424, "step": 964}
{"train_info/time_between_train_steps": 0.005228281021118164, "step": 964}
{"info/global_step": 965, "train_info/time_within_train_step": 32.117154598236084, "step": 965}
{"train_info/time_between_train_steps": 0.005118846893310547, "step": 965}
{"info/global_step": 966, "train_info/time_within_train_step": 32.47038197517395, "step": 966}
{"train_info/time_between_train_steps": 0.0052738189697265625, "step": 966}
{"info/global_step": 967, "train_info/time_within_train_step": 32.44448399543762, "step": 967}
{"train_info/time_between_train_steps": 0.005166292190551758, "step": 967}
{"info/global_step": 968, "train_info/time_within_train_step": 32.7465238571167, "step": 968}
{"train_info/time_between_train_steps": 0.009902477264404297, "step": 968}
{"info/global_step": 969, "train_info/time_within_train_step": 33.02273941040039, "step": 969}
{"train_info/time_between_train_steps": 0.010729551315307617, "step": 969}
{"info/global_step": 970, "train_info/time_within_train_step": 32.626816749572754, "step": 970}
{"train_info/time_between_train_steps": 0.01510310173034668, "step": 970}
{"info/global_step": 971, "train_info/time_within_train_step": 32.4799108505249, "step": 971}
{"train_info/time_between_train_steps": 0.0055637359619140625, "step": 971}
{"info/global_step": 972, "train_info/time_within_train_step": 32.292166233062744, "step": 972}
{"train_info/time_between_train_steps": 0.005741119384765625, "step": 972}
{"train_info/time_between_train_steps": 23.744669914245605, "step": 972}
{"info/global_step": 973, "train_info/time_within_train_step": 32.33320426940918, "step": 973}
{"train_info/time_between_train_steps": 0.005328655242919922, "step": 973}
{"info/global_step": 974, "train_info/time_within_train_step": 32.576268672943115, "step": 974}
{"train_info/time_between_train_steps": 0.005335807800292969, "step": 974}
{"info/global_step": 975, "train_info/time_within_train_step": 32.2947199344635, "step": 975}
{"train_info/time_between_train_steps": 0.005167245864868164, "step": 975}
{"info/global_step": 976, "train_info/time_within_train_step": 32.65237474441528, "step": 976}
{"train_info/time_between_train_steps": 0.005450010299682617, "step": 976}
{"info/global_step": 977, "train_info/time_within_train_step": 32.2985360622406, "step": 977}
{"train_info/time_between_train_steps": 0.0055921077728271484, "step": 977}
{"info/global_step": 978, "train_info/time_within_train_step": 32.80104637145996, "step": 978}
{"train_info/time_between_train_steps": 0.005442619323730469, "step": 978}
{"info/global_step": 979, "train_info/time_within_train_step": 32.68925189971924, "step": 979}
{"train_info/time_between_train_steps": 0.008138656616210938, "step": 979}
{"info/global_step": 980, "train_info/time_within_train_step": 32.7705442905426, "step": 980}
{"train_info/time_between_train_steps": 0.005639553070068359, "step": 980}
{"info/global_step": 981, "train_info/time_within_train_step": 32.05288791656494, "step": 981}
{"train_info/time_between_train_steps": 0.010034322738647461, "step": 981}
{"info/global_step": 982, "train_info/time_within_train_step": 32.38891410827637, "step": 982}
{"train_info/time_between_train_steps": 0.009917259216308594, "step": 982}
{"info/global_step": 983, "train_info/time_within_train_step": 32.570034980773926, "step": 983}
{"train_info/time_between_train_steps": 0.010020017623901367, "step": 983}
{"info/global_step": 984, "train_info/time_within_train_step": 32.429802894592285, "step": 984}
{"train_info/time_between_train_steps": 0.010024785995483398, "step": 984}
{"info/global_step": 985, "train_info/time_within_train_step": 32.462199211120605, "step": 985}
{"train_info/time_between_train_steps": 0.0051724910736083984, "step": 985}
{"info/global_step": 986, "train_info/time_within_train_step": 32.35028791427612, "step": 986}
{"train_info/time_between_train_steps": 0.010101318359375, "step": 986}
{"info/global_step": 987, "train_info/time_within_train_step": 32.78072237968445, "step": 987}
{"train_info/time_between_train_steps": 0.007750034332275391, "step": 987}
{"info/global_step": 988, "train_info/time_within_train_step": 32.449785470962524, "step": 988}
{"train_info/time_between_train_steps": 0.00509953498840332, "step": 988}
{"info/global_step": 989, "train_info/time_within_train_step": 32.77253437042236, "step": 989}
{"train_info/time_between_train_steps": 0.005228519439697266, "step": 989}
{"info/global_step": 990, "train_info/time_within_train_step": 32.245548486709595, "step": 990}
{"train_info/time_between_train_steps": 0.004982471466064453, "step": 990}
{"info/global_step": 991, "train_info/time_within_train_step": 32.46768021583557, "step": 991}
{"train_info/time_between_train_steps": 0.010026931762695312, "step": 991}
{"info/global_step": 992, "train_info/time_within_train_step": 32.32807230949402, "step": 992}
{"train_info/time_between_train_steps": 0.004979133605957031, "step": 992}
{"info/global_step": 993, "train_info/time_within_train_step": 32.493616819381714, "step": 993}
{"train_info/time_between_train_steps": 0.005112409591674805, "step": 993}
{"info/global_step": 994, "train_info/time_within_train_step": 32.809288024902344, "step": 994}
{"train_info/time_between_train_steps": 0.0052373409271240234, "step": 994}
{"info/global_step": 995, "train_info/time_within_train_step": 32.41560912132263, "step": 995}
{"train_info/time_between_train_steps": 0.004984378814697266, "step": 995}
{"info/global_step": 996, "train_info/time_within_train_step": 32.4956488609314, "step": 996}
{"train_info/time_between_train_steps": 0.005393266677856445, "step": 996}
{"info/global_step": 997, "train_info/time_within_train_step": 32.579811811447144, "step": 997}
{"train_info/time_between_train_steps": 0.005229949951171875, "step": 997}
{"info/global_step": 998, "train_info/time_within_train_step": 32.43506741523743, "step": 998}
{"train_info/time_between_train_steps": 0.011224508285522461, "step": 998}
{"info/global_step": 999, "train_info/time_within_train_step": 32.122989654541016, "step": 999}
{"train_info/time_between_train_steps": 0.005808591842651367, "step": 999}
{"train_info/time_between_train_steps": 23.155303716659546, "step": 999}
{"info/global_step": 1000, "train_info/time_within_train_step": 32.555524826049805, "step": 1000}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1733720858, "_runtime": 33364}, "step": 1000}
{"logs": {"train/loss": 3.1985, "train/learning_rate": 0.00011111111111111109, "train/epoch": 37.0, "_timestamp": 1733720858, "_runtime": 33364}, "step": 1000}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1733720860, "_runtime": 33366}, "step": 1000}
{"logs": {"eval/loss": 4.167860507965088, "eval/runtime": 2.3092, "eval/samples_per_second": 43.306, "eval/steps_per_second": 3.031, "train/epoch": 37.0, "_timestamp": 1733720860, "_runtime": 33366}, "step": 1000}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1733720860, "_runtime": 33366}, "step": 1000}
{"logs": {"eval//local/xiulyang/mission-impossible-language-models/training/babylm_dataset.py_loss": 4.167860507965088, "eval//local/xiulyang/mission-impossible-language-models/training/babylm_dataset.py_ppl": 64.57714192261159, "eval//local/xiulyang/mission-impossible-language-models/training/babylm_dataset.py_runtime": 2.3092, "eval//local/xiulyang/mission-impossible-language-models/training/babylm_dataset.py_samples_per_second": 43.306, "train/epoch": 37.0, "_timestamp": 1733720860, "_runtime": 33366}, "step": 1000}
{"train_info/time_between_train_steps": 4.53382420539856, "step": 1000}
{"info/global_step": 1001, "train_info/time_within_train_step": 32.574618101119995, "step": 1001}
{"train_info/time_between_train_steps": 0.005338430404663086, "step": 1001}
{"info/global_step": 1002, "train_info/time_within_train_step": 32.58015060424805, "step": 1002}
{"train_info/time_between_train_steps": 0.010655403137207031, "step": 1002}
{"info/global_step": 1003, "train_info/time_within_train_step": 32.782910108566284, "step": 1003}
{"train_info/time_between_train_steps": 0.005330801010131836, "step": 1003}
{"info/global_step": 1004, "train_info/time_within_train_step": 32.58205509185791, "step": 1004}
{"train_info/time_between_train_steps": 0.007493019104003906, "step": 1004}
{"info/global_step": 1005, "train_info/time_within_train_step": 32.79676914215088, "step": 1005}
{"train_info/time_between_train_steps": 0.0071752071380615234, "step": 1005}
{"info/global_step": 1006, "train_info/time_within_train_step": 32.923903465270996, "step": 1006}
{"train_info/time_between_train_steps": 0.005745887756347656, "step": 1006}
{"info/global_step": 1007, "train_info/time_within_train_step": 32.113731384277344, "step": 1007}
{"train_info/time_between_train_steps": 0.005490779876708984, "step": 1007}
{"info/global_step": 1008, "train_info/time_within_train_step": 32.34177327156067, "step": 1008}
{"train_info/time_between_train_steps": 0.005159616470336914, "step": 1008}
{"info/global_step": 1009, "train_info/time_within_train_step": 32.607072830200195, "step": 1009}
{"train_info/time_between_train_steps": 0.004910707473754883, "step": 1009}
{"info/global_step": 1010, "train_info/time_within_train_step": 32.605658769607544, "step": 1010}
{"train_info/time_between_train_steps": 0.005120038986206055, "step": 1010}
{"info/global_step": 1011, "train_info/time_within_train_step": 32.5114541053772, "step": 1011}
{"train_info/time_between_train_steps": 0.004988670349121094, "step": 1011}
{"info/global_step": 1012, "train_info/time_within_train_step": 32.450727701187134, "step": 1012}
{"train_info/time_between_train_steps": 0.005181074142456055, "step": 1012}
{"info/global_step": 1013, "train_info/time_within_train_step": 32.5710027217865, "step": 1013}
{"train_info/time_between_train_steps": 0.005324363708496094, "step": 1013}
{"info/global_step": 1014, "train_info/time_within_train_step": 32.45698142051697, "step": 1014}
{"train_info/time_between_train_steps": 0.005261421203613281, "step": 1014}
{"info/global_step": 1015, "train_info/time_within_train_step": 32.50758194923401, "step": 1015}
{"train_info/time_between_train_steps": 0.0050923824310302734, "step": 1015}
{"info/global_step": 1016, "train_info/time_within_train_step": 32.08777570724487, "step": 1016}
{"train_info/time_between_train_steps": 0.010040998458862305, "step": 1016}
{"info/global_step": 1017, "train_info/time_within_train_step": 32.54966735839844, "step": 1017}
{"train_info/time_between_train_steps": 0.005090951919555664, "step": 1017}
{"info/global_step": 1018, "train_info/time_within_train_step": 32.73867726325989, "step": 1018}
{"train_info/time_between_train_steps": 0.010189056396484375, "step": 1018}
{"info/global_step": 1019, "train_info/time_within_train_step": 32.49020576477051, "step": 1019}
{"train_info/time_between_train_steps": 0.006472110748291016, "step": 1019}
{"info/global_step": 1020, "train_info/time_within_train_step": 32.51219463348389, "step": 1020}
{"train_info/time_between_train_steps": 0.005258083343505859, "step": 1020}
{"info/global_step": 1021, "train_info/time_within_train_step": 32.45355582237244, "step": 1021}
{"train_info/time_between_train_steps": 0.005217790603637695, "step": 1021}
{"info/global_step": 1022, "train_info/time_within_train_step": 32.751415967941284, "step": 1022}
{"train_info/time_between_train_steps": 0.0052487850189208984, "step": 1022}
{"info/global_step": 1023, "train_info/time_within_train_step": 32.43075180053711, "step": 1023}
{"train_info/time_between_train_steps": 0.005524635314941406, "step": 1023}
{"info/global_step": 1024, "train_info/time_within_train_step": 32.39640736579895, "step": 1024}
{"train_info/time_between_train_steps": 0.0053157806396484375, "step": 1024}
{"info/global_step": 1025, "train_info/time_within_train_step": 32.41226053237915, "step": 1025}
{"train_info/time_between_train_steps": 0.011196613311767578, "step": 1025}
{"info/global_step": 1026, "train_info/time_within_train_step": 32.51373076438904, "step": 1026}
{"train_info/time_between_train_steps": 0.005780696868896484, "step": 1026}
{"train_info/time_between_train_steps": 23.393399000167847, "step": 1026}
{"info/global_step": 1027, "train_info/time_within_train_step": 32.63075065612793, "step": 1027}
{"train_info/time_between_train_steps": 0.011924982070922852, "step": 1027}
{"info/global_step": 1028, "train_info/time_within_train_step": 32.708616495132446, "step": 1028}
{"train_info/time_between_train_steps": 0.0052258968353271484, "step": 1028}
{"info/global_step": 1029, "train_info/time_within_train_step": 32.574843645095825, "step": 1029}
{"train_info/time_between_train_steps": 0.00525212287902832, "step": 1029}
{"info/global_step": 1030, "train_info/time_within_train_step": 32.676024198532104, "step": 1030}
{"train_info/time_between_train_steps": 0.005397319793701172, "step": 1030}
{"info/global_step": 1031, "train_info/time_within_train_step": 32.74742865562439, "step": 1031}
{"train_info/time_between_train_steps": 0.005492448806762695, "step": 1031}
{"info/global_step": 1032, "train_info/time_within_train_step": 32.70454931259155, "step": 1032}
{"train_info/time_between_train_steps": 0.005345582962036133, "step": 1032}
{"info/global_step": 1033, "train_info/time_within_train_step": 31.863099813461304, "step": 1033}
{"train_info/time_between_train_steps": 0.005846500396728516, "step": 1033}
{"info/global_step": 1034, "train_info/time_within_train_step": 32.47567558288574, "step": 1034}
{"train_info/time_between_train_steps": 0.0052225589752197266, "step": 1034}
{"info/global_step": 1035, "train_info/time_within_train_step": 32.06742215156555, "step": 1035}
{"train_info/time_between_train_steps": 0.0051593780517578125, "step": 1035}
{"info/global_step": 1036, "train_info/time_within_train_step": 32.58760714530945, "step": 1036}
{"train_info/time_between_train_steps": 0.0050506591796875, "step": 1036}
{"info/global_step": 1037, "train_info/time_within_train_step": 32.60006499290466, "step": 1037}
{"train_info/time_between_train_steps": 0.0051021575927734375, "step": 1037}
{"info/global_step": 1038, "train_info/time_within_train_step": 32.61557102203369, "step": 1038}
{"train_info/time_between_train_steps": 0.005109548568725586, "step": 1038}
{"info/global_step": 1039, "train_info/time_within_train_step": 32.566460609436035, "step": 1039}
{"train_info/time_between_train_steps": 0.00513148307800293, "step": 1039}
{"info/global_step": 1040, "train_info/time_within_train_step": 32.513394832611084, "step": 1040}
{"train_info/time_between_train_steps": 0.005140066146850586, "step": 1040}
{"info/global_step": 1041, "train_info/time_within_train_step": 32.53123426437378, "step": 1041}
{"train_info/time_between_train_steps": 0.005213022232055664, "step": 1041}
{"info/global_step": 1042, "train_info/time_within_train_step": 31.96523118019104, "step": 1042}
{"train_info/time_between_train_steps": 0.005113124847412109, "step": 1042}
{"info/global_step": 1043, "train_info/time_within_train_step": 32.62149500846863, "step": 1043}
{"train_info/time_between_train_steps": 0.005190134048461914, "step": 1043}
{"info/global_step": 1044, "train_info/time_within_train_step": 32.871599435806274, "step": 1044}
{"train_info/time_between_train_steps": 0.0051457881927490234, "step": 1044}
{"info/global_step": 1045, "train_info/time_within_train_step": 32.52317428588867, "step": 1045}
{"train_info/time_between_train_steps": 0.010268449783325195, "step": 1045}
{"info/global_step": 1046, "train_info/time_within_train_step": 32.620352029800415, "step": 1046}
{"train_info/time_between_train_steps": 0.00510859489440918, "step": 1046}
{"info/global_step": 1047, "train_info/time_within_train_step": 32.3938889503479, "step": 1047}
{"train_info/time_between_train_steps": 0.005436897277832031, "step": 1047}
{"info/global_step": 1048, "train_info/time_within_train_step": 32.643479347229004, "step": 1048}
{"train_info/time_between_train_steps": 0.010165214538574219, "step": 1048}
{"info/global_step": 1049, "train_info/time_within_train_step": 32.392234325408936, "step": 1049}
{"train_info/time_between_train_steps": 0.005549430847167969, "step": 1049}
{"info/global_step": 1050, "train_info/time_within_train_step": 32.524189710617065, "step": 1050}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1733722512, "_runtime": 35018}, "step": 1050}
{"logs": {"train/loss": 3.118, "train/learning_rate": 8.333333333333333e-05, "train/epoch": 38.02, "_timestamp": 1733722512, "_runtime": 35018}, "step": 1050}
{"train_info/time_between_train_steps": 0.008224248886108398, "step": 1050}
{"info/global_step": 1051, "train_info/time_within_train_step": 32.10860633850098, "step": 1051}
{"train_info/time_between_train_steps": 0.005293607711791992, "step": 1051}
{"info/global_step": 1052, "train_info/time_within_train_step": 32.405293703079224, "step": 1052}
{"train_info/time_between_train_steps": 0.005530118942260742, "step": 1052}
{"info/global_step": 1053, "train_info/time_within_train_step": 32.5845947265625, "step": 1053}
{"train_info/time_between_train_steps": 0.005614280700683594, "step": 1053}
{"train_info/time_between_train_steps": 23.711516857147217, "step": 1053}
{"info/global_step": 1054, "train_info/time_within_train_step": 32.48003077507019, "step": 1054}
{"train_info/time_between_train_steps": 0.005519866943359375, "step": 1054}
{"info/global_step": 1055, "train_info/time_within_train_step": 32.74250102043152, "step": 1055}
{"train_info/time_between_train_steps": 0.015485048294067383, "step": 1055}
{"info/global_step": 1056, "train_info/time_within_train_step": 32.67312431335449, "step": 1056}
{"train_info/time_between_train_steps": 0.0071353912353515625, "step": 1056}
{"info/global_step": 1057, "train_info/time_within_train_step": 32.60746145248413, "step": 1057}
{"train_info/time_between_train_steps": 0.005392313003540039, "step": 1057}
{"info/global_step": 1058, "train_info/time_within_train_step": 32.680795431137085, "step": 1058}
{"train_info/time_between_train_steps": 0.0055294036865234375, "step": 1058}
{"info/global_step": 1059, "train_info/time_within_train_step": 32.07318139076233, "step": 1059}
{"train_info/time_between_train_steps": 0.0052607059478759766, "step": 1059}
{"info/global_step": 1060, "train_info/time_within_train_step": 32.244483947753906, "step": 1060}
{"train_info/time_between_train_steps": 0.00820159912109375, "step": 1060}
{"info/global_step": 1061, "train_info/time_within_train_step": 32.388773679733276, "step": 1061}
{"train_info/time_between_train_steps": 0.010011434555053711, "step": 1061}
{"info/global_step": 1062, "train_info/time_within_train_step": 31.892520666122437, "step": 1062}
{"train_info/time_between_train_steps": 0.006925821304321289, "step": 1062}
{"info/global_step": 1063, "train_info/time_within_train_step": 32.54918122291565, "step": 1063}
{"train_info/time_between_train_steps": 0.004914283752441406, "step": 1063}
{"info/global_step": 1064, "train_info/time_within_train_step": 32.50872826576233, "step": 1064}
{"train_info/time_between_train_steps": 0.007711887359619141, "step": 1064}
{"info/global_step": 1065, "train_info/time_within_train_step": 32.53574228286743, "step": 1065}
{"train_info/time_between_train_steps": 0.005008697509765625, "step": 1065}
{"info/global_step": 1066, "train_info/time_within_train_step": 32.4428014755249, "step": 1066}
{"train_info/time_between_train_steps": 0.01017308235168457, "step": 1066}
{"info/global_step": 1067, "train_info/time_within_train_step": 32.64679026603699, "step": 1067}
{"train_info/time_between_train_steps": 0.005624532699584961, "step": 1067}
{"info/global_step": 1068, "train_info/time_within_train_step": 31.993634700775146, "step": 1068}
{"train_info/time_between_train_steps": 0.005148887634277344, "step": 1068}
{"info/global_step": 1069, "train_info/time_within_train_step": 32.310023069381714, "step": 1069}
{"train_info/time_between_train_steps": 0.005078315734863281, "step": 1069}
{"info/global_step": 1070, "train_info/time_within_train_step": 32.28473877906799, "step": 1070}
{"train_info/time_between_train_steps": 0.005300283432006836, "step": 1070}
{"info/global_step": 1071, "train_info/time_within_train_step": 32.329545736312866, "step": 1071}
{"train_info/time_between_train_steps": 0.010372161865234375, "step": 1071}
{"info/global_step": 1072, "train_info/time_within_train_step": 32.54192805290222, "step": 1072}
{"train_info/time_between_train_steps": 0.005093097686767578, "step": 1072}
{"info/global_step": 1073, "train_info/time_within_train_step": 32.3691463470459, "step": 1073}
{"train_info/time_between_train_steps": 0.0050203800201416016, "step": 1073}
{"info/global_step": 1074, "train_info/time_within_train_step": 32.5672709941864, "step": 1074}
{"train_info/time_between_train_steps": 0.008860588073730469, "step": 1074}
{"info/global_step": 1075, "train_info/time_within_train_step": 32.49737763404846, "step": 1075}
{"train_info/time_between_train_steps": 0.007875204086303711, "step": 1075}
{"info/global_step": 1076, "train_info/time_within_train_step": 32.31774973869324, "step": 1076}
{"train_info/time_between_train_steps": 0.006944417953491211, "step": 1076}
{"info/global_step": 1077, "train_info/time_within_train_step": 32.60784864425659, "step": 1077}
{"train_info/time_between_train_steps": 0.0053937435150146484, "step": 1077}
{"info/global_step": 1078, "train_info/time_within_train_step": 32.12519145011902, "step": 1078}
{"train_info/time_between_train_steps": 0.009908676147460938, "step": 1078}
{"info/global_step": 1079, "train_info/time_within_train_step": 32.25937581062317, "step": 1079}
{"train_info/time_between_train_steps": 0.005455732345581055, "step": 1079}
{"info/global_step": 1080, "train_info/time_within_train_step": 32.090073585510254, "step": 1080}
{"train_info/time_between_train_steps": 0.005741119384765625, "step": 1080}
{"train_info/time_between_train_steps": 23.396389961242676, "step": 1080}
{"info/global_step": 1081, "train_info/time_within_train_step": 32.35739827156067, "step": 1081}
{"train_info/time_between_train_steps": 0.005585670471191406, "step": 1081}
{"info/global_step": 1082, "train_info/time_within_train_step": 32.610599756240845, "step": 1082}
{"train_info/time_between_train_steps": 0.005466938018798828, "step": 1082}
{"info/global_step": 1083, "train_info/time_within_train_step": 32.43036603927612, "step": 1083}
{"train_info/time_between_train_steps": 0.005942583084106445, "step": 1083}
{"info/global_step": 1084, "train_info/time_within_train_step": 32.62315011024475, "step": 1084}
{"train_info/time_between_train_steps": 0.005502462387084961, "step": 1084}
{"info/global_step": 1085, "train_info/time_within_train_step": 32.51217699050903, "step": 1085}
{"train_info/time_between_train_steps": 0.005461931228637695, "step": 1085}
{"info/global_step": 1086, "train_info/time_within_train_step": 32.633044719696045, "step": 1086}
{"train_info/time_between_train_steps": 0.0064945220947265625, "step": 1086}
{"info/global_step": 1087, "train_info/time_within_train_step": 31.888500213623047, "step": 1087}
{"train_info/time_between_train_steps": 0.00514984130859375, "step": 1087}
{"info/global_step": 1088, "train_info/time_within_train_step": 32.37240695953369, "step": 1088}
{"train_info/time_between_train_steps": 0.00879526138305664, "step": 1088}
{"info/global_step": 1089, "train_info/time_within_train_step": 32.22355079650879, "step": 1089}
{"train_info/time_between_train_steps": 0.005172252655029297, "step": 1089}
{"info/global_step": 1090, "train_info/time_within_train_step": 32.304848432540894, "step": 1090}
{"train_info/time_between_train_steps": 0.0050048828125, "step": 1090}
{"info/global_step": 1091, "train_info/time_within_train_step": 32.38803291320801, "step": 1091}
{"train_info/time_between_train_steps": 0.007293224334716797, "step": 1091}
{"info/global_step": 1092, "train_info/time_within_train_step": 32.47734594345093, "step": 1092}
{"train_info/time_between_train_steps": 0.005506038665771484, "step": 1092}
{"info/global_step": 1093, "train_info/time_within_train_step": 32.30240988731384, "step": 1093}
{"train_info/time_between_train_steps": 0.005077362060546875, "step": 1093}
{"info/global_step": 1094, "train_info/time_within_train_step": 32.58521008491516, "step": 1094}
{"train_info/time_between_train_steps": 0.005856513977050781, "step": 1094}
{"info/global_step": 1095, "train_info/time_within_train_step": 32.37787914276123, "step": 1095}
{"train_info/time_between_train_steps": 0.00528407096862793, "step": 1095}
{"info/global_step": 1096, "train_info/time_within_train_step": 32.25933051109314, "step": 1096}
{"train_info/time_between_train_steps": 0.005078554153442383, "step": 1096}
{"info/global_step": 1097, "train_info/time_within_train_step": 32.18082523345947, "step": 1097}
{"train_info/time_between_train_steps": 0.00532984733581543, "step": 1097}
{"info/global_step": 1098, "train_info/time_within_train_step": 32.43955993652344, "step": 1098}
{"train_info/time_between_train_steps": 0.005186796188354492, "step": 1098}
{"info/global_step": 1099, "train_info/time_within_train_step": 32.36618781089783, "step": 1099}
{"train_info/time_between_train_steps": 0.00977945327758789, "step": 1099}
{"info/global_step": 1100, "train_info/time_within_train_step": 32.68421411514282, "step": 1100}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1733724180, "_runtime": 36686}, "step": 1100}
{"logs": {"train/loss": 3.1211, "train/learning_rate": 5.5555555555555545e-05, "train/epoch": 40.02, "_timestamp": 1733724180, "_runtime": 36686}, "step": 1100}
{"train_info/time_between_train_steps": 2.3389899730682373, "step": 1100}
{"info/global_step": 1101, "train_info/time_within_train_step": 32.4447820186615, "step": 1101}
{"train_info/time_between_train_steps": 0.008471012115478516, "step": 1101}
{"info/global_step": 1102, "train_info/time_within_train_step": 32.18058896064758, "step": 1102}
{"train_info/time_between_train_steps": 0.005427122116088867, "step": 1102}
{"info/global_step": 1103, "train_info/time_within_train_step": 32.38553166389465, "step": 1103}
{"train_info/time_between_train_steps": 0.005090236663818359, "step": 1103}
{"info/global_step": 1104, "train_info/time_within_train_step": 32.6368145942688, "step": 1104}
{"train_info/time_between_train_steps": 0.008000612258911133, "step": 1104}
{"info/global_step": 1105, "train_info/time_within_train_step": 32.47830677032471, "step": 1105}
{"train_info/time_between_train_steps": 0.005568504333496094, "step": 1105}
{"info/global_step": 1106, "train_info/time_within_train_step": 32.263845682144165, "step": 1106}
{"train_info/time_between_train_steps": 0.006072998046875, "step": 1106}
{"info/global_step": 1107, "train_info/time_within_train_step": 32.39831066131592, "step": 1107}
{"train_info/time_between_train_steps": 0.010680913925170898, "step": 1107}
{"train_info/time_between_train_steps": 23.257410287857056, "step": 1107}
{"info/global_step": 1108, "train_info/time_within_train_step": 32.34362816810608, "step": 1108}
{"train_info/time_between_train_steps": 0.009562969207763672, "step": 1108}
{"info/global_step": 1109, "train_info/time_within_train_step": 32.45009398460388, "step": 1109}
{"train_info/time_between_train_steps": 0.0055544376373291016, "step": 1109}
{"info/global_step": 1110, "train_info/time_within_train_step": 32.492231607437134, "step": 1110}
{"train_info/time_between_train_steps": 0.0053250789642333984, "step": 1110}
{"info/global_step": 1111, "train_info/time_within_train_step": 32.82653880119324, "step": 1111}
{"train_info/time_between_train_steps": 0.010478496551513672, "step": 1111}
{"info/global_step": 1112, "train_info/time_within_train_step": 32.60397219657898, "step": 1112}
{"train_info/time_between_train_steps": 0.01035451889038086, "step": 1112}
{"info/global_step": 1113, "train_info/time_within_train_step": 32.73411583900452, "step": 1113}
{"train_info/time_between_train_steps": 0.005232334136962891, "step": 1113}
{"info/global_step": 1114, "train_info/time_within_train_step": 32.31852078437805, "step": 1114}
{"train_info/time_between_train_steps": 0.005343198776245117, "step": 1114}
{"info/global_step": 1115, "train_info/time_within_train_step": 32.383352756500244, "step": 1115}
{"train_info/time_between_train_steps": 0.008354902267456055, "step": 1115}
{"info/global_step": 1116, "train_info/time_within_train_step": 32.486902713775635, "step": 1116}
{"train_info/time_between_train_steps": 0.007101297378540039, "step": 1116}
{"info/global_step": 1117, "train_info/time_within_train_step": 32.357048988342285, "step": 1117}
{"train_info/time_between_train_steps": 0.005105257034301758, "step": 1117}
{"info/global_step": 1118, "train_info/time_within_train_step": 32.684733629226685, "step": 1118}
{"train_info/time_between_train_steps": 0.0051958560943603516, "step": 1118}
{"info/global_step": 1119, "train_info/time_within_train_step": 32.60068225860596, "step": 1119}
{"train_info/time_between_train_steps": 0.005252361297607422, "step": 1119}
{"info/global_step": 1120, "train_info/time_within_train_step": 32.14653563499451, "step": 1120}
{"train_info/time_between_train_steps": 0.005214214324951172, "step": 1120}
{"info/global_step": 1121, "train_info/time_within_train_step": 32.43388867378235, "step": 1121}
{"train_info/time_between_train_steps": 0.005252838134765625, "step": 1121}
{"info/global_step": 1122, "train_info/time_within_train_step": 32.475727796554565, "step": 1122}
{"train_info/time_between_train_steps": 0.010080575942993164, "step": 1122}
{"info/global_step": 1123, "train_info/time_within_train_step": 32.68372297286987, "step": 1123}
{"train_info/time_between_train_steps": 0.0051195621490478516, "step": 1123}
{"info/global_step": 1124, "train_info/time_within_train_step": 32.41713762283325, "step": 1124}
{"train_info/time_between_train_steps": 0.00504612922668457, "step": 1124}
{"info/global_step": 1125, "train_info/time_within_train_step": 32.05005121231079, "step": 1125}
{"train_info/time_between_train_steps": 0.00787973403930664, "step": 1125}
{"info/global_step": 1126, "train_info/time_within_train_step": 32.088438272476196, "step": 1126}
{"train_info/time_between_train_steps": 0.004976987838745117, "step": 1126}
{"info/global_step": 1127, "train_info/time_within_train_step": 32.275930881500244, "step": 1127}
{"train_info/time_between_train_steps": 0.005199432373046875, "step": 1127}
{"info/global_step": 1128, "train_info/time_within_train_step": 32.154422998428345, "step": 1128}
{"train_info/time_between_train_steps": 0.010729789733886719, "step": 1128}
{"info/global_step": 1129, "train_info/time_within_train_step": 32.508535861968994, "step": 1129}
{"train_info/time_between_train_steps": 0.00503087043762207, "step": 1129}
{"info/global_step": 1130, "train_info/time_within_train_step": 32.52656149864197, "step": 1130}
{"train_info/time_between_train_steps": 0.007467985153198242, "step": 1130}
{"info/global_step": 1131, "train_info/time_within_train_step": 32.762134075164795, "step": 1131}
{"train_info/time_between_train_steps": 0.0054759979248046875, "step": 1131}
{"info/global_step": 1132, "train_info/time_within_train_step": 32.676987171173096, "step": 1132}
{"train_info/time_between_train_steps": 0.0053098201751708984, "step": 1132}
{"info/global_step": 1133, "train_info/time_within_train_step": 32.714192628860474, "step": 1133}
{"train_info/time_between_train_steps": 0.0054738521575927734, "step": 1133}
{"info/global_step": 1134, "train_info/time_within_train_step": 32.74700117111206, "step": 1134}
{"train_info/time_between_train_steps": 0.005693197250366211, "step": 1134}
{"train_info/time_between_train_steps": 23.424667358398438, "step": 1134}
{"info/global_step": 1135, "train_info/time_within_train_step": 32.28910732269287, "step": 1135}
{"train_info/time_between_train_steps": 0.005080699920654297, "step": 1135}
{"info/global_step": 1136, "train_info/time_within_train_step": 32.63151669502258, "step": 1136}
{"train_info/time_between_train_steps": 0.005404233932495117, "step": 1136}
{"info/global_step": 1137, "train_info/time_within_train_step": 32.3203911781311, "step": 1137}
{"train_info/time_between_train_steps": 0.0052225589752197266, "step": 1137}
{"info/global_step": 1138, "train_info/time_within_train_step": 32.55228853225708, "step": 1138}
{"train_info/time_between_train_steps": 0.005515336990356445, "step": 1138}
{"info/global_step": 1139, "train_info/time_within_train_step": 32.41717600822449, "step": 1139}
{"train_info/time_between_train_steps": 0.006043195724487305, "step": 1139}
{"info/global_step": 1140, "train_info/time_within_train_step": 32.358612298965454, "step": 1140}
{"train_info/time_between_train_steps": 0.0054187774658203125, "step": 1140}
{"info/global_step": 1141, "train_info/time_within_train_step": 32.350451946258545, "step": 1141}
{"train_info/time_between_train_steps": 0.010173320770263672, "step": 1141}
{"info/global_step": 1142, "train_info/time_within_train_step": 32.745444774627686, "step": 1142}
{"train_info/time_between_train_steps": 0.008051633834838867, "step": 1142}
{"info/global_step": 1143, "train_info/time_within_train_step": 32.38227701187134, "step": 1143}
{"train_info/time_between_train_steps": 0.007067441940307617, "step": 1143}
{"info/global_step": 1144, "train_info/time_within_train_step": 31.83616876602173, "step": 1144}
{"train_info/time_between_train_steps": 0.005030393600463867, "step": 1144}
{"info/global_step": 1145, "train_info/time_within_train_step": 32.31272029876709, "step": 1145}
{"train_info/time_between_train_steps": 0.004972934722900391, "step": 1145}
{"info/global_step": 1146, "train_info/time_within_train_step": 32.12177324295044, "step": 1146}
{"train_info/time_between_train_steps": 0.0052411556243896484, "step": 1146}
{"info/global_step": 1147, "train_info/time_within_train_step": 32.36172866821289, "step": 1147}
{"train_info/time_between_train_steps": 0.005044460296630859, "step": 1147}
{"info/global_step": 1148, "train_info/time_within_train_step": 32.40004825592041, "step": 1148}
{"train_info/time_between_train_steps": 0.0050716400146484375, "step": 1148}
{"info/global_step": 1149, "train_info/time_within_train_step": 32.33332562446594, "step": 1149}
{"train_info/time_between_train_steps": 0.005208730697631836, "step": 1149}
{"info/global_step": 1150, "train_info/time_within_train_step": 32.312798261642456, "step": 1150}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1733725851, "_runtime": 38357}, "step": 1150}
{"logs": {"train/loss": 3.0899, "train/learning_rate": 2.7777777777777772e-05, "train/epoch": 42.01, "_timestamp": 1733725851, "_runtime": 38357}, "step": 1150}
{"train_info/time_between_train_steps": 0.006968498229980469, "step": 1150}
{"info/global_step": 1151, "train_info/time_within_train_step": 32.523411989212036, "step": 1151}
{"train_info/time_between_train_steps": 0.010648012161254883, "step": 1151}
{"info/global_step": 1152, "train_info/time_within_train_step": 32.69681239128113, "step": 1152}
{"train_info/time_between_train_steps": 0.0050127506256103516, "step": 1152}
{"info/global_step": 1153, "train_info/time_within_train_step": 32.444236516952515, "step": 1153}
{"train_info/time_between_train_steps": 0.0072400569915771484, "step": 1153}
{"info/global_step": 1154, "train_info/time_within_train_step": 32.66499948501587, "step": 1154}
{"train_info/time_between_train_steps": 0.00500035285949707, "step": 1154}
{"info/global_step": 1155, "train_info/time_within_train_step": 31.835116624832153, "step": 1155}
{"train_info/time_between_train_steps": 0.005203723907470703, "step": 1155}
{"info/global_step": 1156, "train_info/time_within_train_step": 32.41193723678589, "step": 1156}
{"train_info/time_between_train_steps": 0.005199909210205078, "step": 1156}
{"info/global_step": 1157, "train_info/time_within_train_step": 32.211623191833496, "step": 1157}
{"train_info/time_between_train_steps": 0.005201101303100586, "step": 1157}
{"info/global_step": 1158, "train_info/time_within_train_step": 32.39504075050354, "step": 1158}
{"train_info/time_between_train_steps": 0.010124683380126953, "step": 1158}
{"info/global_step": 1159, "train_info/time_within_train_step": 32.50739789009094, "step": 1159}
{"train_info/time_between_train_steps": 0.007232666015625, "step": 1159}
{"info/global_step": 1160, "train_info/time_within_train_step": 32.49799084663391, "step": 1160}
{"train_info/time_between_train_steps": 0.0055310726165771484, "step": 1160}
{"info/global_step": 1161, "train_info/time_within_train_step": 32.69520926475525, "step": 1161}
{"train_info/time_between_train_steps": 0.009070873260498047, "step": 1161}
{"train_info/time_between_train_steps": 23.52774405479431, "step": 1161}
{"info/global_step": 1162, "train_info/time_within_train_step": 32.57188701629639, "step": 1162}
{"train_info/time_between_train_steps": 0.007739543914794922, "step": 1162}
{"info/global_step": 1163, "train_info/time_within_train_step": 32.76412606239319, "step": 1163}
{"train_info/time_between_train_steps": 0.004954099655151367, "step": 1163}
{"info/global_step": 1164, "train_info/time_within_train_step": 31.746580362319946, "step": 1164}
{"train_info/time_between_train_steps": 0.005589485168457031, "step": 1164}
{"info/global_step": 1165, "train_info/time_within_train_step": 32.61931324005127, "step": 1165}
{"train_info/time_between_train_steps": 0.005505084991455078, "step": 1165}
{"info/global_step": 1166, "train_info/time_within_train_step": 32.4040150642395, "step": 1166}
{"train_info/time_between_train_steps": 0.0056896209716796875, "step": 1166}
{"info/global_step": 1167, "train_info/time_within_train_step": 32.5894410610199, "step": 1167}
{"train_info/time_between_train_steps": 0.005385160446166992, "step": 1167}
{"info/global_step": 1168, "train_info/time_within_train_step": 32.64838123321533, "step": 1168}
{"train_info/time_between_train_steps": 0.005587577819824219, "step": 1168}
{"info/global_step": 1169, "train_info/time_within_train_step": 32.71733283996582, "step": 1169}
{"train_info/time_between_train_steps": 0.006257057189941406, "step": 1169}
{"info/global_step": 1170, "train_info/time_within_train_step": 32.66189908981323, "step": 1170}
{"train_info/time_between_train_steps": 0.010601997375488281, "step": 1170}
{"info/global_step": 1171, "train_info/time_within_train_step": 32.90180492401123, "step": 1171}
{"train_info/time_between_train_steps": 0.005133867263793945, "step": 1171}
{"info/global_step": 1172, "train_info/time_within_train_step": 32.569063901901245, "step": 1172}
{"train_info/time_between_train_steps": 0.00933074951171875, "step": 1172}
{"info/global_step": 1173, "train_info/time_within_train_step": 32.521910667419434, "step": 1173}
{"train_info/time_between_train_steps": 0.0050127506256103516, "step": 1173}
{"info/global_step": 1174, "train_info/time_within_train_step": 31.77979016304016, "step": 1174}
{"train_info/time_between_train_steps": 0.005103588104248047, "step": 1174}
{"info/global_step": 1175, "train_info/time_within_train_step": 32.46205401420593, "step": 1175}
{"train_info/time_between_train_steps": 0.010120391845703125, "step": 1175}
{"info/global_step": 1176, "train_info/time_within_train_step": 32.508074045181274, "step": 1176}
{"train_info/time_between_train_steps": 0.005440711975097656, "step": 1176}
{"info/global_step": 1177, "train_info/time_within_train_step": 32.632550954818726, "step": 1177}
{"train_info/time_between_train_steps": 0.00526881217956543, "step": 1177}
{"info/global_step": 1178, "train_info/time_within_train_step": 32.51667404174805, "step": 1178}
{"train_info/time_between_train_steps": 0.005349159240722656, "step": 1178}
{"info/global_step": 1179, "train_info/time_within_train_step": 32.642656087875366, "step": 1179}
{"train_info/time_between_train_steps": 0.005127429962158203, "step": 1179}
{"info/global_step": 1180, "train_info/time_within_train_step": 32.338791608810425, "step": 1180}
{"train_info/time_between_train_steps": 0.00519561767578125, "step": 1180}
{"info/global_step": 1181, "train_info/time_within_train_step": 32.58080768585205, "step": 1181}
{"train_info/time_between_train_steps": 0.005291938781738281, "step": 1181}
{"info/global_step": 1182, "train_info/time_within_train_step": 32.73372673988342, "step": 1182}
{"train_info/time_between_train_steps": 0.007031440734863281, "step": 1182}
{"info/global_step": 1183, "train_info/time_within_train_step": 32.66990041732788, "step": 1183}
{"train_info/time_between_train_steps": 0.010188579559326172, "step": 1183}
{"info/global_step": 1184, "train_info/time_within_train_step": 31.943094968795776, "step": 1184}
{"train_info/time_between_train_steps": 0.010227203369140625, "step": 1184}
{"info/global_step": 1185, "train_info/time_within_train_step": 32.63136625289917, "step": 1185}
{"train_info/time_between_train_steps": 0.010444879531860352, "step": 1185}
{"info/global_step": 1186, "train_info/time_within_train_step": 32.62476396560669, "step": 1186}
{"train_info/time_between_train_steps": 0.005576372146606445, "step": 1186}
{"info/global_step": 1187, "train_info/time_within_train_step": 32.350085973739624, "step": 1187}
{"train_info/time_between_train_steps": 0.005647182464599609, "step": 1187}
{"info/global_step": 1188, "train_info/time_within_train_step": 32.281291484832764, "step": 1188}
{"train_info/time_between_train_steps": 0.006712436676025391, "step": 1188}
{"train_info/time_between_train_steps": 23.640511512756348, "step": 1188}
{"info/global_step": 1189, "train_info/time_within_train_step": 32.634724140167236, "step": 1189}
{"train_info/time_between_train_steps": 0.004839181900024414, "step": 1189}
{"info/global_step": 1190, "train_info/time_within_train_step": 32.57356524467468, "step": 1190}
{"train_info/time_between_train_steps": 0.005076408386230469, "step": 1190}
{"info/global_step": 1191, "train_info/time_within_train_step": 32.70925188064575, "step": 1191}
{"train_info/time_between_train_steps": 0.007187366485595703, "step": 1191}
{"info/global_step": 1192, "train_info/time_within_train_step": 32.8284547328949, "step": 1192}
{"train_info/time_between_train_steps": 0.005383729934692383, "step": 1192}
{"info/global_step": 1193, "train_info/time_within_train_step": 32.145328521728516, "step": 1193}
{"train_info/time_between_train_steps": 0.005089521408081055, "step": 1193}
{"info/global_step": 1194, "train_info/time_within_train_step": 32.340402364730835, "step": 1194}
{"train_info/time_between_train_steps": 0.006170034408569336, "step": 1194}
{"info/global_step": 1195, "train_info/time_within_train_step": 32.54878807067871, "step": 1195}
{"train_info/time_between_train_steps": 0.0052683353424072266, "step": 1195}
{"info/global_step": 1196, "train_info/time_within_train_step": 32.607439279556274, "step": 1196}
{"train_info/time_between_train_steps": 0.005195140838623047, "step": 1196}
{"info/global_step": 1197, "train_info/time_within_train_step": 32.42896628379822, "step": 1197}
{"train_info/time_between_train_steps": 0.005165815353393555, "step": 1197}
{"info/global_step": 1198, "train_info/time_within_train_step": 32.45104646682739, "step": 1198}
{"train_info/time_between_train_steps": 0.005135059356689453, "step": 1198}
{"info/global_step": 1199, "train_info/time_within_train_step": 32.54623484611511, "step": 1199}
{"train_info/time_between_train_steps": 0.014158487319946289, "step": 1199}
{"info/global_step": 1200, "train_info/time_within_train_step": 32.49672484397888, "step": 1200}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1733727523, "_runtime": 40029}, "step": 1200}
{"logs": {"train/loss": 3.0661, "train/learning_rate": 0.0, "train/epoch": 44.01, "_timestamp": 1733727523, "_runtime": 40029}, "step": 1200}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1733727526, "_runtime": 40032}, "step": 1200}
{"logs": {"train/train_runtime": 40032.4352, "train/train_samples_per_second": 15.348, "train/train_steps_per_second": 0.03, "train/total_flos": 3.2843363254272e+17, "train/train_loss": 4.048229904174804, "train/epoch": 44.01, "_timestamp": 1733727526, "_runtime": 40032}, "step": 1200}
{"train_info": {"train_info/memory_allocated": 1922.4453125, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1733727529, "_runtime": 40035}, "step": 1200}
{"logs": {"eval/loss": 4.195606231689453, "eval/runtime": 2.3056, "eval/samples_per_second": 43.372, "eval/steps_per_second": 3.036, "train/epoch": 44.01, "_timestamp": 1733727529, "_runtime": 40035}, "step": 1200}
{"train_info": {"train_info/memory_allocated": 1922.4453125, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1733727529, "_runtime": 40035}, "step": 1200}
{"logs": {"eval//local/xiulyang/mission-impossible-language-models/training/babylm_dataset.py_loss": 4.195606231689453, "eval//local/xiulyang/mission-impossible-language-models/training/babylm_dataset.py_ppl": 66.39396950761237, "eval//local/xiulyang/mission-impossible-language-models/training/babylm_dataset.py_runtime": 2.3056, "eval//local/xiulyang/mission-impossible-language-models/training/babylm_dataset.py_samples_per_second": 43.372, "train/epoch": 44.01, "_timestamp": 1733727529, "_runtime": 40035}, "step": 1200}