FR-GPT2small / metrics.json
xiulinyang's picture
Adding model checkpoints and config files
d42d53d
{"num_parameters": 124439808, "trainable_parameters": 124439808, "step": 0}
{"train_info/time_between_train_steps": 3.297989845275879, "step": 0}
{"info/global_step": 1, "train_info/time_within_train_step": 34.628830432891846, "step": 1}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 19761.71484375, "train_info/memory_reserved": 22624.0, "train_info/memory_max_reserved": 22624.0, "_timestamp": 1734103269, "_runtime": 43}, "step": 1}
{"logs": {"train/loss": 10.9692, "train/learning_rate": 4.9999999999999996e-06, "train/epoch": 0.0, "_timestamp": 1734103269, "_runtime": 43}, "step": 1}
{"train_info/time_between_train_steps": 0.008312463760375977, "step": 1}
{"info/global_step": 2, "train_info/time_within_train_step": 34.20987153053284, "step": 2}
{"train_info/time_between_train_steps": 0.0075757503509521484, "step": 2}
{"info/global_step": 3, "train_info/time_within_train_step": 34.07279324531555, "step": 3}
{"train_info/time_between_train_steps": 0.006949663162231445, "step": 3}
{"info/global_step": 4, "train_info/time_within_train_step": 34.223024129867554, "step": 4}
{"train_info/time_between_train_steps": 0.006000995635986328, "step": 4}
{"info/global_step": 5, "train_info/time_within_train_step": 34.07366490364075, "step": 5}
{"train_info/time_between_train_steps": 0.006024360656738281, "step": 5}
{"info/global_step": 6, "train_info/time_within_train_step": 34.114654779434204, "step": 6}
{"train_info/time_between_train_steps": 0.012681961059570312, "step": 6}
{"info/global_step": 7, "train_info/time_within_train_step": 34.1095507144928, "step": 7}
{"train_info/time_between_train_steps": 0.006123065948486328, "step": 7}
{"info/global_step": 8, "train_info/time_within_train_step": 34.12714505195618, "step": 8}
{"train_info/time_between_train_steps": 0.005871295928955078, "step": 8}
{"info/global_step": 9, "train_info/time_within_train_step": 34.07063412666321, "step": 9}
{"train_info/time_between_train_steps": 0.006299257278442383, "step": 9}
{"info/global_step": 10, "train_info/time_within_train_step": 34.39842510223389, "step": 10}
{"train_info/time_between_train_steps": 0.00597691535949707, "step": 10}
{"info/global_step": 11, "train_info/time_within_train_step": 34.02418041229248, "step": 11}
{"train_info/time_between_train_steps": 0.006429433822631836, "step": 11}
{"info/global_step": 12, "train_info/time_within_train_step": 34.26666712760925, "step": 12}
{"train_info/time_between_train_steps": 0.011114120483398438, "step": 12}
{"info/global_step": 13, "train_info/time_within_train_step": 34.1406683921814, "step": 13}
{"train_info/time_between_train_steps": 0.0064275264739990234, "step": 13}
{"info/global_step": 14, "train_info/time_within_train_step": 34.172898292541504, "step": 14}
{"train_info/time_between_train_steps": 0.006298542022705078, "step": 14}
{"info/global_step": 15, "train_info/time_within_train_step": 34.01993227005005, "step": 15}
{"train_info/time_between_train_steps": 0.006302356719970703, "step": 15}
{"info/global_step": 16, "train_info/time_within_train_step": 34.414761543273926, "step": 16}
{"train_info/time_between_train_steps": 0.006123542785644531, "step": 16}
{"info/global_step": 17, "train_info/time_within_train_step": 34.2340669631958, "step": 17}
{"train_info/time_between_train_steps": 0.005972385406494141, "step": 17}
{"info/global_step": 18, "train_info/time_within_train_step": 34.16475486755371, "step": 18}
{"train_info/time_between_train_steps": 0.006621599197387695, "step": 18}
{"info/global_step": 19, "train_info/time_within_train_step": 33.976221323013306, "step": 19}
{"train_info/time_between_train_steps": 0.005835771560668945, "step": 19}
{"info/global_step": 20, "train_info/time_within_train_step": 34.17757749557495, "step": 20}
{"train_info/time_between_train_steps": 0.010526657104492188, "step": 20}
{"info/global_step": 21, "train_info/time_within_train_step": 33.93839931488037, "step": 21}
{"train_info/time_between_train_steps": 0.005980014801025391, "step": 21}
{"info/global_step": 22, "train_info/time_within_train_step": 34.1718430519104, "step": 22}
{"train_info/time_between_train_steps": 0.005974292755126953, "step": 22}
{"info/global_step": 23, "train_info/time_within_train_step": 33.997549295425415, "step": 23}
{"train_info/time_between_train_steps": 0.010979652404785156, "step": 23}
{"info/global_step": 24, "train_info/time_within_train_step": 34.03124403953552, "step": 24}
{"train_info/time_between_train_steps": 0.00600743293762207, "step": 24}
{"info/global_step": 25, "train_info/time_within_train_step": 34.142186403274536, "step": 25}
{"train_info/time_between_train_steps": 0.009710073471069336, "step": 25}
{"info/global_step": 26, "train_info/time_within_train_step": 34.08016800880432, "step": 26}
{"train_info/time_between_train_steps": 0.005670309066772461, "step": 26}
{"info/global_step": 27, "train_info/time_within_train_step": 33.939308643341064, "step": 27}
{"train_info/time_between_train_steps": 0.005646228790283203, "step": 27}
{"info/global_step": 28, "train_info/time_within_train_step": 33.94676351547241, "step": 28}
{"train_info/time_between_train_steps": 0.006059408187866211, "step": 28}
{"info/global_step": 29, "train_info/time_within_train_step": 34.02413630485535, "step": 29}
{"train_info/time_between_train_steps": 0.005883216857910156, "step": 29}
{"info/global_step": 30, "train_info/time_within_train_step": 33.999385833740234, "step": 30}
{"train_info/time_between_train_steps": 0.0059549808502197266, "step": 30}
{"info/global_step": 31, "train_info/time_within_train_step": 34.009385108947754, "step": 31}
{"train_info/time_between_train_steps": 0.010637521743774414, "step": 31}
{"info/global_step": 32, "train_info/time_within_train_step": 34.40701985359192, "step": 32}
{"train_info/time_between_train_steps": 0.005700111389160156, "step": 32}
{"info/global_step": 33, "train_info/time_within_train_step": 34.181543588638306, "step": 33}
{"train_info/time_between_train_steps": 0.011119365692138672, "step": 33}
{"info/global_step": 34, "train_info/time_within_train_step": 33.952494859695435, "step": 34}
{"train_info/time_between_train_steps": 0.010421514511108398, "step": 34}
{"info/global_step": 35, "train_info/time_within_train_step": 34.04700326919556, "step": 35}
{"train_info/time_between_train_steps": 0.006119251251220703, "step": 35}
{"info/global_step": 36, "train_info/time_within_train_step": 34.03579568862915, "step": 36}
{"train_info/time_between_train_steps": 0.011108875274658203, "step": 36}
{"info/global_step": 37, "train_info/time_within_train_step": 34.049686908721924, "step": 37}
{"train_info/time_between_train_steps": 0.006178379058837891, "step": 37}
{"info/global_step": 38, "train_info/time_within_train_step": 34.00304341316223, "step": 38}
{"train_info/time_between_train_steps": 0.006015777587890625, "step": 38}
{"info/global_step": 39, "train_info/time_within_train_step": 34.04485607147217, "step": 39}
{"train_info/time_between_train_steps": 0.005945920944213867, "step": 39}
{"info/global_step": 40, "train_info/time_within_train_step": 34.15958333015442, "step": 40}
{"train_info/time_between_train_steps": 0.011073827743530273, "step": 40}
{"info/global_step": 41, "train_info/time_within_train_step": 33.988128900527954, "step": 41}
{"train_info/time_between_train_steps": 0.011303424835205078, "step": 41}
{"info/global_step": 42, "train_info/time_within_train_step": 34.016297817230225, "step": 42}
{"train_info/time_between_train_steps": 0.006157636642456055, "step": 42}
{"info/global_step": 43, "train_info/time_within_train_step": 33.98608660697937, "step": 43}
{"train_info/time_between_train_steps": 0.007946491241455078, "step": 43}
{"train_info/time_between_train_steps": 26.678837776184082, "step": 43}
{"info/global_step": 44, "train_info/time_within_train_step": 34.128310680389404, "step": 44}
{"train_info/time_between_train_steps": 0.006017446517944336, "step": 44}
{"info/global_step": 45, "train_info/time_within_train_step": 34.37034797668457, "step": 45}
{"train_info/time_between_train_steps": 0.01040029525756836, "step": 45}
{"info/global_step": 46, "train_info/time_within_train_step": 34.09983205795288, "step": 46}
{"train_info/time_between_train_steps": 0.01437234878540039, "step": 46}
{"info/global_step": 47, "train_info/time_within_train_step": 34.491761684417725, "step": 47}
{"train_info/time_between_train_steps": 0.011160135269165039, "step": 47}
{"info/global_step": 48, "train_info/time_within_train_step": 34.01581621170044, "step": 48}
{"train_info/time_between_train_steps": 0.006865978240966797, "step": 48}
{"info/global_step": 49, "train_info/time_within_train_step": 34.19405794143677, "step": 49}
{"train_info/time_between_train_steps": 0.011288166046142578, "step": 49}
{"info/global_step": 50, "train_info/time_within_train_step": 34.03675723075867, "step": 50}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1734104967, "_runtime": 1741}, "step": 50}
{"logs": {"train/loss": 8.063, "train/learning_rate": 0.00025, "train/epoch": 1.01, "_timestamp": 1734104967, "_runtime": 1741}, "step": 50}
{"train_info/time_between_train_steps": 0.014880657196044922, "step": 50}
{"info/global_step": 51, "train_info/time_within_train_step": 34.43704843521118, "step": 51}
{"train_info/time_between_train_steps": 0.00587010383605957, "step": 51}
{"info/global_step": 52, "train_info/time_within_train_step": 34.032713413238525, "step": 52}
{"train_info/time_between_train_steps": 0.011790037155151367, "step": 52}
{"info/global_step": 53, "train_info/time_within_train_step": 34.2328565120697, "step": 53}
{"train_info/time_between_train_steps": 0.010440587997436523, "step": 53}
{"info/global_step": 54, "train_info/time_within_train_step": 34.06965780258179, "step": 54}
{"train_info/time_between_train_steps": 0.006509065628051758, "step": 54}
{"info/global_step": 55, "train_info/time_within_train_step": 34.133347511291504, "step": 55}
{"train_info/time_between_train_steps": 0.00635218620300293, "step": 55}
{"info/global_step": 56, "train_info/time_within_train_step": 34.003483057022095, "step": 56}
{"train_info/time_between_train_steps": 0.00652003288269043, "step": 56}
{"info/global_step": 57, "train_info/time_within_train_step": 34.10663342475891, "step": 57}
{"train_info/time_between_train_steps": 0.0066013336181640625, "step": 57}
{"info/global_step": 58, "train_info/time_within_train_step": 33.97434401512146, "step": 58}
{"train_info/time_between_train_steps": 0.006099700927734375, "step": 58}
{"info/global_step": 59, "train_info/time_within_train_step": 34.132346630096436, "step": 59}
{"train_info/time_between_train_steps": 0.0062830448150634766, "step": 59}
{"info/global_step": 60, "train_info/time_within_train_step": 34.05021405220032, "step": 60}
{"train_info/time_between_train_steps": 0.0060956478118896484, "step": 60}
{"info/global_step": 61, "train_info/time_within_train_step": 34.207785844802856, "step": 61}
{"train_info/time_between_train_steps": 0.006537199020385742, "step": 61}
{"info/global_step": 62, "train_info/time_within_train_step": 34.39036726951599, "step": 62}
{"train_info/time_between_train_steps": 0.013213396072387695, "step": 62}
{"info/global_step": 63, "train_info/time_within_train_step": 34.25332689285278, "step": 63}
{"train_info/time_between_train_steps": 0.006379842758178711, "step": 63}
{"info/global_step": 64, "train_info/time_within_train_step": 34.114147901535034, "step": 64}
{"train_info/time_between_train_steps": 0.00608515739440918, "step": 64}
{"info/global_step": 65, "train_info/time_within_train_step": 34.33029770851135, "step": 65}
{"train_info/time_between_train_steps": 0.005980014801025391, "step": 65}
{"info/global_step": 66, "train_info/time_within_train_step": 33.982744455337524, "step": 66}
{"train_info/time_between_train_steps": 0.00606846809387207, "step": 66}
{"info/global_step": 67, "train_info/time_within_train_step": 34.10791325569153, "step": 67}
{"train_info/time_between_train_steps": 0.00613856315612793, "step": 67}
{"info/global_step": 68, "train_info/time_within_train_step": 33.97837734222412, "step": 68}
{"train_info/time_between_train_steps": 0.00578761100769043, "step": 68}
{"info/global_step": 69, "train_info/time_within_train_step": 33.97697401046753, "step": 69}
{"train_info/time_between_train_steps": 0.005650997161865234, "step": 69}
{"info/global_step": 70, "train_info/time_within_train_step": 33.97154927253723, "step": 70}
{"train_info/time_between_train_steps": 0.005816459655761719, "step": 70}
{"info/global_step": 71, "train_info/time_within_train_step": 34.099146127700806, "step": 71}
{"train_info/time_between_train_steps": 0.005956411361694336, "step": 71}
{"info/global_step": 72, "train_info/time_within_train_step": 33.95953607559204, "step": 72}
{"train_info/time_between_train_steps": 0.010850906372070312, "step": 72}
{"info/global_step": 73, "train_info/time_within_train_step": 34.101675510406494, "step": 73}
{"train_info/time_between_train_steps": 0.005932331085205078, "step": 73}
{"info/global_step": 74, "train_info/time_within_train_step": 34.169727087020874, "step": 74}
{"train_info/time_between_train_steps": 0.011009693145751953, "step": 74}
{"info/global_step": 75, "train_info/time_within_train_step": 34.070053577423096, "step": 75}
{"train_info/time_between_train_steps": 0.005931377410888672, "step": 75}
{"info/global_step": 76, "train_info/time_within_train_step": 33.96268939971924, "step": 76}
{"train_info/time_between_train_steps": 0.006032705307006836, "step": 76}
{"info/global_step": 77, "train_info/time_within_train_step": 34.21854853630066, "step": 77}
{"train_info/time_between_train_steps": 0.010517120361328125, "step": 77}
{"info/global_step": 78, "train_info/time_within_train_step": 34.253164768218994, "step": 78}
{"train_info/time_between_train_steps": 0.0058934688568115234, "step": 78}
{"info/global_step": 79, "train_info/time_within_train_step": 34.027881383895874, "step": 79}
{"train_info/time_between_train_steps": 0.006011486053466797, "step": 79}
{"info/global_step": 80, "train_info/time_within_train_step": 34.01552104949951, "step": 80}
{"train_info/time_between_train_steps": 0.006032466888427734, "step": 80}
{"info/global_step": 81, "train_info/time_within_train_step": 33.99306583404541, "step": 81}
{"train_info/time_between_train_steps": 0.00598907470703125, "step": 81}
{"info/global_step": 82, "train_info/time_within_train_step": 34.00684595108032, "step": 82}
{"train_info/time_between_train_steps": 0.00599217414855957, "step": 82}
{"info/global_step": 83, "train_info/time_within_train_step": 34.07675099372864, "step": 83}
{"train_info/time_between_train_steps": 0.006205081939697266, "step": 83}
{"info/global_step": 84, "train_info/time_within_train_step": 34.066481590270996, "step": 84}
{"train_info/time_between_train_steps": 0.006195783615112305, "step": 84}
{"info/global_step": 85, "train_info/time_within_train_step": 34.09758710861206, "step": 85}
{"train_info/time_between_train_steps": 0.0059778690338134766, "step": 85}
{"info/global_step": 86, "train_info/time_within_train_step": 34.10645079612732, "step": 86}
{"train_info/time_between_train_steps": 0.007472515106201172, "step": 86}
{"train_info/time_between_train_steps": 26.998816967010498, "step": 86}
{"info/global_step": 87, "train_info/time_within_train_step": 33.93523025512695, "step": 87}
{"train_info/time_between_train_steps": 0.005706787109375, "step": 87}
{"info/global_step": 88, "train_info/time_within_train_step": 34.233001470565796, "step": 88}
{"train_info/time_between_train_steps": 0.0057337284088134766, "step": 88}
{"info/global_step": 89, "train_info/time_within_train_step": 34.1071720123291, "step": 89}
{"train_info/time_between_train_steps": 0.010866403579711914, "step": 89}
{"info/global_step": 90, "train_info/time_within_train_step": 34.33950901031494, "step": 90}
{"train_info/time_between_train_steps": 0.005949735641479492, "step": 90}
{"info/global_step": 91, "train_info/time_within_train_step": 34.2009482383728, "step": 91}
{"train_info/time_between_train_steps": 0.006268501281738281, "step": 91}
{"info/global_step": 92, "train_info/time_within_train_step": 34.352221727371216, "step": 92}
{"train_info/time_between_train_steps": 0.006669044494628906, "step": 92}
{"info/global_step": 93, "train_info/time_within_train_step": 34.43699598312378, "step": 93}
{"train_info/time_between_train_steps": 0.009888410568237305, "step": 93}
{"info/global_step": 94, "train_info/time_within_train_step": 34.40203595161438, "step": 94}
{"train_info/time_between_train_steps": 0.006142616271972656, "step": 94}
{"info/global_step": 95, "train_info/time_within_train_step": 34.151134967803955, "step": 95}
{"train_info/time_between_train_steps": 0.008754253387451172, "step": 95}
{"info/global_step": 96, "train_info/time_within_train_step": 34.227824211120605, "step": 96}
{"train_info/time_between_train_steps": 0.006209373474121094, "step": 96}
{"info/global_step": 97, "train_info/time_within_train_step": 34.00497817993164, "step": 97}
{"train_info/time_between_train_steps": 0.006583213806152344, "step": 97}
{"info/global_step": 98, "train_info/time_within_train_step": 34.27884817123413, "step": 98}
{"train_info/time_between_train_steps": 0.006081104278564453, "step": 98}
{"info/global_step": 99, "train_info/time_within_train_step": 34.09269046783447, "step": 99}
{"train_info/time_between_train_steps": 0.006224632263183594, "step": 99}
{"info/global_step": 100, "train_info/time_within_train_step": 34.216843366622925, "step": 100}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1734106702, "_runtime": 3476}, "step": 100}
{"logs": {"train/loss": 4.9432, "train/learning_rate": 0.0005, "train/epoch": 2.01, "_timestamp": 1734106702, "_runtime": 3476}, "step": 100}
{"train_info/time_between_train_steps": 2.4277727603912354, "step": 100}
{"info/global_step": 101, "train_info/time_within_train_step": 34.14482498168945, "step": 101}
{"train_info/time_between_train_steps": 0.013328075408935547, "step": 101}
{"info/global_step": 102, "train_info/time_within_train_step": 34.31666684150696, "step": 102}
{"train_info/time_between_train_steps": 0.006052732467651367, "step": 102}
{"info/global_step": 103, "train_info/time_within_train_step": 34.184476375579834, "step": 103}
{"train_info/time_between_train_steps": 0.010954856872558594, "step": 103}
{"info/global_step": 104, "train_info/time_within_train_step": 34.327900409698486, "step": 104}
{"train_info/time_between_train_steps": 0.012780189514160156, "step": 104}
{"info/global_step": 105, "train_info/time_within_train_step": 34.038135290145874, "step": 105}
{"train_info/time_between_train_steps": 0.006447315216064453, "step": 105}
{"info/global_step": 106, "train_info/time_within_train_step": 34.237308502197266, "step": 106}
{"train_info/time_between_train_steps": 0.0064694881439208984, "step": 106}
{"info/global_step": 107, "train_info/time_within_train_step": 34.31100654602051, "step": 107}
{"train_info/time_between_train_steps": 0.0062541961669921875, "step": 107}
{"info/global_step": 108, "train_info/time_within_train_step": 34.44370985031128, "step": 108}
{"train_info/time_between_train_steps": 0.00604701042175293, "step": 108}
{"info/global_step": 109, "train_info/time_within_train_step": 33.98950481414795, "step": 109}
{"train_info/time_between_train_steps": 0.00627446174621582, "step": 109}
{"info/global_step": 110, "train_info/time_within_train_step": 34.10311770439148, "step": 110}
{"train_info/time_between_train_steps": 0.00597381591796875, "step": 110}
{"info/global_step": 111, "train_info/time_within_train_step": 33.95146894454956, "step": 111}
{"train_info/time_between_train_steps": 0.005796194076538086, "step": 111}
{"info/global_step": 112, "train_info/time_within_train_step": 33.91622042655945, "step": 112}
{"train_info/time_between_train_steps": 0.005632638931274414, "step": 112}
{"info/global_step": 113, "train_info/time_within_train_step": 34.06853890419006, "step": 113}
{"train_info/time_between_train_steps": 0.0058591365814208984, "step": 113}
{"info/global_step": 114, "train_info/time_within_train_step": 33.98193693161011, "step": 114}
{"train_info/time_between_train_steps": 0.005868434906005859, "step": 114}
{"info/global_step": 115, "train_info/time_within_train_step": 34.10750484466553, "step": 115}
{"train_info/time_between_train_steps": 0.010039329528808594, "step": 115}
{"info/global_step": 116, "train_info/time_within_train_step": 34.06043314933777, "step": 116}
{"train_info/time_between_train_steps": 0.011075496673583984, "step": 116}
{"info/global_step": 117, "train_info/time_within_train_step": 34.109694719314575, "step": 117}
{"train_info/time_between_train_steps": 0.006011486053466797, "step": 117}
{"info/global_step": 118, "train_info/time_within_train_step": 34.06697702407837, "step": 118}
{"train_info/time_between_train_steps": 0.005789279937744141, "step": 118}
{"info/global_step": 119, "train_info/time_within_train_step": 33.992974519729614, "step": 119}
{"train_info/time_between_train_steps": 0.005853414535522461, "step": 119}
{"info/global_step": 120, "train_info/time_within_train_step": 34.085267782211304, "step": 120}
{"train_info/time_between_train_steps": 0.009496450424194336, "step": 120}
{"info/global_step": 121, "train_info/time_within_train_step": 33.973928928375244, "step": 121}
{"train_info/time_between_train_steps": 0.006155967712402344, "step": 121}
{"info/global_step": 122, "train_info/time_within_train_step": 33.9691858291626, "step": 122}
{"train_info/time_between_train_steps": 0.006226062774658203, "step": 122}
{"info/global_step": 123, "train_info/time_within_train_step": 34.13701319694519, "step": 123}
{"train_info/time_between_train_steps": 0.010181427001953125, "step": 123}
{"info/global_step": 124, "train_info/time_within_train_step": 34.30875301361084, "step": 124}
{"train_info/time_between_train_steps": 0.00594329833984375, "step": 124}
{"info/global_step": 125, "train_info/time_within_train_step": 34.03130793571472, "step": 125}
{"train_info/time_between_train_steps": 0.005944490432739258, "step": 125}
{"info/global_step": 126, "train_info/time_within_train_step": 34.26348567008972, "step": 126}
{"train_info/time_between_train_steps": 0.010583639144897461, "step": 126}
{"info/global_step": 127, "train_info/time_within_train_step": 34.12160801887512, "step": 127}
{"train_info/time_between_train_steps": 0.011493921279907227, "step": 127}
{"info/global_step": 128, "train_info/time_within_train_step": 34.2010383605957, "step": 128}
{"train_info/time_between_train_steps": 0.007249116897583008, "step": 128}
{"info/global_step": 129, "train_info/time_within_train_step": 34.083139419555664, "step": 129}
{"train_info/time_between_train_steps": 0.0077838897705078125, "step": 129}
{"train_info/time_between_train_steps": 26.455042839050293, "step": 129}
{"info/global_step": 130, "train_info/time_within_train_step": 34.138805627822876, "step": 130}
{"train_info/time_between_train_steps": 0.010879039764404297, "step": 130}
{"info/global_step": 131, "train_info/time_within_train_step": 34.18527150154114, "step": 131}
{"train_info/time_between_train_steps": 0.006087541580200195, "step": 131}
{"info/global_step": 132, "train_info/time_within_train_step": 34.03929829597473, "step": 132}
{"train_info/time_between_train_steps": 0.0063190460205078125, "step": 132}
{"info/global_step": 133, "train_info/time_within_train_step": 34.40725636482239, "step": 133}
{"train_info/time_between_train_steps": 0.011921405792236328, "step": 133}
{"info/global_step": 134, "train_info/time_within_train_step": 34.173869609832764, "step": 134}
{"train_info/time_between_train_steps": 0.00628209114074707, "step": 134}
{"info/global_step": 135, "train_info/time_within_train_step": 34.23080563545227, "step": 135}
{"train_info/time_between_train_steps": 0.011024236679077148, "step": 135}
{"info/global_step": 136, "train_info/time_within_train_step": 34.04381513595581, "step": 136}
{"train_info/time_between_train_steps": 0.006269693374633789, "step": 136}
{"info/global_step": 137, "train_info/time_within_train_step": 34.20708179473877, "step": 137}
{"train_info/time_between_train_steps": 0.01582479476928711, "step": 137}
{"info/global_step": 138, "train_info/time_within_train_step": 34.1086540222168, "step": 138}
{"train_info/time_between_train_steps": 0.010560989379882812, "step": 138}
{"info/global_step": 139, "train_info/time_within_train_step": 34.41243553161621, "step": 139}
{"train_info/time_between_train_steps": 0.0060520172119140625, "step": 139}
{"info/global_step": 140, "train_info/time_within_train_step": 33.96278691291809, "step": 140}
{"train_info/time_between_train_steps": 0.006061553955078125, "step": 140}
{"info/global_step": 141, "train_info/time_within_train_step": 34.25464177131653, "step": 141}
{"train_info/time_between_train_steps": 0.0072023868560791016, "step": 141}
{"info/global_step": 142, "train_info/time_within_train_step": 33.954254388809204, "step": 142}
{"train_info/time_between_train_steps": 0.006177663803100586, "step": 142}
{"info/global_step": 143, "train_info/time_within_train_step": 34.184962034225464, "step": 143}
{"train_info/time_between_train_steps": 0.005902767181396484, "step": 143}
{"info/global_step": 144, "train_info/time_within_train_step": 33.9515814781189, "step": 144}
{"train_info/time_between_train_steps": 0.0062716007232666016, "step": 144}
{"info/global_step": 145, "train_info/time_within_train_step": 34.09170413017273, "step": 145}
{"train_info/time_between_train_steps": 0.0058040618896484375, "step": 145}
{"info/global_step": 146, "train_info/time_within_train_step": 33.99659848213196, "step": 146}
{"train_info/time_between_train_steps": 0.016162872314453125, "step": 146}
{"info/global_step": 147, "train_info/time_within_train_step": 34.153289794921875, "step": 147}
{"train_info/time_between_train_steps": 0.01579904556274414, "step": 147}
{"info/global_step": 148, "train_info/time_within_train_step": 34.02837562561035, "step": 148}
{"train_info/time_between_train_steps": 0.006356954574584961, "step": 148}
{"info/global_step": 149, "train_info/time_within_train_step": 34.27915000915527, "step": 149}
{"train_info/time_between_train_steps": 0.01056361198425293, "step": 149}
{"info/global_step": 150, "train_info/time_within_train_step": 34.090068340301514, "step": 150}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1734108437, "_runtime": 5211}, "step": 150}
{"logs": {"train/loss": 3.9936, "train/learning_rate": 0.0005833333333333333, "train/epoch": 3.02, "_timestamp": 1734108437, "_runtime": 5211}, "step": 150}
{"train_info/time_between_train_steps": 0.010942697525024414, "step": 150}
{"info/global_step": 151, "train_info/time_within_train_step": 34.18484115600586, "step": 151}
{"train_info/time_between_train_steps": 0.006128072738647461, "step": 151}
{"info/global_step": 152, "train_info/time_within_train_step": 34.09914016723633, "step": 152}
{"train_info/time_between_train_steps": 0.006451129913330078, "step": 152}
{"info/global_step": 153, "train_info/time_within_train_step": 34.51227402687073, "step": 153}
{"train_info/time_between_train_steps": 0.006573200225830078, "step": 153}
{"info/global_step": 154, "train_info/time_within_train_step": 34.06673622131348, "step": 154}
{"train_info/time_between_train_steps": 0.0058634281158447266, "step": 154}
{"info/global_step": 155, "train_info/time_within_train_step": 34.284374475479126, "step": 155}
{"train_info/time_between_train_steps": 0.005832672119140625, "step": 155}
{"info/global_step": 156, "train_info/time_within_train_step": 34.041964530944824, "step": 156}
{"train_info/time_between_train_steps": 0.012196779251098633, "step": 156}
{"info/global_step": 157, "train_info/time_within_train_step": 33.97952318191528, "step": 157}
{"train_info/time_between_train_steps": 0.00589299201965332, "step": 157}
{"info/global_step": 158, "train_info/time_within_train_step": 34.06334137916565, "step": 158}
{"train_info/time_between_train_steps": 0.010143280029296875, "step": 158}
{"info/global_step": 159, "train_info/time_within_train_step": 34.183645486831665, "step": 159}
{"train_info/time_between_train_steps": 0.0060100555419921875, "step": 159}
{"info/global_step": 160, "train_info/time_within_train_step": 33.987900257110596, "step": 160}
{"train_info/time_between_train_steps": 0.00578618049621582, "step": 160}
{"info/global_step": 161, "train_info/time_within_train_step": 34.16641139984131, "step": 161}
{"train_info/time_between_train_steps": 0.00895237922668457, "step": 161}
{"info/global_step": 162, "train_info/time_within_train_step": 34.027055501937866, "step": 162}
{"train_info/time_between_train_steps": 0.005893230438232422, "step": 162}
{"info/global_step": 163, "train_info/time_within_train_step": 34.19103693962097, "step": 163}
{"train_info/time_between_train_steps": 0.006663322448730469, "step": 163}
{"info/global_step": 164, "train_info/time_within_train_step": 34.13284635543823, "step": 164}
{"train_info/time_between_train_steps": 0.011075019836425781, "step": 164}
{"info/global_step": 165, "train_info/time_within_train_step": 34.08873534202576, "step": 165}
{"train_info/time_between_train_steps": 0.0133209228515625, "step": 165}
{"info/global_step": 166, "train_info/time_within_train_step": 33.98133635520935, "step": 166}
{"train_info/time_between_train_steps": 0.0059735774993896484, "step": 166}
{"info/global_step": 167, "train_info/time_within_train_step": 33.98197364807129, "step": 167}
{"train_info/time_between_train_steps": 0.011775970458984375, "step": 167}
{"info/global_step": 168, "train_info/time_within_train_step": 34.10615921020508, "step": 168}
{"train_info/time_between_train_steps": 0.006138801574707031, "step": 168}
{"info/global_step": 169, "train_info/time_within_train_step": 34.02271771430969, "step": 169}
{"train_info/time_between_train_steps": 0.006166219711303711, "step": 169}
{"info/global_step": 170, "train_info/time_within_train_step": 34.24866318702698, "step": 170}
{"train_info/time_between_train_steps": 0.011521100997924805, "step": 170}
{"info/global_step": 171, "train_info/time_within_train_step": 33.99662137031555, "step": 171}
{"train_info/time_between_train_steps": 0.0061626434326171875, "step": 171}
{"info/global_step": 172, "train_info/time_within_train_step": 34.094831228256226, "step": 172}
{"train_info/time_between_train_steps": 0.007615327835083008, "step": 172}
{"train_info/time_between_train_steps": 26.613930463790894, "step": 172}
{"info/global_step": 173, "train_info/time_within_train_step": 34.06336998939514, "step": 173}
{"train_info/time_between_train_steps": 0.006183624267578125, "step": 173}
{"info/global_step": 174, "train_info/time_within_train_step": 34.16358041763306, "step": 174}
{"train_info/time_between_train_steps": 0.006063222885131836, "step": 174}
{"info/global_step": 175, "train_info/time_within_train_step": 34.00797510147095, "step": 175}
{"train_info/time_between_train_steps": 0.0062808990478515625, "step": 175}
{"info/global_step": 176, "train_info/time_within_train_step": 34.19510006904602, "step": 176}
{"train_info/time_between_train_steps": 0.00628662109375, "step": 176}
{"info/global_step": 177, "train_info/time_within_train_step": 33.98099732398987, "step": 177}
{"train_info/time_between_train_steps": 0.0062198638916015625, "step": 177}
{"info/global_step": 178, "train_info/time_within_train_step": 34.2129590511322, "step": 178}
{"train_info/time_between_train_steps": 0.006035327911376953, "step": 178}
{"info/global_step": 179, "train_info/time_within_train_step": 34.008423805236816, "step": 179}
{"train_info/time_between_train_steps": 0.006090641021728516, "step": 179}
{"info/global_step": 180, "train_info/time_within_train_step": 34.25611066818237, "step": 180}
{"train_info/time_between_train_steps": 0.011289119720458984, "step": 180}
{"info/global_step": 181, "train_info/time_within_train_step": 34.192341804504395, "step": 181}
{"train_info/time_between_train_steps": 0.00638890266418457, "step": 181}
{"info/global_step": 182, "train_info/time_within_train_step": 34.474809646606445, "step": 182}
{"train_info/time_between_train_steps": 0.005979061126708984, "step": 182}
{"info/global_step": 183, "train_info/time_within_train_step": 34.199124574661255, "step": 183}
{"train_info/time_between_train_steps": 0.006303548812866211, "step": 183}
{"info/global_step": 184, "train_info/time_within_train_step": 34.42536187171936, "step": 184}
{"train_info/time_between_train_steps": 0.006540536880493164, "step": 184}
{"info/global_step": 185, "train_info/time_within_train_step": 34.333367109298706, "step": 185}
{"train_info/time_between_train_steps": 0.006980419158935547, "step": 185}
{"info/global_step": 186, "train_info/time_within_train_step": 34.3673529624939, "step": 186}
{"train_info/time_between_train_steps": 0.006993532180786133, "step": 186}
{"info/global_step": 187, "train_info/time_within_train_step": 34.2272675037384, "step": 187}
{"train_info/time_between_train_steps": 0.00651860237121582, "step": 187}
{"info/global_step": 188, "train_info/time_within_train_step": 34.29303741455078, "step": 188}
{"train_info/time_between_train_steps": 0.011284828186035156, "step": 188}
{"info/global_step": 189, "train_info/time_within_train_step": 34.15441679954529, "step": 189}
{"train_info/time_between_train_steps": 0.006312847137451172, "step": 189}
{"info/global_step": 190, "train_info/time_within_train_step": 34.21016311645508, "step": 190}
{"train_info/time_between_train_steps": 0.006408214569091797, "step": 190}
{"info/global_step": 191, "train_info/time_within_train_step": 34.043492555618286, "step": 191}
{"train_info/time_between_train_steps": 0.00628209114074707, "step": 191}
{"info/global_step": 192, "train_info/time_within_train_step": 34.1928927898407, "step": 192}
{"train_info/time_between_train_steps": 0.006371259689331055, "step": 192}
{"info/global_step": 193, "train_info/time_within_train_step": 34.09074306488037, "step": 193}
{"train_info/time_between_train_steps": 0.011012792587280273, "step": 193}
{"info/global_step": 194, "train_info/time_within_train_step": 34.25008678436279, "step": 194}
{"train_info/time_between_train_steps": 0.012501239776611328, "step": 194}
{"info/global_step": 195, "train_info/time_within_train_step": 34.07308626174927, "step": 195}
{"train_info/time_between_train_steps": 0.016669750213623047, "step": 195}
{"info/global_step": 196, "train_info/time_within_train_step": 34.20056700706482, "step": 196}
{"train_info/time_between_train_steps": 0.006210803985595703, "step": 196}
{"info/global_step": 197, "train_info/time_within_train_step": 34.07547688484192, "step": 197}
{"train_info/time_between_train_steps": 0.015059709548950195, "step": 197}
{"info/global_step": 198, "train_info/time_within_train_step": 34.05401134490967, "step": 198}
{"train_info/time_between_train_steps": 0.0057697296142578125, "step": 198}
{"info/global_step": 199, "train_info/time_within_train_step": 34.034796953201294, "step": 199}
{"train_info/time_between_train_steps": 0.005800962448120117, "step": 199}
{"info/global_step": 200, "train_info/time_within_train_step": 34.068708658218384, "step": 200}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1734110172, "_runtime": 6946}, "step": 200}
{"logs": {"train/loss": 3.7529, "train/learning_rate": 0.0005555555555555556, "train/epoch": 4.02, "_timestamp": 1734110172, "_runtime": 6946}, "step": 200}
{"train_info/time_between_train_steps": 2.745527744293213, "step": 200}
{"info/global_step": 201, "train_info/time_within_train_step": 34.46287250518799, "step": 201}
{"train_info/time_between_train_steps": 0.006052970886230469, "step": 201}
{"info/global_step": 202, "train_info/time_within_train_step": 34.08556842803955, "step": 202}
{"train_info/time_between_train_steps": 0.005838632583618164, "step": 202}
{"info/global_step": 203, "train_info/time_within_train_step": 34.26433968544006, "step": 203}
{"train_info/time_between_train_steps": 0.010427474975585938, "step": 203}
{"info/global_step": 204, "train_info/time_within_train_step": 34.150113105773926, "step": 204}
{"train_info/time_between_train_steps": 0.005831003189086914, "step": 204}
{"info/global_step": 205, "train_info/time_within_train_step": 34.133689880371094, "step": 205}
{"train_info/time_between_train_steps": 0.005990266799926758, "step": 205}
{"info/global_step": 206, "train_info/time_within_train_step": 34.08969831466675, "step": 206}
{"train_info/time_between_train_steps": 0.006070613861083984, "step": 206}
{"info/global_step": 207, "train_info/time_within_train_step": 34.083009243011475, "step": 207}
{"train_info/time_between_train_steps": 0.005859851837158203, "step": 207}
{"info/global_step": 208, "train_info/time_within_train_step": 34.090167760849, "step": 208}
{"train_info/time_between_train_steps": 0.005912303924560547, "step": 208}
{"info/global_step": 209, "train_info/time_within_train_step": 34.1972222328186, "step": 209}
{"train_info/time_between_train_steps": 0.007247209548950195, "step": 209}
{"info/global_step": 210, "train_info/time_within_train_step": 34.05272436141968, "step": 210}
{"train_info/time_between_train_steps": 0.006012916564941406, "step": 210}
{"info/global_step": 211, "train_info/time_within_train_step": 34.15764403343201, "step": 211}
{"train_info/time_between_train_steps": 0.010639190673828125, "step": 211}
{"info/global_step": 212, "train_info/time_within_train_step": 34.247702836990356, "step": 212}
{"train_info/time_between_train_steps": 0.005982637405395508, "step": 212}
{"info/global_step": 213, "train_info/time_within_train_step": 34.11182689666748, "step": 213}
{"train_info/time_between_train_steps": 0.011190414428710938, "step": 213}
{"info/global_step": 214, "train_info/time_within_train_step": 34.22276449203491, "step": 214}
{"train_info/time_between_train_steps": 0.008890867233276367, "step": 214}
{"info/global_step": 215, "train_info/time_within_train_step": 34.360405921936035, "step": 215}
{"train_info/time_between_train_steps": 0.013082504272460938, "step": 215}
{"train_info/time_between_train_steps": 26.81517004966736, "step": 215}
{"info/global_step": 216, "train_info/time_within_train_step": 34.40673828125, "step": 216}
{"train_info/time_between_train_steps": 0.005603790283203125, "step": 216}
{"info/global_step": 217, "train_info/time_within_train_step": 34.3634672164917, "step": 217}
{"train_info/time_between_train_steps": 0.00600433349609375, "step": 217}
{"info/global_step": 218, "train_info/time_within_train_step": 34.149338722229004, "step": 218}
{"train_info/time_between_train_steps": 0.010584831237792969, "step": 218}
{"info/global_step": 219, "train_info/time_within_train_step": 34.28304076194763, "step": 219}
{"train_info/time_between_train_steps": 0.005861759185791016, "step": 219}
{"info/global_step": 220, "train_info/time_within_train_step": 34.08326959609985, "step": 220}
{"train_info/time_between_train_steps": 0.006216764450073242, "step": 220}
{"info/global_step": 221, "train_info/time_within_train_step": 34.44823122024536, "step": 221}
{"train_info/time_between_train_steps": 0.009979963302612305, "step": 221}
{"info/global_step": 222, "train_info/time_within_train_step": 34.1723358631134, "step": 222}
{"train_info/time_between_train_steps": 0.007128715515136719, "step": 222}
{"info/global_step": 223, "train_info/time_within_train_step": 34.2101776599884, "step": 223}
{"train_info/time_between_train_steps": 0.005918979644775391, "step": 223}
{"info/global_step": 224, "train_info/time_within_train_step": 34.231805086135864, "step": 224}
{"train_info/time_between_train_steps": 0.006223440170288086, "step": 224}
{"info/global_step": 225, "train_info/time_within_train_step": 34.270036935806274, "step": 225}
{"train_info/time_between_train_steps": 0.010921001434326172, "step": 225}
{"info/global_step": 226, "train_info/time_within_train_step": 34.18270754814148, "step": 226}
{"train_info/time_between_train_steps": 0.010262727737426758, "step": 226}
{"info/global_step": 227, "train_info/time_within_train_step": 34.36387491226196, "step": 227}
{"train_info/time_between_train_steps": 0.011190414428710938, "step": 227}
{"info/global_step": 228, "train_info/time_within_train_step": 34.13195037841797, "step": 228}
{"train_info/time_between_train_steps": 0.006173610687255859, "step": 228}
{"info/global_step": 229, "train_info/time_within_train_step": 34.29951763153076, "step": 229}
{"train_info/time_between_train_steps": 0.006455898284912109, "step": 229}
{"info/global_step": 230, "train_info/time_within_train_step": 34.13550567626953, "step": 230}
{"train_info/time_between_train_steps": 0.01055765151977539, "step": 230}
{"info/global_step": 231, "train_info/time_within_train_step": 34.43753266334534, "step": 231}
{"train_info/time_between_train_steps": 0.006089448928833008, "step": 231}
{"info/global_step": 232, "train_info/time_within_train_step": 34.22939944267273, "step": 232}
{"train_info/time_between_train_steps": 0.010111331939697266, "step": 232}
{"info/global_step": 233, "train_info/time_within_train_step": 34.68118619918823, "step": 233}
{"train_info/time_between_train_steps": 0.011347532272338867, "step": 233}
{"info/global_step": 234, "train_info/time_within_train_step": 34.17653250694275, "step": 234}
{"train_info/time_between_train_steps": 0.005821943283081055, "step": 234}
{"info/global_step": 235, "train_info/time_within_train_step": 34.21333384513855, "step": 235}
{"train_info/time_between_train_steps": 0.010896444320678711, "step": 235}
{"info/global_step": 236, "train_info/time_within_train_step": 34.024845361709595, "step": 236}
{"train_info/time_between_train_steps": 0.006018161773681641, "step": 236}
{"info/global_step": 237, "train_info/time_within_train_step": 34.30338764190674, "step": 237}
{"train_info/time_between_train_steps": 0.005991220474243164, "step": 237}
{"info/global_step": 238, "train_info/time_within_train_step": 34.13879656791687, "step": 238}
{"train_info/time_between_train_steps": 0.0061304569244384766, "step": 238}
{"info/global_step": 239, "train_info/time_within_train_step": 34.196686029434204, "step": 239}
{"train_info/time_between_train_steps": 0.006178379058837891, "step": 239}
{"info/global_step": 240, "train_info/time_within_train_step": 34.062493324279785, "step": 240}
{"train_info/time_between_train_steps": 0.00568699836730957, "step": 240}
{"info/global_step": 241, "train_info/time_within_train_step": 34.14719891548157, "step": 241}
{"train_info/time_between_train_steps": 0.009709596633911133, "step": 241}
{"info/global_step": 242, "train_info/time_within_train_step": 34.29735231399536, "step": 242}
{"train_info/time_between_train_steps": 0.006089687347412109, "step": 242}
{"info/global_step": 243, "train_info/time_within_train_step": 34.17421817779541, "step": 243}
{"train_info/time_between_train_steps": 0.005987644195556641, "step": 243}
{"info/global_step": 244, "train_info/time_within_train_step": 34.117730140686035, "step": 244}
{"train_info/time_between_train_steps": 0.0059490203857421875, "step": 244}
{"info/global_step": 245, "train_info/time_within_train_step": 34.129117250442505, "step": 245}
{"train_info/time_between_train_steps": 0.010821342468261719, "step": 245}
{"info/global_step": 246, "train_info/time_within_train_step": 34.24424934387207, "step": 246}
{"train_info/time_between_train_steps": 0.010487079620361328, "step": 246}
{"info/global_step": 247, "train_info/time_within_train_step": 34.42402410507202, "step": 247}
{"train_info/time_between_train_steps": 0.005831003189086914, "step": 247}
{"info/global_step": 248, "train_info/time_within_train_step": 34.21126317977905, "step": 248}
{"train_info/time_between_train_steps": 0.010119199752807617, "step": 248}
{"info/global_step": 249, "train_info/time_within_train_step": 34.07240056991577, "step": 249}
{"train_info/time_between_train_steps": 0.006201982498168945, "step": 249}
{"info/global_step": 250, "train_info/time_within_train_step": 34.13998317718506, "step": 250}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1734111913, "_runtime": 8687}, "step": 250}
{"logs": {"train/loss": 3.6008, "train/learning_rate": 0.0005277777777777777, "train/epoch": 5.03, "_timestamp": 1734111913, "_runtime": 8687}, "step": 250}
{"train_info/time_between_train_steps": 0.013815879821777344, "step": 250}
{"info/global_step": 251, "train_info/time_within_train_step": 34.17178916931152, "step": 251}
{"train_info/time_between_train_steps": 0.010366439819335938, "step": 251}
{"info/global_step": 252, "train_info/time_within_train_step": 34.126707553863525, "step": 252}
{"train_info/time_between_train_steps": 0.01095724105834961, "step": 252}
{"info/global_step": 253, "train_info/time_within_train_step": 34.17957139015198, "step": 253}
{"train_info/time_between_train_steps": 0.006711006164550781, "step": 253}
{"info/global_step": 254, "train_info/time_within_train_step": 34.19972586631775, "step": 254}
{"train_info/time_between_train_steps": 0.00725102424621582, "step": 254}
{"info/global_step": 255, "train_info/time_within_train_step": 34.188737869262695, "step": 255}
{"train_info/time_between_train_steps": 0.006234407424926758, "step": 255}
{"info/global_step": 256, "train_info/time_within_train_step": 34.18542957305908, "step": 256}
{"train_info/time_between_train_steps": 0.006170749664306641, "step": 256}
{"info/global_step": 257, "train_info/time_within_train_step": 34.29308199882507, "step": 257}
{"train_info/time_between_train_steps": 0.010462760925292969, "step": 257}
{"info/global_step": 258, "train_info/time_within_train_step": 34.281450033187866, "step": 258}
{"train_info/time_between_train_steps": 0.015820741653442383, "step": 258}
{"train_info/time_between_train_steps": 27.13924765586853, "step": 258}
{"info/global_step": 259, "train_info/time_within_train_step": 34.221776723861694, "step": 259}
{"train_info/time_between_train_steps": 0.006587028503417969, "step": 259}
{"info/global_step": 260, "train_info/time_within_train_step": 34.51504683494568, "step": 260}
{"train_info/time_between_train_steps": 0.00722813606262207, "step": 260}
{"info/global_step": 261, "train_info/time_within_train_step": 34.09301543235779, "step": 261}
{"train_info/time_between_train_steps": 0.016392230987548828, "step": 261}
{"info/global_step": 262, "train_info/time_within_train_step": 34.63077759742737, "step": 262}
{"train_info/time_between_train_steps": 0.006147623062133789, "step": 262}
{"info/global_step": 263, "train_info/time_within_train_step": 34.31304717063904, "step": 263}
{"train_info/time_between_train_steps": 0.006626605987548828, "step": 263}
{"info/global_step": 264, "train_info/time_within_train_step": 34.38344669342041, "step": 264}
{"train_info/time_between_train_steps": 0.011461734771728516, "step": 264}
{"info/global_step": 265, "train_info/time_within_train_step": 34.271610736846924, "step": 265}
{"train_info/time_between_train_steps": 0.0065975189208984375, "step": 265}
{"info/global_step": 266, "train_info/time_within_train_step": 34.32634210586548, "step": 266}
{"train_info/time_between_train_steps": 0.01064157485961914, "step": 266}
{"info/global_step": 267, "train_info/time_within_train_step": 34.24335837364197, "step": 267}
{"train_info/time_between_train_steps": 0.010327577590942383, "step": 267}
{"info/global_step": 268, "train_info/time_within_train_step": 34.41081953048706, "step": 268}
{"train_info/time_between_train_steps": 0.0064983367919921875, "step": 268}
{"info/global_step": 269, "train_info/time_within_train_step": 34.332743406295776, "step": 269}
{"train_info/time_between_train_steps": 0.01320505142211914, "step": 269}
{"info/global_step": 270, "train_info/time_within_train_step": 34.325939416885376, "step": 270}
{"train_info/time_between_train_steps": 0.007215976715087891, "step": 270}
{"info/global_step": 271, "train_info/time_within_train_step": 34.40087604522705, "step": 271}
{"train_info/time_between_train_steps": 0.011053323745727539, "step": 271}
{"info/global_step": 272, "train_info/time_within_train_step": 34.39207172393799, "step": 272}
{"train_info/time_between_train_steps": 0.006018877029418945, "step": 272}
{"info/global_step": 273, "train_info/time_within_train_step": 34.39733958244324, "step": 273}
{"train_info/time_between_train_steps": 0.012217521667480469, "step": 273}
{"info/global_step": 274, "train_info/time_within_train_step": 34.38490700721741, "step": 274}
{"train_info/time_between_train_steps": 0.00912022590637207, "step": 274}
{"info/global_step": 275, "train_info/time_within_train_step": 34.16107130050659, "step": 275}
{"train_info/time_between_train_steps": 0.010946512222290039, "step": 275}
{"info/global_step": 276, "train_info/time_within_train_step": 34.39081859588623, "step": 276}
{"train_info/time_between_train_steps": 0.00670170783996582, "step": 276}
{"info/global_step": 277, "train_info/time_within_train_step": 34.16358494758606, "step": 277}
{"train_info/time_between_train_steps": 0.013059616088867188, "step": 277}
{"info/global_step": 278, "train_info/time_within_train_step": 34.97800135612488, "step": 278}
{"train_info/time_between_train_steps": 0.01386117935180664, "step": 278}
{"info/global_step": 279, "train_info/time_within_train_step": 34.199803829193115, "step": 279}
{"train_info/time_between_train_steps": 0.006385326385498047, "step": 279}
{"info/global_step": 280, "train_info/time_within_train_step": 34.38776779174805, "step": 280}
{"train_info/time_between_train_steps": 0.012097358703613281, "step": 280}
{"info/global_step": 281, "train_info/time_within_train_step": 34.2164990901947, "step": 281}
{"train_info/time_between_train_steps": 0.0066378116607666016, "step": 281}
{"info/global_step": 282, "train_info/time_within_train_step": 34.38660383224487, "step": 282}
{"train_info/time_between_train_steps": 0.006817817687988281, "step": 282}
{"info/global_step": 283, "train_info/time_within_train_step": 34.07837414741516, "step": 283}
{"train_info/time_between_train_steps": 0.005988121032714844, "step": 283}
{"info/global_step": 284, "train_info/time_within_train_step": 34.18168640136719, "step": 284}
{"train_info/time_between_train_steps": 0.006245613098144531, "step": 284}
{"info/global_step": 285, "train_info/time_within_train_step": 34.09514021873474, "step": 285}
{"train_info/time_between_train_steps": 0.009616851806640625, "step": 285}
{"info/global_step": 286, "train_info/time_within_train_step": 34.13654088973999, "step": 286}
{"train_info/time_between_train_steps": 0.006100893020629883, "step": 286}
{"info/global_step": 287, "train_info/time_within_train_step": 34.041560649871826, "step": 287}
{"train_info/time_between_train_steps": 0.0078084468841552734, "step": 287}
{"info/global_step": 288, "train_info/time_within_train_step": 34.090166330337524, "step": 288}
{"train_info/time_between_train_steps": 0.010449886322021484, "step": 288}
{"info/global_step": 289, "train_info/time_within_train_step": 34.202399253845215, "step": 289}
{"train_info/time_between_train_steps": 0.005972862243652344, "step": 289}
{"info/global_step": 290, "train_info/time_within_train_step": 34.103012561798096, "step": 290}
{"train_info/time_between_train_steps": 0.005843639373779297, "step": 290}
{"info/global_step": 291, "train_info/time_within_train_step": 34.06982398033142, "step": 291}
{"train_info/time_between_train_steps": 0.01540994644165039, "step": 291}
{"info/global_step": 292, "train_info/time_within_train_step": 34.230393409729004, "step": 292}
{"train_info/time_between_train_steps": 0.010387897491455078, "step": 292}
{"info/global_step": 293, "train_info/time_within_train_step": 34.386269330978394, "step": 293}
{"train_info/time_between_train_steps": 0.005856990814208984, "step": 293}
{"info/global_step": 294, "train_info/time_within_train_step": 34.08035063743591, "step": 294}
{"train_info/time_between_train_steps": 0.00757288932800293, "step": 294}
{"info/global_step": 295, "train_info/time_within_train_step": 34.25092673301697, "step": 295}
{"train_info/time_between_train_steps": 0.0060083866119384766, "step": 295}
{"info/global_step": 296, "train_info/time_within_train_step": 34.24820852279663, "step": 296}
{"train_info/time_between_train_steps": 0.00952005386352539, "step": 296}
{"info/global_step": 297, "train_info/time_within_train_step": 34.23806142807007, "step": 297}
{"train_info/time_between_train_steps": 0.006866455078125, "step": 297}
{"info/global_step": 298, "train_info/time_within_train_step": 34.11659598350525, "step": 298}
{"train_info/time_between_train_steps": 0.011444568634033203, "step": 298}
{"info/global_step": 299, "train_info/time_within_train_step": 35.239144802093506, "step": 299}
{"train_info/time_between_train_steps": 0.0060329437255859375, "step": 299}
{"info/global_step": 300, "train_info/time_within_train_step": 35.62387466430664, "step": 300}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1734113656, "_runtime": 10430}, "step": 300}
{"logs": {"train/loss": 3.3332, "train/learning_rate": 0.0005, "train/epoch": 6.04, "_timestamp": 1734113656, "_runtime": 10430}, "step": 300}
{"train_info/time_between_train_steps": 14.12177324295044, "step": 300}
{"info/global_step": 301, "train_info/time_within_train_step": 34.261027336120605, "step": 301}
{"train_info/time_between_train_steps": 0.007962465286254883, "step": 301}
{"train_info/time_between_train_steps": 27.580817222595215, "step": 301}
{"info/global_step": 302, "train_info/time_within_train_step": 34.28074836730957, "step": 302}
{"train_info/time_between_train_steps": 0.00862884521484375, "step": 302}
{"info/global_step": 303, "train_info/time_within_train_step": 34.37270641326904, "step": 303}
{"train_info/time_between_train_steps": 0.009365558624267578, "step": 303}
{"info/global_step": 304, "train_info/time_within_train_step": 34.26587414741516, "step": 304}
{"train_info/time_between_train_steps": 0.006726264953613281, "step": 304}
{"info/global_step": 305, "train_info/time_within_train_step": 34.37726902961731, "step": 305}
{"train_info/time_between_train_steps": 0.00701594352722168, "step": 305}
{"info/global_step": 306, "train_info/time_within_train_step": 34.217069149017334, "step": 306}
{"train_info/time_between_train_steps": 0.013765335083007812, "step": 306}
{"info/global_step": 307, "train_info/time_within_train_step": 34.474120140075684, "step": 307}
{"train_info/time_between_train_steps": 0.006487369537353516, "step": 307}
{"info/global_step": 308, "train_info/time_within_train_step": 34.44165372848511, "step": 308}
{"train_info/time_between_train_steps": 0.016546249389648438, "step": 308}
{"info/global_step": 309, "train_info/time_within_train_step": 34.370197772979736, "step": 309}
{"train_info/time_between_train_steps": 0.012229681015014648, "step": 309}
{"info/global_step": 310, "train_info/time_within_train_step": 34.229565382003784, "step": 310}
{"train_info/time_between_train_steps": 0.0067102909088134766, "step": 310}
{"info/global_step": 311, "train_info/time_within_train_step": 34.38563895225525, "step": 311}
{"train_info/time_between_train_steps": 0.0061495304107666016, "step": 311}
{"info/global_step": 312, "train_info/time_within_train_step": 34.22708773612976, "step": 312}
{"train_info/time_between_train_steps": 0.00654292106628418, "step": 312}
{"info/global_step": 313, "train_info/time_within_train_step": 34.344260692596436, "step": 313}
{"train_info/time_between_train_steps": 0.006395578384399414, "step": 313}
{"info/global_step": 314, "train_info/time_within_train_step": 34.28732681274414, "step": 314}
{"train_info/time_between_train_steps": 0.006659746170043945, "step": 314}
{"info/global_step": 315, "train_info/time_within_train_step": 34.515645265579224, "step": 315}
{"train_info/time_between_train_steps": 0.009372949600219727, "step": 315}
{"info/global_step": 316, "train_info/time_within_train_step": 34.207900524139404, "step": 316}
{"train_info/time_between_train_steps": 0.01212930679321289, "step": 316}
{"info/global_step": 317, "train_info/time_within_train_step": 34.55086374282837, "step": 317}
{"train_info/time_between_train_steps": 0.008608579635620117, "step": 317}
{"info/global_step": 318, "train_info/time_within_train_step": 34.20672011375427, "step": 318}
{"train_info/time_between_train_steps": 0.01114034652709961, "step": 318}
{"info/global_step": 319, "train_info/time_within_train_step": 34.480952501297, "step": 319}
{"train_info/time_between_train_steps": 0.012526273727416992, "step": 319}
{"info/global_step": 320, "train_info/time_within_train_step": 34.10595750808716, "step": 320}
{"train_info/time_between_train_steps": 0.012215375900268555, "step": 320}
{"info/global_step": 321, "train_info/time_within_train_step": 34.2928512096405, "step": 321}
{"train_info/time_between_train_steps": 0.009712934494018555, "step": 321}
{"info/global_step": 322, "train_info/time_within_train_step": 34.270238637924194, "step": 322}
{"train_info/time_between_train_steps": 0.006621122360229492, "step": 322}
{"info/global_step": 323, "train_info/time_within_train_step": 34.3855459690094, "step": 323}
{"train_info/time_between_train_steps": 0.007115364074707031, "step": 323}
{"info/global_step": 324, "train_info/time_within_train_step": 34.412190437316895, "step": 324}
{"train_info/time_between_train_steps": 0.0067424774169921875, "step": 324}
{"info/global_step": 325, "train_info/time_within_train_step": 34.32795524597168, "step": 325}
{"train_info/time_between_train_steps": 0.010703563690185547, "step": 325}
{"info/global_step": 326, "train_info/time_within_train_step": 34.223628759384155, "step": 326}
{"train_info/time_between_train_steps": 0.010785579681396484, "step": 326}
{"info/global_step": 327, "train_info/time_within_train_step": 34.27396631240845, "step": 327}
{"train_info/time_between_train_steps": 0.01644277572631836, "step": 327}
{"info/global_step": 328, "train_info/time_within_train_step": 34.25175380706787, "step": 328}
{"train_info/time_between_train_steps": 0.011823892593383789, "step": 328}
{"info/global_step": 329, "train_info/time_within_train_step": 34.13899040222168, "step": 329}
{"train_info/time_between_train_steps": 0.006155252456665039, "step": 329}
{"info/global_step": 330, "train_info/time_within_train_step": 34.259663820266724, "step": 330}
{"train_info/time_between_train_steps": 0.00694727897644043, "step": 330}
{"info/global_step": 331, "train_info/time_within_train_step": 34.24352788925171, "step": 331}
{"train_info/time_between_train_steps": 0.010040521621704102, "step": 331}
{"info/global_step": 332, "train_info/time_within_train_step": 34.18221569061279, "step": 332}
{"train_info/time_between_train_steps": 0.006060600280761719, "step": 332}
{"info/global_step": 333, "train_info/time_within_train_step": 34.249038219451904, "step": 333}
{"train_info/time_between_train_steps": 0.008282899856567383, "step": 333}
{"info/global_step": 334, "train_info/time_within_train_step": 34.251885414123535, "step": 334}
{"train_info/time_between_train_steps": 0.011467456817626953, "step": 334}
{"info/global_step": 335, "train_info/time_within_train_step": 34.130019426345825, "step": 335}
{"train_info/time_between_train_steps": 0.006550312042236328, "step": 335}
{"info/global_step": 336, "train_info/time_within_train_step": 34.26395297050476, "step": 336}
{"train_info/time_between_train_steps": 0.005912303924560547, "step": 336}
{"info/global_step": 337, "train_info/time_within_train_step": 34.22209072113037, "step": 337}
{"train_info/time_between_train_steps": 0.010677337646484375, "step": 337}
{"info/global_step": 338, "train_info/time_within_train_step": 34.1513397693634, "step": 338}
{"train_info/time_between_train_steps": 0.010461807250976562, "step": 338}
{"info/global_step": 339, "train_info/time_within_train_step": 34.441017389297485, "step": 339}
{"train_info/time_between_train_steps": 0.012062311172485352, "step": 339}
{"info/global_step": 340, "train_info/time_within_train_step": 34.20897078514099, "step": 340}
{"train_info/time_between_train_steps": 0.01101994514465332, "step": 340}
{"info/global_step": 341, "train_info/time_within_train_step": 34.24276041984558, "step": 341}
{"train_info/time_between_train_steps": 0.017126798629760742, "step": 341}
{"info/global_step": 342, "train_info/time_within_train_step": 34.33103370666504, "step": 342}
{"train_info/time_between_train_steps": 0.0062983036041259766, "step": 342}
{"info/global_step": 343, "train_info/time_within_train_step": 34.18323111534119, "step": 343}
{"train_info/time_between_train_steps": 0.006414651870727539, "step": 343}
{"info/global_step": 344, "train_info/time_within_train_step": 34.204798221588135, "step": 344}
{"train_info/time_between_train_steps": 0.012496709823608398, "step": 344}
{"train_info/time_between_train_steps": 27.11453866958618, "step": 344}
{"info/global_step": 345, "train_info/time_within_train_step": 34.230499505996704, "step": 345}
{"train_info/time_between_train_steps": 0.008006572723388672, "step": 345}
{"info/global_step": 346, "train_info/time_within_train_step": 34.32986497879028, "step": 346}
{"train_info/time_between_train_steps": 0.006192684173583984, "step": 346}
{"info/global_step": 347, "train_info/time_within_train_step": 34.18634247779846, "step": 347}
{"train_info/time_between_train_steps": 0.006623506546020508, "step": 347}
{"info/global_step": 348, "train_info/time_within_train_step": 34.48545813560486, "step": 348}
{"train_info/time_between_train_steps": 0.006570339202880859, "step": 348}
{"info/global_step": 349, "train_info/time_within_train_step": 34.35677194595337, "step": 349}
{"train_info/time_between_train_steps": 0.0063610076904296875, "step": 349}
{"info/global_step": 350, "train_info/time_within_train_step": 34.34046649932861, "step": 350}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1734115440, "_runtime": 12214}, "step": 350}
{"logs": {"train/loss": 3.089, "train/learning_rate": 0.00047222222222222224, "train/epoch": 8.01, "_timestamp": 1734115440, "_runtime": 12214}, "step": 350}
{"train_info/time_between_train_steps": 0.01392507553100586, "step": 350}
{"info/global_step": 351, "train_info/time_within_train_step": 34.31817650794983, "step": 351}
{"train_info/time_between_train_steps": 0.010648012161254883, "step": 351}
{"info/global_step": 352, "train_info/time_within_train_step": 34.44677925109863, "step": 352}
{"train_info/time_between_train_steps": 0.011536836624145508, "step": 352}
{"info/global_step": 353, "train_info/time_within_train_step": 34.25729560852051, "step": 353}
{"train_info/time_between_train_steps": 0.010808944702148438, "step": 353}
{"info/global_step": 354, "train_info/time_within_train_step": 34.62841439247131, "step": 354}
{"train_info/time_between_train_steps": 0.014727592468261719, "step": 354}
{"info/global_step": 355, "train_info/time_within_train_step": 34.074073791503906, "step": 355}
{"train_info/time_between_train_steps": 0.006512641906738281, "step": 355}
{"info/global_step": 356, "train_info/time_within_train_step": 34.376864194869995, "step": 356}
{"train_info/time_between_train_steps": 0.011105537414550781, "step": 356}
{"info/global_step": 357, "train_info/time_within_train_step": 34.190125703811646, "step": 357}
{"train_info/time_between_train_steps": 0.010584115982055664, "step": 357}
{"info/global_step": 358, "train_info/time_within_train_step": 34.49840807914734, "step": 358}
{"train_info/time_between_train_steps": 0.013538360595703125, "step": 358}
{"info/global_step": 359, "train_info/time_within_train_step": 34.229185342788696, "step": 359}
{"train_info/time_between_train_steps": 0.012097835540771484, "step": 359}
{"info/global_step": 360, "train_info/time_within_train_step": 34.43581247329712, "step": 360}
{"train_info/time_between_train_steps": 0.011346578598022461, "step": 360}
{"info/global_step": 361, "train_info/time_within_train_step": 34.25221085548401, "step": 361}
{"train_info/time_between_train_steps": 0.007520437240600586, "step": 361}
{"info/global_step": 362, "train_info/time_within_train_step": 34.57213115692139, "step": 362}
{"train_info/time_between_train_steps": 0.0065801143646240234, "step": 362}
{"info/global_step": 363, "train_info/time_within_train_step": 34.208927154541016, "step": 363}
{"train_info/time_between_train_steps": 0.006808757781982422, "step": 363}
{"info/global_step": 364, "train_info/time_within_train_step": 34.42774820327759, "step": 364}
{"train_info/time_between_train_steps": 0.012075662612915039, "step": 364}
{"info/global_step": 365, "train_info/time_within_train_step": 34.30966138839722, "step": 365}
{"train_info/time_between_train_steps": 0.01192617416381836, "step": 365}
{"info/global_step": 366, "train_info/time_within_train_step": 34.37486481666565, "step": 366}
{"train_info/time_between_train_steps": 0.00728607177734375, "step": 366}
{"info/global_step": 367, "train_info/time_within_train_step": 34.13842511177063, "step": 367}
{"train_info/time_between_train_steps": 0.012042760848999023, "step": 367}
{"info/global_step": 368, "train_info/time_within_train_step": 34.39811301231384, "step": 368}
{"train_info/time_between_train_steps": 0.010215997695922852, "step": 368}
{"info/global_step": 369, "train_info/time_within_train_step": 34.25152897834778, "step": 369}
{"train_info/time_between_train_steps": 0.009418487548828125, "step": 369}
{"info/global_step": 370, "train_info/time_within_train_step": 34.42754244804382, "step": 370}
{"train_info/time_between_train_steps": 0.01241922378540039, "step": 370}
{"info/global_step": 371, "train_info/time_within_train_step": 34.24987173080444, "step": 371}
{"train_info/time_between_train_steps": 0.010465145111083984, "step": 371}
{"info/global_step": 372, "train_info/time_within_train_step": 34.26999497413635, "step": 372}
{"train_info/time_between_train_steps": 0.012844562530517578, "step": 372}
{"info/global_step": 373, "train_info/time_within_train_step": 34.22074031829834, "step": 373}
{"train_info/time_between_train_steps": 0.011411190032958984, "step": 373}
{"info/global_step": 374, "train_info/time_within_train_step": 34.24028754234314, "step": 374}
{"train_info/time_between_train_steps": 0.006029844284057617, "step": 374}
{"info/global_step": 375, "train_info/time_within_train_step": 34.141282081604004, "step": 375}
{"train_info/time_between_train_steps": 0.007599830627441406, "step": 375}
{"info/global_step": 376, "train_info/time_within_train_step": 34.13849496841431, "step": 376}
{"train_info/time_between_train_steps": 0.010254621505737305, "step": 376}
{"info/global_step": 377, "train_info/time_within_train_step": 34.19999289512634, "step": 377}
{"train_info/time_between_train_steps": 0.016499757766723633, "step": 377}
{"info/global_step": 378, "train_info/time_within_train_step": 34.2524528503418, "step": 378}
{"train_info/time_between_train_steps": 0.009219169616699219, "step": 378}
{"info/global_step": 379, "train_info/time_within_train_step": 34.243844985961914, "step": 379}
{"train_info/time_between_train_steps": 0.012581110000610352, "step": 379}
{"info/global_step": 380, "train_info/time_within_train_step": 34.22904706001282, "step": 380}
{"train_info/time_between_train_steps": 0.006061077117919922, "step": 380}
{"info/global_step": 381, "train_info/time_within_train_step": 34.27211380004883, "step": 381}
{"train_info/time_between_train_steps": 0.01650547981262207, "step": 381}
{"info/global_step": 382, "train_info/time_within_train_step": 34.216931104660034, "step": 382}
{"train_info/time_between_train_steps": 0.006096839904785156, "step": 382}
{"info/global_step": 383, "train_info/time_within_train_step": 34.2033007144928, "step": 383}
{"train_info/time_between_train_steps": 0.0060002803802490234, "step": 383}
{"info/global_step": 384, "train_info/time_within_train_step": 34.27495551109314, "step": 384}
{"train_info/time_between_train_steps": 0.01219320297241211, "step": 384}
{"info/global_step": 385, "train_info/time_within_train_step": 34.19855833053589, "step": 385}
{"train_info/time_between_train_steps": 0.006455898284912109, "step": 385}
{"info/global_step": 386, "train_info/time_within_train_step": 34.46439456939697, "step": 386}
{"train_info/time_between_train_steps": 0.010283231735229492, "step": 386}
{"info/global_step": 387, "train_info/time_within_train_step": 34.2139208316803, "step": 387}
{"train_info/time_between_train_steps": 0.00972890853881836, "step": 387}
{"train_info/time_between_train_steps": 26.96681809425354, "step": 387}
{"info/global_step": 388, "train_info/time_within_train_step": 34.27231693267822, "step": 388}
{"train_info/time_between_train_steps": 0.006596803665161133, "step": 388}
{"info/global_step": 389, "train_info/time_within_train_step": 34.40229678153992, "step": 389}
{"train_info/time_between_train_steps": 0.013120889663696289, "step": 389}
{"info/global_step": 390, "train_info/time_within_train_step": 34.21338152885437, "step": 390}
{"train_info/time_between_train_steps": 0.006009101867675781, "step": 390}
{"info/global_step": 391, "train_info/time_within_train_step": 34.39407515525818, "step": 391}
{"train_info/time_between_train_steps": 0.006142377853393555, "step": 391}
{"info/global_step": 392, "train_info/time_within_train_step": 34.225438594818115, "step": 392}
{"train_info/time_between_train_steps": 0.005970478057861328, "step": 392}
{"info/global_step": 393, "train_info/time_within_train_step": 34.51599836349487, "step": 393}
{"train_info/time_between_train_steps": 0.011084794998168945, "step": 393}
{"info/global_step": 394, "train_info/time_within_train_step": 34.3559467792511, "step": 394}
{"train_info/time_between_train_steps": 0.006688117980957031, "step": 394}
{"info/global_step": 395, "train_info/time_within_train_step": 34.536405086517334, "step": 395}
{"train_info/time_between_train_steps": 0.012242555618286133, "step": 395}
{"info/global_step": 396, "train_info/time_within_train_step": 34.30248689651489, "step": 396}
{"train_info/time_between_train_steps": 0.006634235382080078, "step": 396}
{"info/global_step": 397, "train_info/time_within_train_step": 34.242165327072144, "step": 397}
{"train_info/time_between_train_steps": 0.006259441375732422, "step": 397}
{"info/global_step": 398, "train_info/time_within_train_step": 34.12793517112732, "step": 398}
{"train_info/time_between_train_steps": 0.010818719863891602, "step": 398}
{"info/global_step": 399, "train_info/time_within_train_step": 34.3171546459198, "step": 399}
{"train_info/time_between_train_steps": 0.010056257247924805, "step": 399}
{"info/global_step": 400, "train_info/time_within_train_step": 34.374067544937134, "step": 400}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1734117182, "_runtime": 13956}, "step": 400}
{"logs": {"train/loss": 2.8687, "train/learning_rate": 0.00044444444444444436, "train/epoch": 9.01, "_timestamp": 1734117182, "_runtime": 13956}, "step": 400}
{"train_info/time_between_train_steps": 2.4523239135742188, "step": 400}
{"info/global_step": 401, "train_info/time_within_train_step": 34.626179933547974, "step": 401}
{"train_info/time_between_train_steps": 0.010234594345092773, "step": 401}
{"info/global_step": 402, "train_info/time_within_train_step": 34.16065239906311, "step": 402}
{"train_info/time_between_train_steps": 0.00637054443359375, "step": 402}
{"info/global_step": 403, "train_info/time_within_train_step": 34.476956844329834, "step": 403}
{"train_info/time_between_train_steps": 0.00923013687133789, "step": 403}
{"info/global_step": 404, "train_info/time_within_train_step": 34.258948802948, "step": 404}
{"train_info/time_between_train_steps": 0.013486623764038086, "step": 404}
{"info/global_step": 405, "train_info/time_within_train_step": 34.66417217254639, "step": 405}
{"train_info/time_between_train_steps": 0.007865190505981445, "step": 405}
{"info/global_step": 406, "train_info/time_within_train_step": 34.25385546684265, "step": 406}
{"train_info/time_between_train_steps": 0.010846376419067383, "step": 406}
{"info/global_step": 407, "train_info/time_within_train_step": 34.507702589035034, "step": 407}
{"train_info/time_between_train_steps": 0.008769750595092773, "step": 407}
{"info/global_step": 408, "train_info/time_within_train_step": 34.29817080497742, "step": 408}
{"train_info/time_between_train_steps": 0.010591268539428711, "step": 408}
{"info/global_step": 409, "train_info/time_within_train_step": 34.51061964035034, "step": 409}
{"train_info/time_between_train_steps": 0.015600442886352539, "step": 409}
{"info/global_step": 410, "train_info/time_within_train_step": 34.171226263046265, "step": 410}
{"train_info/time_between_train_steps": 0.0061452388763427734, "step": 410}
{"info/global_step": 411, "train_info/time_within_train_step": 34.23405075073242, "step": 411}
{"train_info/time_between_train_steps": 0.010849714279174805, "step": 411}
{"info/global_step": 412, "train_info/time_within_train_step": 34.18108129501343, "step": 412}
{"train_info/time_between_train_steps": 0.0056302547454833984, "step": 412}
{"info/global_step": 413, "train_info/time_within_train_step": 34.174219608306885, "step": 413}
{"train_info/time_between_train_steps": 0.005770683288574219, "step": 413}
{"info/global_step": 414, "train_info/time_within_train_step": 34.149423599243164, "step": 414}
{"train_info/time_between_train_steps": 0.0062410831451416016, "step": 414}
{"info/global_step": 415, "train_info/time_within_train_step": 34.249091148376465, "step": 415}
{"train_info/time_between_train_steps": 0.0059931278228759766, "step": 415}
{"info/global_step": 416, "train_info/time_within_train_step": 34.3414888381958, "step": 416}
{"train_info/time_between_train_steps": 0.010881423950195312, "step": 416}
{"info/global_step": 417, "train_info/time_within_train_step": 34.23281383514404, "step": 417}
{"train_info/time_between_train_steps": 0.01588916778564453, "step": 417}
{"info/global_step": 418, "train_info/time_within_train_step": 34.25144338607788, "step": 418}
{"train_info/time_between_train_steps": 0.010384321212768555, "step": 418}
{"info/global_step": 419, "train_info/time_within_train_step": 34.2304470539093, "step": 419}
{"train_info/time_between_train_steps": 0.005838632583618164, "step": 419}
{"info/global_step": 420, "train_info/time_within_train_step": 34.27642607688904, "step": 420}
{"train_info/time_between_train_steps": 0.0069963932037353516, "step": 420}
{"info/global_step": 421, "train_info/time_within_train_step": 34.108726978302, "step": 421}
{"train_info/time_between_train_steps": 0.007053852081298828, "step": 421}
{"info/global_step": 422, "train_info/time_within_train_step": 34.29093837738037, "step": 422}
{"train_info/time_between_train_steps": 0.006242036819458008, "step": 422}
{"info/global_step": 423, "train_info/time_within_train_step": 34.12834978103638, "step": 423}
{"train_info/time_between_train_steps": 0.010939359664916992, "step": 423}
{"info/global_step": 424, "train_info/time_within_train_step": 34.26067137718201, "step": 424}
{"train_info/time_between_train_steps": 0.00581669807434082, "step": 424}
{"info/global_step": 425, "train_info/time_within_train_step": 34.05459928512573, "step": 425}
{"train_info/time_between_train_steps": 0.00594782829284668, "step": 425}
{"info/global_step": 426, "train_info/time_within_train_step": 34.236175537109375, "step": 426}
{"train_info/time_between_train_steps": 0.01226949691772461, "step": 426}
{"info/global_step": 427, "train_info/time_within_train_step": 34.16599440574646, "step": 427}
{"train_info/time_between_train_steps": 0.010962724685668945, "step": 427}
{"info/global_step": 428, "train_info/time_within_train_step": 34.19647479057312, "step": 428}
{"train_info/time_between_train_steps": 0.013801336288452148, "step": 428}
{"info/global_step": 429, "train_info/time_within_train_step": 34.21749448776245, "step": 429}
{"train_info/time_between_train_steps": 0.006133556365966797, "step": 429}
{"info/global_step": 430, "train_info/time_within_train_step": 34.17213821411133, "step": 430}
{"train_info/time_between_train_steps": 0.006654262542724609, "step": 430}
{"train_info/time_between_train_steps": 27.047775745391846, "step": 430}
{"info/global_step": 431, "train_info/time_within_train_step": 34.32418870925903, "step": 431}
{"train_info/time_between_train_steps": 0.010808229446411133, "step": 431}
{"info/global_step": 432, "train_info/time_within_train_step": 34.44138836860657, "step": 432}
{"train_info/time_between_train_steps": 0.010810613632202148, "step": 432}
{"info/global_step": 433, "train_info/time_within_train_step": 34.21999001502991, "step": 433}
{"train_info/time_between_train_steps": 0.006345272064208984, "step": 433}
{"info/global_step": 434, "train_info/time_within_train_step": 34.278661012649536, "step": 434}
{"train_info/time_between_train_steps": 0.010560035705566406, "step": 434}
{"info/global_step": 435, "train_info/time_within_train_step": 34.23353290557861, "step": 435}
{"train_info/time_between_train_steps": 0.020226001739501953, "step": 435}
{"info/global_step": 436, "train_info/time_within_train_step": 34.46163034439087, "step": 436}
{"train_info/time_between_train_steps": 0.06933474540710449, "step": 436}
{"info/global_step": 437, "train_info/time_within_train_step": 34.21932411193848, "step": 437}
{"train_info/time_between_train_steps": 0.01134490966796875, "step": 437}
{"info/global_step": 438, "train_info/time_within_train_step": 34.43331289291382, "step": 438}
{"train_info/time_between_train_steps": 0.0062105655670166016, "step": 438}
{"info/global_step": 439, "train_info/time_within_train_step": 34.24573636054993, "step": 439}
{"train_info/time_between_train_steps": 0.012279272079467773, "step": 439}
{"info/global_step": 440, "train_info/time_within_train_step": 34.35757517814636, "step": 440}
{"train_info/time_between_train_steps": 0.006437540054321289, "step": 440}
{"info/global_step": 441, "train_info/time_within_train_step": 34.30779004096985, "step": 441}
{"train_info/time_between_train_steps": 0.006403446197509766, "step": 441}
{"info/global_step": 442, "train_info/time_within_train_step": 34.40252351760864, "step": 442}
{"train_info/time_between_train_steps": 0.006175994873046875, "step": 442}
{"info/global_step": 443, "train_info/time_within_train_step": 34.24928903579712, "step": 443}
{"train_info/time_between_train_steps": 0.006517171859741211, "step": 443}
{"info/global_step": 444, "train_info/time_within_train_step": 34.33958888053894, "step": 444}
{"train_info/time_between_train_steps": 0.006097316741943359, "step": 444}
{"info/global_step": 445, "train_info/time_within_train_step": 34.281001806259155, "step": 445}
{"train_info/time_between_train_steps": 0.01520681381225586, "step": 445}
{"info/global_step": 446, "train_info/time_within_train_step": 34.39946627616882, "step": 446}
{"train_info/time_between_train_steps": 0.011952400207519531, "step": 446}
{"info/global_step": 447, "train_info/time_within_train_step": 34.40530967712402, "step": 447}
{"train_info/time_between_train_steps": 0.006262779235839844, "step": 447}
{"info/global_step": 448, "train_info/time_within_train_step": 34.29689359664917, "step": 448}
{"train_info/time_between_train_steps": 0.007628917694091797, "step": 448}
{"info/global_step": 449, "train_info/time_within_train_step": 34.29534411430359, "step": 449}
{"train_info/time_between_train_steps": 0.010848283767700195, "step": 449}
{"info/global_step": 450, "train_info/time_within_train_step": 34.353333711624146, "step": 450}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1734118927, "_runtime": 15701}, "step": 450}
{"logs": {"train/loss": 2.7458, "train/learning_rate": 0.00041666666666666664, "train/epoch": 10.02, "_timestamp": 1734118927, "_runtime": 15701}, "step": 450}
{"train_info/time_between_train_steps": 0.01526498794555664, "step": 450}
{"info/global_step": 451, "train_info/time_within_train_step": 34.49733090400696, "step": 451}
{"train_info/time_between_train_steps": 0.016574621200561523, "step": 451}
{"info/global_step": 452, "train_info/time_within_train_step": 34.50250697135925, "step": 452}
{"train_info/time_between_train_steps": 0.016497373580932617, "step": 452}
{"info/global_step": 453, "train_info/time_within_train_step": 34.219095945358276, "step": 453}
{"train_info/time_between_train_steps": 0.006143808364868164, "step": 453}
{"info/global_step": 454, "train_info/time_within_train_step": 34.3866400718689, "step": 454}
{"train_info/time_between_train_steps": 0.006653308868408203, "step": 454}
{"info/global_step": 455, "train_info/time_within_train_step": 34.161216735839844, "step": 455}
{"train_info/time_between_train_steps": 0.01116037368774414, "step": 455}
{"info/global_step": 456, "train_info/time_within_train_step": 34.22563099861145, "step": 456}
{"train_info/time_between_train_steps": 0.005871295928955078, "step": 456}
{"info/global_step": 457, "train_info/time_within_train_step": 34.174144983291626, "step": 457}
{"train_info/time_between_train_steps": 0.008954524993896484, "step": 457}
{"info/global_step": 458, "train_info/time_within_train_step": 34.2636399269104, "step": 458}
{"train_info/time_between_train_steps": 0.0059757232666015625, "step": 458}
{"info/global_step": 459, "train_info/time_within_train_step": 34.22693085670471, "step": 459}
{"train_info/time_between_train_steps": 0.00598454475402832, "step": 459}
{"info/global_step": 460, "train_info/time_within_train_step": 34.233824014663696, "step": 460}
{"train_info/time_between_train_steps": 0.009868383407592773, "step": 460}
{"info/global_step": 461, "train_info/time_within_train_step": 34.16066002845764, "step": 461}
{"train_info/time_between_train_steps": 0.009977579116821289, "step": 461}
{"info/global_step": 462, "train_info/time_within_train_step": 34.483423471450806, "step": 462}
{"train_info/time_between_train_steps": 0.005892038345336914, "step": 462}
{"info/global_step": 463, "train_info/time_within_train_step": 34.229106426239014, "step": 463}
{"train_info/time_between_train_steps": 0.011104822158813477, "step": 463}
{"info/global_step": 464, "train_info/time_within_train_step": 34.1636266708374, "step": 464}
{"train_info/time_between_train_steps": 0.010305643081665039, "step": 464}
{"info/global_step": 465, "train_info/time_within_train_step": 34.20463180541992, "step": 465}
{"train_info/time_between_train_steps": 0.010340452194213867, "step": 465}
{"info/global_step": 466, "train_info/time_within_train_step": 34.152164459228516, "step": 466}
{"train_info/time_between_train_steps": 0.0072290897369384766, "step": 466}
{"info/global_step": 467, "train_info/time_within_train_step": 34.271260499954224, "step": 467}
{"train_info/time_between_train_steps": 0.00651240348815918, "step": 467}
{"info/global_step": 468, "train_info/time_within_train_step": 34.16133737564087, "step": 468}
{"train_info/time_between_train_steps": 0.007525444030761719, "step": 468}
{"info/global_step": 469, "train_info/time_within_train_step": 34.18739700317383, "step": 469}
{"train_info/time_between_train_steps": 0.006215572357177734, "step": 469}
{"info/global_step": 470, "train_info/time_within_train_step": 34.29199004173279, "step": 470}
{"train_info/time_between_train_steps": 0.010882854461669922, "step": 470}
{"info/global_step": 471, "train_info/time_within_train_step": 34.20367121696472, "step": 471}
{"train_info/time_between_train_steps": 0.015743732452392578, "step": 471}
{"info/global_step": 472, "train_info/time_within_train_step": 34.27704620361328, "step": 472}
{"train_info/time_between_train_steps": 0.0061643123626708984, "step": 472}
{"info/global_step": 473, "train_info/time_within_train_step": 34.1949622631073, "step": 473}
{"train_info/time_between_train_steps": 0.0075795650482177734, "step": 473}
{"train_info/time_between_train_steps": 27.24807643890381, "step": 473}
{"info/global_step": 474, "train_info/time_within_train_step": 34.344685554504395, "step": 474}
{"train_info/time_between_train_steps": 0.013912677764892578, "step": 474}
{"info/global_step": 475, "train_info/time_within_train_step": 34.40579271316528, "step": 475}
{"train_info/time_between_train_steps": 0.0060656070709228516, "step": 475}
{"info/global_step": 476, "train_info/time_within_train_step": 34.04628324508667, "step": 476}
{"train_info/time_between_train_steps": 0.006333827972412109, "step": 476}
{"info/global_step": 477, "train_info/time_within_train_step": 34.38899779319763, "step": 477}
{"train_info/time_between_train_steps": 0.006237983703613281, "step": 477}
{"info/global_step": 478, "train_info/time_within_train_step": 34.257739305496216, "step": 478}
{"train_info/time_between_train_steps": 0.013155937194824219, "step": 478}
{"info/global_step": 479, "train_info/time_within_train_step": 34.219367027282715, "step": 479}
{"train_info/time_between_train_steps": 0.006004810333251953, "step": 479}
{"info/global_step": 480, "train_info/time_within_train_step": 34.14010047912598, "step": 480}
{"train_info/time_between_train_steps": 0.0057942867279052734, "step": 480}
{"info/global_step": 481, "train_info/time_within_train_step": 34.38756275177002, "step": 481}
{"train_info/time_between_train_steps": 0.010551691055297852, "step": 481}
{"info/global_step": 482, "train_info/time_within_train_step": 34.15002107620239, "step": 482}
{"train_info/time_between_train_steps": 0.006742715835571289, "step": 482}
{"info/global_step": 483, "train_info/time_within_train_step": 34.41441488265991, "step": 483}
{"train_info/time_between_train_steps": 0.007697105407714844, "step": 483}
{"info/global_step": 484, "train_info/time_within_train_step": 34.20892548561096, "step": 484}
{"train_info/time_between_train_steps": 0.013153553009033203, "step": 484}
{"info/global_step": 485, "train_info/time_within_train_step": 34.325063705444336, "step": 485}
{"train_info/time_between_train_steps": 0.01287531852722168, "step": 485}
{"info/global_step": 486, "train_info/time_within_train_step": 34.280336141586304, "step": 486}
{"train_info/time_between_train_steps": 0.01083993911743164, "step": 486}
{"info/global_step": 487, "train_info/time_within_train_step": 34.32875204086304, "step": 487}
{"train_info/time_between_train_steps": 0.01056671142578125, "step": 487}
{"info/global_step": 488, "train_info/time_within_train_step": 34.24668097496033, "step": 488}
{"train_info/time_between_train_steps": 0.010980606079101562, "step": 488}
{"info/global_step": 489, "train_info/time_within_train_step": 34.34947967529297, "step": 489}
{"train_info/time_between_train_steps": 0.012169122695922852, "step": 489}
{"info/global_step": 490, "train_info/time_within_train_step": 34.24467873573303, "step": 490}
{"train_info/time_between_train_steps": 0.010976791381835938, "step": 490}
{"info/global_step": 491, "train_info/time_within_train_step": 34.30964708328247, "step": 491}
{"train_info/time_between_train_steps": 0.006029605865478516, "step": 491}
{"info/global_step": 492, "train_info/time_within_train_step": 34.24773907661438, "step": 492}
{"train_info/time_between_train_steps": 0.008191108703613281, "step": 492}
{"info/global_step": 493, "train_info/time_within_train_step": 34.57613754272461, "step": 493}
{"train_info/time_between_train_steps": 0.011923074722290039, "step": 493}
{"info/global_step": 494, "train_info/time_within_train_step": 34.22636413574219, "step": 494}
{"train_info/time_between_train_steps": 0.0065441131591796875, "step": 494}
{"info/global_step": 495, "train_info/time_within_train_step": 34.3091721534729, "step": 495}
{"train_info/time_between_train_steps": 0.013613224029541016, "step": 495}
{"info/global_step": 496, "train_info/time_within_train_step": 34.09157586097717, "step": 496}
{"train_info/time_between_train_steps": 0.010081052780151367, "step": 496}
{"info/global_step": 497, "train_info/time_within_train_step": 34.220709800720215, "step": 497}
{"train_info/time_between_train_steps": 0.006437540054321289, "step": 497}
{"info/global_step": 498, "train_info/time_within_train_step": 34.2237491607666, "step": 498}
{"train_info/time_between_train_steps": 0.007735013961791992, "step": 498}
{"info/global_step": 499, "train_info/time_within_train_step": 34.12373232841492, "step": 499}
{"train_info/time_between_train_steps": 0.0059032440185546875, "step": 499}
{"info/global_step": 500, "train_info/time_within_train_step": 34.205392599105835, "step": 500}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1734120668, "_runtime": 17442}, "step": 500}
{"logs": {"train/loss": 2.6512, "train/learning_rate": 0.00038888888888888887, "train/epoch": 11.02, "_timestamp": 1734120668, "_runtime": 17442}, "step": 500}
{"train_info/time_between_train_steps": 2.8262345790863037, "step": 500}
{"info/global_step": 501, "train_info/time_within_train_step": 34.13348627090454, "step": 501}
{"train_info/time_between_train_steps": 0.005853176116943359, "step": 501}
{"info/global_step": 502, "train_info/time_within_train_step": 34.15781855583191, "step": 502}
{"train_info/time_between_train_steps": 0.0073244571685791016, "step": 502}
{"info/global_step": 503, "train_info/time_within_train_step": 34.15312385559082, "step": 503}
{"train_info/time_between_train_steps": 0.006014585494995117, "step": 503}
{"info/global_step": 504, "train_info/time_within_train_step": 34.1995153427124, "step": 504}
{"train_info/time_between_train_steps": 0.011486053466796875, "step": 504}
{"info/global_step": 505, "train_info/time_within_train_step": 34.241010904312134, "step": 505}
{"train_info/time_between_train_steps": 0.010224342346191406, "step": 505}
{"info/global_step": 506, "train_info/time_within_train_step": 34.329920053482056, "step": 506}
{"train_info/time_between_train_steps": 0.00638270378112793, "step": 506}
{"info/global_step": 507, "train_info/time_within_train_step": 34.189268827438354, "step": 507}
{"train_info/time_between_train_steps": 0.007884979248046875, "step": 507}
{"info/global_step": 508, "train_info/time_within_train_step": 34.31252384185791, "step": 508}
{"train_info/time_between_train_steps": 0.010063886642456055, "step": 508}
{"info/global_step": 509, "train_info/time_within_train_step": 34.52673387527466, "step": 509}
{"train_info/time_between_train_steps": 0.010354042053222656, "step": 509}
{"info/global_step": 510, "train_info/time_within_train_step": 34.1627357006073, "step": 510}
{"train_info/time_between_train_steps": 0.006110191345214844, "step": 510}
{"info/global_step": 511, "train_info/time_within_train_step": 34.13082718849182, "step": 511}
{"train_info/time_between_train_steps": 0.006104946136474609, "step": 511}
{"info/global_step": 512, "train_info/time_within_train_step": 34.110987424850464, "step": 512}
{"train_info/time_between_train_steps": 0.006043195724487305, "step": 512}
{"info/global_step": 513, "train_info/time_within_train_step": 34.067649364471436, "step": 513}
{"train_info/time_between_train_steps": 0.006325721740722656, "step": 513}
{"info/global_step": 514, "train_info/time_within_train_step": 34.269243001937866, "step": 514}
{"train_info/time_between_train_steps": 0.0060579776763916016, "step": 514}
{"info/global_step": 515, "train_info/time_within_train_step": 34.28069090843201, "step": 515}
{"train_info/time_between_train_steps": 0.006068706512451172, "step": 515}
{"info/global_step": 516, "train_info/time_within_train_step": 34.19450879096985, "step": 516}
{"train_info/time_between_train_steps": 0.0077168941497802734, "step": 516}
{"train_info/time_between_train_steps": 26.782163858413696, "step": 516}
{"info/global_step": 517, "train_info/time_within_train_step": 34.123366594314575, "step": 517}
{"train_info/time_between_train_steps": 0.0063152313232421875, "step": 517}
{"info/global_step": 518, "train_info/time_within_train_step": 34.50156235694885, "step": 518}
{"train_info/time_between_train_steps": 0.006186485290527344, "step": 518}
{"info/global_step": 519, "train_info/time_within_train_step": 34.09600615501404, "step": 519}
{"train_info/time_between_train_steps": 0.005697965621948242, "step": 519}
{"info/global_step": 520, "train_info/time_within_train_step": 34.38106679916382, "step": 520}
{"train_info/time_between_train_steps": 0.011285543441772461, "step": 520}
{"info/global_step": 521, "train_info/time_within_train_step": 34.24753379821777, "step": 521}
{"train_info/time_between_train_steps": 0.011147737503051758, "step": 521}
{"info/global_step": 522, "train_info/time_within_train_step": 34.35384011268616, "step": 522}
{"train_info/time_between_train_steps": 0.006408214569091797, "step": 522}
{"info/global_step": 523, "train_info/time_within_train_step": 34.585439682006836, "step": 523}
{"train_info/time_between_train_steps": 0.010995149612426758, "step": 523}
{"info/global_step": 524, "train_info/time_within_train_step": 34.47183918952942, "step": 524}
{"train_info/time_between_train_steps": 0.009949684143066406, "step": 524}
{"info/global_step": 525, "train_info/time_within_train_step": 34.33820033073425, "step": 525}
{"train_info/time_between_train_steps": 0.010818004608154297, "step": 525}
{"info/global_step": 526, "train_info/time_within_train_step": 34.42714858055115, "step": 526}
{"train_info/time_between_train_steps": 0.0063915252685546875, "step": 526}
{"info/global_step": 527, "train_info/time_within_train_step": 34.22901797294617, "step": 527}
{"train_info/time_between_train_steps": 0.010382890701293945, "step": 527}
{"info/global_step": 528, "train_info/time_within_train_step": 34.48767280578613, "step": 528}
{"train_info/time_between_train_steps": 0.007463693618774414, "step": 528}
{"info/global_step": 529, "train_info/time_within_train_step": 34.044663429260254, "step": 529}
{"train_info/time_between_train_steps": 0.005769491195678711, "step": 529}
{"info/global_step": 530, "train_info/time_within_train_step": 34.36780118942261, "step": 530}
{"train_info/time_between_train_steps": 0.015834569931030273, "step": 530}
{"info/global_step": 531, "train_info/time_within_train_step": 34.264111042022705, "step": 531}
{"train_info/time_between_train_steps": 0.006176471710205078, "step": 531}
{"info/global_step": 532, "train_info/time_within_train_step": 34.391122341156006, "step": 532}
{"train_info/time_between_train_steps": 0.011737346649169922, "step": 532}
{"info/global_step": 533, "train_info/time_within_train_step": 34.11233115196228, "step": 533}
{"train_info/time_between_train_steps": 0.005987882614135742, "step": 533}
{"info/global_step": 534, "train_info/time_within_train_step": 34.39034128189087, "step": 534}
{"train_info/time_between_train_steps": 0.006752967834472656, "step": 534}
{"info/global_step": 535, "train_info/time_within_train_step": 34.38403582572937, "step": 535}
{"train_info/time_between_train_steps": 0.012380838394165039, "step": 535}
{"info/global_step": 536, "train_info/time_within_train_step": 34.41766405105591, "step": 536}
{"train_info/time_between_train_steps": 0.006514072418212891, "step": 536}
{"info/global_step": 537, "train_info/time_within_train_step": 34.193036794662476, "step": 537}
{"train_info/time_between_train_steps": 0.006551265716552734, "step": 537}
{"info/global_step": 538, "train_info/time_within_train_step": 34.406596660614014, "step": 538}
{"train_info/time_between_train_steps": 0.006449699401855469, "step": 538}
{"info/global_step": 539, "train_info/time_within_train_step": 34.47223377227783, "step": 539}
{"train_info/time_between_train_steps": 0.01167607307434082, "step": 539}
{"info/global_step": 540, "train_info/time_within_train_step": 34.38107514381409, "step": 540}
{"train_info/time_between_train_steps": 0.006605625152587891, "step": 540}
{"info/global_step": 541, "train_info/time_within_train_step": 34.21066355705261, "step": 541}
{"train_info/time_between_train_steps": 0.005650043487548828, "step": 541}
{"info/global_step": 542, "train_info/time_within_train_step": 34.18423318862915, "step": 542}
{"train_info/time_between_train_steps": 0.011774063110351562, "step": 542}
{"info/global_step": 543, "train_info/time_within_train_step": 34.14998507499695, "step": 543}
{"train_info/time_between_train_steps": 0.005750417709350586, "step": 543}
{"info/global_step": 544, "train_info/time_within_train_step": 34.18705153465271, "step": 544}
{"train_info/time_between_train_steps": 0.005554676055908203, "step": 544}
{"info/global_step": 545, "train_info/time_within_train_step": 34.18951392173767, "step": 545}
{"train_info/time_between_train_steps": 0.009702682495117188, "step": 545}
{"info/global_step": 546, "train_info/time_within_train_step": 34.227593660354614, "step": 546}
{"train_info/time_between_train_steps": 0.005597591400146484, "step": 546}
{"info/global_step": 547, "train_info/time_within_train_step": 34.23367786407471, "step": 547}
{"train_info/time_between_train_steps": 0.010899782180786133, "step": 547}
{"info/global_step": 548, "train_info/time_within_train_step": 34.23848509788513, "step": 548}
{"train_info/time_between_train_steps": 0.01014256477355957, "step": 548}
{"info/global_step": 549, "train_info/time_within_train_step": 34.067572593688965, "step": 549}
{"train_info/time_between_train_steps": 0.0060977935791015625, "step": 549}
{"info/global_step": 550, "train_info/time_within_train_step": 34.236621618270874, "step": 550}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1734122412, "_runtime": 19186}, "step": 550}
{"logs": {"train/loss": 2.5787, "train/learning_rate": 0.0003611111111111111, "train/epoch": 12.03, "_timestamp": 1734122412, "_runtime": 19186}, "step": 550}
{"train_info/time_between_train_steps": 0.008733272552490234, "step": 550}
{"info/global_step": 551, "train_info/time_within_train_step": 34.10575079917908, "step": 551}
{"train_info/time_between_train_steps": 0.006312131881713867, "step": 551}
{"info/global_step": 552, "train_info/time_within_train_step": 34.211265087127686, "step": 552}
{"train_info/time_between_train_steps": 0.010445594787597656, "step": 552}
{"info/global_step": 553, "train_info/time_within_train_step": 34.29032254219055, "step": 553}
{"train_info/time_between_train_steps": 0.009888410568237305, "step": 553}
{"info/global_step": 554, "train_info/time_within_train_step": 34.19848012924194, "step": 554}
{"train_info/time_between_train_steps": 0.01163625717163086, "step": 554}
{"info/global_step": 555, "train_info/time_within_train_step": 34.438663721084595, "step": 555}
{"train_info/time_between_train_steps": 0.007714748382568359, "step": 555}
{"info/global_step": 556, "train_info/time_within_train_step": 34.23737049102783, "step": 556}
{"train_info/time_between_train_steps": 0.006072282791137695, "step": 556}
{"info/global_step": 557, "train_info/time_within_train_step": 34.1436448097229, "step": 557}
{"train_info/time_between_train_steps": 0.011647701263427734, "step": 557}
{"info/global_step": 558, "train_info/time_within_train_step": 34.16348361968994, "step": 558}
{"train_info/time_between_train_steps": 0.0070912837982177734, "step": 558}
{"info/global_step": 559, "train_info/time_within_train_step": 34.2346134185791, "step": 559}
{"train_info/time_between_train_steps": 0.007664918899536133, "step": 559}
{"train_info/time_between_train_steps": 26.979201078414917, "step": 559}
{"info/global_step": 560, "train_info/time_within_train_step": 34.1945743560791, "step": 560}
{"train_info/time_between_train_steps": 0.011452436447143555, "step": 560}
{"info/global_step": 561, "train_info/time_within_train_step": 34.330769538879395, "step": 561}
{"train_info/time_between_train_steps": 0.006077289581298828, "step": 561}
{"info/global_step": 562, "train_info/time_within_train_step": 34.16594958305359, "step": 562}
{"train_info/time_between_train_steps": 0.006361484527587891, "step": 562}
{"info/global_step": 563, "train_info/time_within_train_step": 34.49603343009949, "step": 563}
{"train_info/time_between_train_steps": 0.005976438522338867, "step": 563}
{"info/global_step": 564, "train_info/time_within_train_step": 34.320971965789795, "step": 564}
{"train_info/time_between_train_steps": 0.01075291633605957, "step": 564}
{"info/global_step": 565, "train_info/time_within_train_step": 34.35452198982239, "step": 565}
{"train_info/time_between_train_steps": 0.006203174591064453, "step": 565}
{"info/global_step": 566, "train_info/time_within_train_step": 34.16516423225403, "step": 566}
{"train_info/time_between_train_steps": 0.006360054016113281, "step": 566}
{"info/global_step": 567, "train_info/time_within_train_step": 34.29964852333069, "step": 567}
{"train_info/time_between_train_steps": 0.011253833770751953, "step": 567}
{"info/global_step": 568, "train_info/time_within_train_step": 34.16741180419922, "step": 568}
{"train_info/time_between_train_steps": 0.0063893795013427734, "step": 568}
{"info/global_step": 569, "train_info/time_within_train_step": 34.222636699676514, "step": 569}
{"train_info/time_between_train_steps": 0.005969047546386719, "step": 569}
{"info/global_step": 570, "train_info/time_within_train_step": 34.37155842781067, "step": 570}
{"train_info/time_between_train_steps": 0.0059626102447509766, "step": 570}
{"info/global_step": 571, "train_info/time_within_train_step": 34.39998984336853, "step": 571}
{"train_info/time_between_train_steps": 0.009223699569702148, "step": 571}
{"info/global_step": 572, "train_info/time_within_train_step": 34.367640018463135, "step": 572}
{"train_info/time_between_train_steps": 0.006201267242431641, "step": 572}
{"info/global_step": 573, "train_info/time_within_train_step": 34.29179334640503, "step": 573}
{"train_info/time_between_train_steps": 0.00635218620300293, "step": 573}
{"info/global_step": 574, "train_info/time_within_train_step": 34.10859966278076, "step": 574}
{"train_info/time_between_train_steps": 0.01078486442565918, "step": 574}
{"info/global_step": 575, "train_info/time_within_train_step": 34.37936520576477, "step": 575}
{"train_info/time_between_train_steps": 0.006371974945068359, "step": 575}
{"info/global_step": 576, "train_info/time_within_train_step": 34.09063196182251, "step": 576}
{"train_info/time_between_train_steps": 0.010857343673706055, "step": 576}
{"info/global_step": 577, "train_info/time_within_train_step": 34.434752225875854, "step": 577}
{"train_info/time_between_train_steps": 0.01427006721496582, "step": 577}
{"info/global_step": 578, "train_info/time_within_train_step": 34.215601205825806, "step": 578}
{"train_info/time_between_train_steps": 0.006392002105712891, "step": 578}
{"info/global_step": 579, "train_info/time_within_train_step": 34.762551069259644, "step": 579}
{"train_info/time_between_train_steps": 0.007610321044921875, "step": 579}
{"info/global_step": 580, "train_info/time_within_train_step": 34.20205879211426, "step": 580}
{"train_info/time_between_train_steps": 0.01157832145690918, "step": 580}
{"info/global_step": 581, "train_info/time_within_train_step": 34.30084705352783, "step": 581}
{"train_info/time_between_train_steps": 0.011019229888916016, "step": 581}
{"info/global_step": 582, "train_info/time_within_train_step": 34.123886823654175, "step": 582}
{"train_info/time_between_train_steps": 0.005980968475341797, "step": 582}
{"info/global_step": 583, "train_info/time_within_train_step": 34.32522249221802, "step": 583}
{"train_info/time_between_train_steps": 0.011547565460205078, "step": 583}
{"info/global_step": 584, "train_info/time_within_train_step": 34.191811323165894, "step": 584}
{"train_info/time_between_train_steps": 0.011011123657226562, "step": 584}
{"info/global_step": 585, "train_info/time_within_train_step": 34.28777813911438, "step": 585}
{"train_info/time_between_train_steps": 0.01105642318725586, "step": 585}
{"info/global_step": 586, "train_info/time_within_train_step": 34.13783264160156, "step": 586}
{"train_info/time_between_train_steps": 0.005866527557373047, "step": 586}
{"info/global_step": 587, "train_info/time_within_train_step": 34.19473481178284, "step": 587}
{"train_info/time_between_train_steps": 0.0061571598052978516, "step": 587}
{"info/global_step": 588, "train_info/time_within_train_step": 34.22091460227966, "step": 588}
{"train_info/time_between_train_steps": 0.010542869567871094, "step": 588}
{"info/global_step": 589, "train_info/time_within_train_step": 34.22307872772217, "step": 589}
{"train_info/time_between_train_steps": 0.012009143829345703, "step": 589}
{"info/global_step": 590, "train_info/time_within_train_step": 34.251447677612305, "step": 590}
{"train_info/time_between_train_steps": 0.010296344757080078, "step": 590}
{"info/global_step": 591, "train_info/time_within_train_step": 34.23908352851868, "step": 591}
{"train_info/time_between_train_steps": 0.009996891021728516, "step": 591}
{"info/global_step": 592, "train_info/time_within_train_step": 34.216540575027466, "step": 592}
{"train_info/time_between_train_steps": 0.005852460861206055, "step": 592}
{"info/global_step": 593, "train_info/time_within_train_step": 34.260990619659424, "step": 593}
{"train_info/time_between_train_steps": 0.0057408809661865234, "step": 593}
{"info/global_step": 594, "train_info/time_within_train_step": 34.23512649536133, "step": 594}
{"train_info/time_between_train_steps": 0.006647586822509766, "step": 594}
{"info/global_step": 595, "train_info/time_within_train_step": 34.245572566986084, "step": 595}
{"train_info/time_between_train_steps": 0.005985736846923828, "step": 595}
{"info/global_step": 596, "train_info/time_within_train_step": 34.09879517555237, "step": 596}
{"train_info/time_between_train_steps": 0.006368160247802734, "step": 596}
{"info/global_step": 597, "train_info/time_within_train_step": 34.1888370513916, "step": 597}
{"train_info/time_between_train_steps": 0.005989789962768555, "step": 597}
{"info/global_step": 598, "train_info/time_within_train_step": 34.2636284828186, "step": 598}
{"train_info/time_between_train_steps": 0.008176326751708984, "step": 598}
{"info/global_step": 599, "train_info/time_within_train_step": 34.147268772125244, "step": 599}
{"train_info/time_between_train_steps": 0.005901336669921875, "step": 599}
{"info/global_step": 600, "train_info/time_within_train_step": 34.19427824020386, "step": 600}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1734124152, "_runtime": 20926}, "step": 600}
{"logs": {"train/loss": 2.5183, "train/learning_rate": 0.0003333333333333333, "train/epoch": 13.03, "_timestamp": 1734124152, "_runtime": 20926}, "step": 600}
{"train_info/time_between_train_steps": 2.410991668701172, "step": 600}
{"info/global_step": 601, "train_info/time_within_train_step": 34.45214080810547, "step": 601}
{"train_info/time_between_train_steps": 0.010038375854492188, "step": 601}
{"info/global_step": 602, "train_info/time_within_train_step": 34.1722731590271, "step": 602}
{"train_info/time_between_train_steps": 0.0073392391204833984, "step": 602}
{"train_info/time_between_train_steps": 27.016155004501343, "step": 602}
{"info/global_step": 603, "train_info/time_within_train_step": 34.211443185806274, "step": 603}
{"train_info/time_between_train_steps": 0.01267552375793457, "step": 603}
{"info/global_step": 604, "train_info/time_within_train_step": 34.47349238395691, "step": 604}
{"train_info/time_between_train_steps": 0.012946128845214844, "step": 604}
{"info/global_step": 605, "train_info/time_within_train_step": 34.202571868896484, "step": 605}
{"train_info/time_between_train_steps": 0.006869316101074219, "step": 605}
{"info/global_step": 606, "train_info/time_within_train_step": 34.32958626747131, "step": 606}
{"train_info/time_between_train_steps": 0.006060361862182617, "step": 606}
{"info/global_step": 607, "train_info/time_within_train_step": 34.2087345123291, "step": 607}
{"train_info/time_between_train_steps": 0.010020732879638672, "step": 607}
{"info/global_step": 608, "train_info/time_within_train_step": 34.40166711807251, "step": 608}
{"train_info/time_between_train_steps": 0.009186267852783203, "step": 608}
{"info/global_step": 609, "train_info/time_within_train_step": 34.27941370010376, "step": 609}
{"train_info/time_between_train_steps": 0.006552457809448242, "step": 609}
{"info/global_step": 610, "train_info/time_within_train_step": 34.60459876060486, "step": 610}
{"train_info/time_between_train_steps": 0.011588811874389648, "step": 610}
{"info/global_step": 611, "train_info/time_within_train_step": 34.187989234924316, "step": 611}
{"train_info/time_between_train_steps": 0.0056972503662109375, "step": 611}
{"info/global_step": 612, "train_info/time_within_train_step": 34.332491397857666, "step": 612}
{"train_info/time_between_train_steps": 0.008686065673828125, "step": 612}
{"info/global_step": 613, "train_info/time_within_train_step": 34.07234311103821, "step": 613}
{"train_info/time_between_train_steps": 0.011177778244018555, "step": 613}
{"info/global_step": 614, "train_info/time_within_train_step": 34.47253060340881, "step": 614}
{"train_info/time_between_train_steps": 0.010777473449707031, "step": 614}
{"info/global_step": 615, "train_info/time_within_train_step": 34.3013391494751, "step": 615}
{"train_info/time_between_train_steps": 0.007159709930419922, "step": 615}
{"info/global_step": 616, "train_info/time_within_train_step": 34.59434700012207, "step": 616}
{"train_info/time_between_train_steps": 0.006238698959350586, "step": 616}
{"info/global_step": 617, "train_info/time_within_train_step": 34.22197151184082, "step": 617}
{"train_info/time_between_train_steps": 0.006598949432373047, "step": 617}
{"info/global_step": 618, "train_info/time_within_train_step": 34.4439001083374, "step": 618}
{"train_info/time_between_train_steps": 0.006067752838134766, "step": 618}
{"info/global_step": 619, "train_info/time_within_train_step": 34.22411918640137, "step": 619}
{"train_info/time_between_train_steps": 0.0106658935546875, "step": 619}
{"info/global_step": 620, "train_info/time_within_train_step": 34.498749017715454, "step": 620}
{"train_info/time_between_train_steps": 0.006356000900268555, "step": 620}
{"info/global_step": 621, "train_info/time_within_train_step": 34.1224946975708, "step": 621}
{"train_info/time_between_train_steps": 0.0061686038970947266, "step": 621}
{"info/global_step": 622, "train_info/time_within_train_step": 34.32889246940613, "step": 622}
{"train_info/time_between_train_steps": 0.006578922271728516, "step": 622}
{"info/global_step": 623, "train_info/time_within_train_step": 34.18461275100708, "step": 623}
{"train_info/time_between_train_steps": 0.011579036712646484, "step": 623}
{"info/global_step": 624, "train_info/time_within_train_step": 34.30294752120972, "step": 624}
{"train_info/time_between_train_steps": 0.006043910980224609, "step": 624}
{"info/global_step": 625, "train_info/time_within_train_step": 34.332919120788574, "step": 625}
{"train_info/time_between_train_steps": 0.009385108947753906, "step": 625}
{"info/global_step": 626, "train_info/time_within_train_step": 34.33837032318115, "step": 626}
{"train_info/time_between_train_steps": 0.005861043930053711, "step": 626}
{"info/global_step": 627, "train_info/time_within_train_step": 34.11247396469116, "step": 627}
{"train_info/time_between_train_steps": 0.006200313568115234, "step": 627}
{"info/global_step": 628, "train_info/time_within_train_step": 34.23291039466858, "step": 628}
{"train_info/time_between_train_steps": 0.005709171295166016, "step": 628}
{"info/global_step": 629, "train_info/time_within_train_step": 34.23595571517944, "step": 629}
{"train_info/time_between_train_steps": 0.010694265365600586, "step": 629}
{"info/global_step": 630, "train_info/time_within_train_step": 34.299155473709106, "step": 630}
{"train_info/time_between_train_steps": 0.009867191314697266, "step": 630}
{"info/global_step": 631, "train_info/time_within_train_step": 34.463056564331055, "step": 631}
{"train_info/time_between_train_steps": 0.011285543441772461, "step": 631}
{"info/global_step": 632, "train_info/time_within_train_step": 34.29862713813782, "step": 632}
{"train_info/time_between_train_steps": 0.015664100646972656, "step": 632}
{"info/global_step": 633, "train_info/time_within_train_step": 34.24197793006897, "step": 633}
{"train_info/time_between_train_steps": 0.009713411331176758, "step": 633}
{"info/global_step": 634, "train_info/time_within_train_step": 34.14134502410889, "step": 634}
{"train_info/time_between_train_steps": 0.010865211486816406, "step": 634}
{"info/global_step": 635, "train_info/time_within_train_step": 34.21484017372131, "step": 635}
{"train_info/time_between_train_steps": 0.015671491622924805, "step": 635}
{"info/global_step": 636, "train_info/time_within_train_step": 34.14619278907776, "step": 636}
{"train_info/time_between_train_steps": 0.005945920944213867, "step": 636}
{"info/global_step": 637, "train_info/time_within_train_step": 34.23399209976196, "step": 637}
{"train_info/time_between_train_steps": 0.015492439270019531, "step": 637}
{"info/global_step": 638, "train_info/time_within_train_step": 34.27874803543091, "step": 638}
{"train_info/time_between_train_steps": 0.009197711944580078, "step": 638}
{"info/global_step": 639, "train_info/time_within_train_step": 34.221864461898804, "step": 639}
{"train_info/time_between_train_steps": 0.01055908203125, "step": 639}
{"info/global_step": 640, "train_info/time_within_train_step": 34.32451367378235, "step": 640}
{"train_info/time_between_train_steps": 0.0063893795013427734, "step": 640}
{"info/global_step": 641, "train_info/time_within_train_step": 34.170631885528564, "step": 641}
{"train_info/time_between_train_steps": 0.0086212158203125, "step": 641}
{"info/global_step": 642, "train_info/time_within_train_step": 34.23087978363037, "step": 642}
{"train_info/time_between_train_steps": 0.010470867156982422, "step": 642}
{"info/global_step": 643, "train_info/time_within_train_step": 34.19042491912842, "step": 643}
{"train_info/time_between_train_steps": 0.016283512115478516, "step": 643}
{"info/global_step": 644, "train_info/time_within_train_step": 34.26100039482117, "step": 644}
{"train_info/time_between_train_steps": 0.005955934524536133, "step": 644}
{"info/global_step": 645, "train_info/time_within_train_step": 34.232067823410034, "step": 645}
{"train_info/time_between_train_steps": 0.013375997543334961, "step": 645}
{"train_info/time_between_train_steps": 26.67436957359314, "step": 645}
{"info/global_step": 646, "train_info/time_within_train_step": 34.476083517074585, "step": 646}
{"train_info/time_between_train_steps": 0.010116815567016602, "step": 646}
{"info/global_step": 647, "train_info/time_within_train_step": 34.27228093147278, "step": 647}
{"train_info/time_between_train_steps": 0.006240367889404297, "step": 647}
{"info/global_step": 648, "train_info/time_within_train_step": 34.20404601097107, "step": 648}
{"train_info/time_between_train_steps": 0.006073474884033203, "step": 648}
{"info/global_step": 649, "train_info/time_within_train_step": 34.4606249332428, "step": 649}
{"train_info/time_between_train_steps": 0.01099538803100586, "step": 649}
{"info/global_step": 650, "train_info/time_within_train_step": 34.34700036048889, "step": 650}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1734125923, "_runtime": 22697}, "step": 650}
{"logs": {"train/loss": 2.4963, "train/learning_rate": 0.00030555555555555555, "train/epoch": 15.0, "_timestamp": 1734125923, "_runtime": 22697}, "step": 650}
{"train_info/time_between_train_steps": 0.014605045318603516, "step": 650}
{"info/global_step": 651, "train_info/time_within_train_step": 34.40733003616333, "step": 651}
{"train_info/time_between_train_steps": 0.011921167373657227, "step": 651}
{"info/global_step": 652, "train_info/time_within_train_step": 34.22405433654785, "step": 652}
{"train_info/time_between_train_steps": 0.0163116455078125, "step": 652}
{"info/global_step": 653, "train_info/time_within_train_step": 34.325711488723755, "step": 653}
{"train_info/time_between_train_steps": 0.00589299201965332, "step": 653}
{"info/global_step": 654, "train_info/time_within_train_step": 34.24138832092285, "step": 654}
{"train_info/time_between_train_steps": 0.011607170104980469, "step": 654}
{"info/global_step": 655, "train_info/time_within_train_step": 34.389145851135254, "step": 655}
{"train_info/time_between_train_steps": 0.00579071044921875, "step": 655}
{"info/global_step": 656, "train_info/time_within_train_step": 34.27243900299072, "step": 656}
{"train_info/time_between_train_steps": 0.012445449829101562, "step": 656}
{"info/global_step": 657, "train_info/time_within_train_step": 34.559133768081665, "step": 657}
{"train_info/time_between_train_steps": 0.008907318115234375, "step": 657}
{"info/global_step": 658, "train_info/time_within_train_step": 34.212080001831055, "step": 658}
{"train_info/time_between_train_steps": 0.006635427474975586, "step": 658}
{"info/global_step": 659, "train_info/time_within_train_step": 34.48903727531433, "step": 659}
{"train_info/time_between_train_steps": 0.01118779182434082, "step": 659}
{"info/global_step": 660, "train_info/time_within_train_step": 34.200114250183105, "step": 660}
{"train_info/time_between_train_steps": 0.00632929801940918, "step": 660}
{"info/global_step": 661, "train_info/time_within_train_step": 34.41797375679016, "step": 661}
{"train_info/time_between_train_steps": 0.011449337005615234, "step": 661}
{"info/global_step": 662, "train_info/time_within_train_step": 34.46434760093689, "step": 662}
{"train_info/time_between_train_steps": 0.006333112716674805, "step": 662}
{"info/global_step": 663, "train_info/time_within_train_step": 34.38517236709595, "step": 663}
{"train_info/time_between_train_steps": 0.010591268539428711, "step": 663}
{"info/global_step": 664, "train_info/time_within_train_step": 34.34353017807007, "step": 664}
{"train_info/time_between_train_steps": 0.00700068473815918, "step": 664}
{"info/global_step": 665, "train_info/time_within_train_step": 34.33009386062622, "step": 665}
{"train_info/time_between_train_steps": 0.008783340454101562, "step": 665}
{"info/global_step": 666, "train_info/time_within_train_step": 34.269628047943115, "step": 666}
{"train_info/time_between_train_steps": 0.011234045028686523, "step": 666}
{"info/global_step": 667, "train_info/time_within_train_step": 34.341816902160645, "step": 667}
{"train_info/time_between_train_steps": 0.006571769714355469, "step": 667}
{"info/global_step": 668, "train_info/time_within_train_step": 34.18894362449646, "step": 668}
{"train_info/time_between_train_steps": 0.006649017333984375, "step": 668}
{"info/global_step": 669, "train_info/time_within_train_step": 34.44625234603882, "step": 669}
{"train_info/time_between_train_steps": 0.006437778472900391, "step": 669}
{"info/global_step": 670, "train_info/time_within_train_step": 34.20540189743042, "step": 670}
{"train_info/time_between_train_steps": 0.007020235061645508, "step": 670}
{"info/global_step": 671, "train_info/time_within_train_step": 34.21165895462036, "step": 671}
{"train_info/time_between_train_steps": 0.010433435440063477, "step": 671}
{"info/global_step": 672, "train_info/time_within_train_step": 34.18183255195618, "step": 672}
{"train_info/time_between_train_steps": 0.0058135986328125, "step": 672}
{"info/global_step": 673, "train_info/time_within_train_step": 34.091641426086426, "step": 673}
{"train_info/time_between_train_steps": 0.010380029678344727, "step": 673}
{"info/global_step": 674, "train_info/time_within_train_step": 34.1546676158905, "step": 674}
{"train_info/time_between_train_steps": 0.006047725677490234, "step": 674}
{"info/global_step": 675, "train_info/time_within_train_step": 34.24254083633423, "step": 675}
{"train_info/time_between_train_steps": 0.012566804885864258, "step": 675}
{"info/global_step": 676, "train_info/time_within_train_step": 34.19473314285278, "step": 676}
{"train_info/time_between_train_steps": 0.007631063461303711, "step": 676}
{"info/global_step": 677, "train_info/time_within_train_step": 34.17925524711609, "step": 677}
{"train_info/time_between_train_steps": 0.01008152961730957, "step": 677}
{"info/global_step": 678, "train_info/time_within_train_step": 34.4884819984436, "step": 678}
{"train_info/time_between_train_steps": 0.005693197250366211, "step": 678}
{"info/global_step": 679, "train_info/time_within_train_step": 34.13639259338379, "step": 679}
{"train_info/time_between_train_steps": 0.010138273239135742, "step": 679}
{"info/global_step": 680, "train_info/time_within_train_step": 34.282939195632935, "step": 680}
{"train_info/time_between_train_steps": 0.010431051254272461, "step": 680}
{"info/global_step": 681, "train_info/time_within_train_step": 34.126723766326904, "step": 681}
{"train_info/time_between_train_steps": 0.0061187744140625, "step": 681}
{"info/global_step": 682, "train_info/time_within_train_step": 34.19358158111572, "step": 682}
{"train_info/time_between_train_steps": 0.005982160568237305, "step": 682}
{"info/global_step": 683, "train_info/time_within_train_step": 34.16616153717041, "step": 683}
{"train_info/time_between_train_steps": 0.01063084602355957, "step": 683}
{"info/global_step": 684, "train_info/time_within_train_step": 34.10023736953735, "step": 684}
{"train_info/time_between_train_steps": 0.010918855667114258, "step": 684}
{"info/global_step": 685, "train_info/time_within_train_step": 34.20217990875244, "step": 685}
{"train_info/time_between_train_steps": 0.015535593032836914, "step": 685}
{"info/global_step": 686, "train_info/time_within_train_step": 34.311694383621216, "step": 686}
{"train_info/time_between_train_steps": 0.010679960250854492, "step": 686}
{"info/global_step": 687, "train_info/time_within_train_step": 34.20346665382385, "step": 687}
{"train_info/time_between_train_steps": 0.013245344161987305, "step": 687}
{"info/global_step": 688, "train_info/time_within_train_step": 34.18217206001282, "step": 688}
{"train_info/time_between_train_steps": 0.008412361145019531, "step": 688}
{"train_info/time_between_train_steps": 27.57362961769104, "step": 688}
{"info/global_step": 689, "train_info/time_within_train_step": 34.19999694824219, "step": 689}
{"train_info/time_between_train_steps": 0.010832548141479492, "step": 689}
{"info/global_step": 690, "train_info/time_within_train_step": 34.45268988609314, "step": 690}
{"train_info/time_between_train_steps": 0.0107879638671875, "step": 690}
{"info/global_step": 691, "train_info/time_within_train_step": 34.2022168636322, "step": 691}
{"train_info/time_between_train_steps": 0.006982564926147461, "step": 691}
{"info/global_step": 692, "train_info/time_within_train_step": 34.394468784332275, "step": 692}
{"train_info/time_between_train_steps": 0.00594019889831543, "step": 692}
{"info/global_step": 693, "train_info/time_within_train_step": 34.26473641395569, "step": 693}
{"train_info/time_between_train_steps": 0.006178855895996094, "step": 693}
{"info/global_step": 694, "train_info/time_within_train_step": 34.226980447769165, "step": 694}
{"train_info/time_between_train_steps": 0.005829572677612305, "step": 694}
{"info/global_step": 695, "train_info/time_within_train_step": 34.24020957946777, "step": 695}
{"train_info/time_between_train_steps": 0.006352901458740234, "step": 695}
{"info/global_step": 696, "train_info/time_within_train_step": 34.38693904876709, "step": 696}
{"train_info/time_between_train_steps": 0.011593818664550781, "step": 696}
{"info/global_step": 697, "train_info/time_within_train_step": 34.29769468307495, "step": 697}
{"train_info/time_between_train_steps": 0.01846623420715332, "step": 697}
{"info/global_step": 698, "train_info/time_within_train_step": 34.60488772392273, "step": 698}
{"train_info/time_between_train_steps": 0.009331703186035156, "step": 698}
{"info/global_step": 699, "train_info/time_within_train_step": 34.14362120628357, "step": 699}
{"train_info/time_between_train_steps": 0.007738351821899414, "step": 699}
{"info/global_step": 700, "train_info/time_within_train_step": 34.428515911102295, "step": 700}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1734127665, "_runtime": 24439}, "step": 700}
{"logs": {"train/loss": 2.4139, "train/learning_rate": 0.0002777777777777778, "train/epoch": 16.01, "_timestamp": 1734127665, "_runtime": 24439}, "step": 700}
{"train_info/time_between_train_steps": 2.6592745780944824, "step": 700}
{"info/global_step": 701, "train_info/time_within_train_step": 34.08342957496643, "step": 701}
{"train_info/time_between_train_steps": 0.005723237991333008, "step": 701}
{"info/global_step": 702, "train_info/time_within_train_step": 34.31847023963928, "step": 702}
{"train_info/time_between_train_steps": 0.008723735809326172, "step": 702}
{"info/global_step": 703, "train_info/time_within_train_step": 34.10503935813904, "step": 703}
{"train_info/time_between_train_steps": 0.006079912185668945, "step": 703}
{"info/global_step": 704, "train_info/time_within_train_step": 34.40651082992554, "step": 704}
{"train_info/time_between_train_steps": 0.010900020599365234, "step": 704}
{"info/global_step": 705, "train_info/time_within_train_step": 34.167985916137695, "step": 705}
{"train_info/time_between_train_steps": 0.006066322326660156, "step": 705}
{"info/global_step": 706, "train_info/time_within_train_step": 34.44643998146057, "step": 706}
{"train_info/time_between_train_steps": 0.006430387496948242, "step": 706}
{"info/global_step": 707, "train_info/time_within_train_step": 34.23090362548828, "step": 707}
{"train_info/time_between_train_steps": 0.012081623077392578, "step": 707}
{"info/global_step": 708, "train_info/time_within_train_step": 34.66315293312073, "step": 708}
{"train_info/time_between_train_steps": 0.013121843338012695, "step": 708}
{"info/global_step": 709, "train_info/time_within_train_step": 34.18839693069458, "step": 709}
{"train_info/time_between_train_steps": 0.006483793258666992, "step": 709}
{"info/global_step": 710, "train_info/time_within_train_step": 34.464866399765015, "step": 710}
{"train_info/time_between_train_steps": 0.011763334274291992, "step": 710}
{"info/global_step": 711, "train_info/time_within_train_step": 34.20823931694031, "step": 711}
{"train_info/time_between_train_steps": 0.006468772888183594, "step": 711}
{"info/global_step": 712, "train_info/time_within_train_step": 34.330848932266235, "step": 712}
{"train_info/time_between_train_steps": 0.007187843322753906, "step": 712}
{"info/global_step": 713, "train_info/time_within_train_step": 34.19878029823303, "step": 713}
{"train_info/time_between_train_steps": 0.00973963737487793, "step": 713}
{"info/global_step": 714, "train_info/time_within_train_step": 34.23953461647034, "step": 714}
{"train_info/time_between_train_steps": 0.014587879180908203, "step": 714}
{"info/global_step": 715, "train_info/time_within_train_step": 34.1798095703125, "step": 715}
{"train_info/time_between_train_steps": 0.010672330856323242, "step": 715}
{"info/global_step": 716, "train_info/time_within_train_step": 34.17530083656311, "step": 716}
{"train_info/time_between_train_steps": 0.007414579391479492, "step": 716}
{"info/global_step": 717, "train_info/time_within_train_step": 34.28413963317871, "step": 717}
{"train_info/time_between_train_steps": 0.006445646286010742, "step": 717}
{"info/global_step": 718, "train_info/time_within_train_step": 34.21936345100403, "step": 718}
{"train_info/time_between_train_steps": 0.010311365127563477, "step": 718}
{"info/global_step": 719, "train_info/time_within_train_step": 34.19775366783142, "step": 719}
{"train_info/time_between_train_steps": 0.005843639373779297, "step": 719}
{"info/global_step": 720, "train_info/time_within_train_step": 34.23750042915344, "step": 720}
{"train_info/time_between_train_steps": 0.010125160217285156, "step": 720}
{"info/global_step": 721, "train_info/time_within_train_step": 34.214197397232056, "step": 721}
{"train_info/time_between_train_steps": 0.005883693695068359, "step": 721}
{"info/global_step": 722, "train_info/time_within_train_step": 34.35849595069885, "step": 722}
{"train_info/time_between_train_steps": 0.0063991546630859375, "step": 722}
{"info/global_step": 723, "train_info/time_within_train_step": 34.287846088409424, "step": 723}
{"train_info/time_between_train_steps": 0.005867958068847656, "step": 723}
{"info/global_step": 724, "train_info/time_within_train_step": 34.59677171707153, "step": 724}
{"train_info/time_between_train_steps": 0.01580810546875, "step": 724}
{"info/global_step": 725, "train_info/time_within_train_step": 34.15483593940735, "step": 725}
{"train_info/time_between_train_steps": 0.010394573211669922, "step": 725}
{"info/global_step": 726, "train_info/time_within_train_step": 34.272162437438965, "step": 726}
{"train_info/time_between_train_steps": 0.010439634323120117, "step": 726}
{"info/global_step": 727, "train_info/time_within_train_step": 34.25228953361511, "step": 727}
{"train_info/time_between_train_steps": 0.01141810417175293, "step": 727}
{"info/global_step": 728, "train_info/time_within_train_step": 34.25061321258545, "step": 728}
{"train_info/time_between_train_steps": 0.006102800369262695, "step": 728}
{"info/global_step": 729, "train_info/time_within_train_step": 34.12670302391052, "step": 729}
{"train_info/time_between_train_steps": 0.010730981826782227, "step": 729}
{"info/global_step": 730, "train_info/time_within_train_step": 34.209110498428345, "step": 730}
{"train_info/time_between_train_steps": 0.01577448844909668, "step": 730}
{"info/global_step": 731, "train_info/time_within_train_step": 34.27708601951599, "step": 731}
{"train_info/time_between_train_steps": 0.009015560150146484, "step": 731}
{"train_info/time_between_train_steps": 27.272676706314087, "step": 731}
{"info/global_step": 732, "train_info/time_within_train_step": 34.221521854400635, "step": 732}
{"train_info/time_between_train_steps": 0.005673646926879883, "step": 732}
{"info/global_step": 733, "train_info/time_within_train_step": 34.383155822753906, "step": 733}
{"train_info/time_between_train_steps": 0.0071489810943603516, "step": 733}
{"info/global_step": 734, "train_info/time_within_train_step": 34.25922513008118, "step": 734}
{"train_info/time_between_train_steps": 0.015819787979125977, "step": 734}
{"info/global_step": 735, "train_info/time_within_train_step": 34.568907022476196, "step": 735}
{"train_info/time_between_train_steps": 0.005930185317993164, "step": 735}
{"info/global_step": 736, "train_info/time_within_train_step": 34.1910502910614, "step": 736}
{"train_info/time_between_train_steps": 0.00634455680847168, "step": 736}
{"info/global_step": 737, "train_info/time_within_train_step": 34.45810580253601, "step": 737}
{"train_info/time_between_train_steps": 0.01051187515258789, "step": 737}
{"info/global_step": 738, "train_info/time_within_train_step": 34.31580972671509, "step": 738}
{"train_info/time_between_train_steps": 0.006318330764770508, "step": 738}
{"info/global_step": 739, "train_info/time_within_train_step": 34.65700936317444, "step": 739}
{"train_info/time_between_train_steps": 0.0060002803802490234, "step": 739}
{"info/global_step": 740, "train_info/time_within_train_step": 34.198912620544434, "step": 740}
{"train_info/time_between_train_steps": 0.01016855239868164, "step": 740}
{"info/global_step": 741, "train_info/time_within_train_step": 34.392078161239624, "step": 741}
{"train_info/time_between_train_steps": 0.0066831111907958984, "step": 741}
{"info/global_step": 742, "train_info/time_within_train_step": 34.24319124221802, "step": 742}
{"train_info/time_between_train_steps": 0.006432771682739258, "step": 742}
{"info/global_step": 743, "train_info/time_within_train_step": 34.442819118499756, "step": 743}
{"train_info/time_between_train_steps": 0.0100555419921875, "step": 743}
{"info/global_step": 744, "train_info/time_within_train_step": 34.37176179885864, "step": 744}
{"train_info/time_between_train_steps": 0.012260913848876953, "step": 744}
{"info/global_step": 745, "train_info/time_within_train_step": 34.35140609741211, "step": 745}
{"train_info/time_between_train_steps": 0.006131410598754883, "step": 745}
{"info/global_step": 746, "train_info/time_within_train_step": 34.31276559829712, "step": 746}
{"train_info/time_between_train_steps": 0.017642498016357422, "step": 746}
{"info/global_step": 747, "train_info/time_within_train_step": 34.518542766571045, "step": 747}
{"train_info/time_between_train_steps": 0.011099815368652344, "step": 747}
{"info/global_step": 748, "train_info/time_within_train_step": 34.262826681137085, "step": 748}
{"train_info/time_between_train_steps": 0.010853052139282227, "step": 748}
{"info/global_step": 749, "train_info/time_within_train_step": 34.43430495262146, "step": 749}
{"train_info/time_between_train_steps": 0.006082773208618164, "step": 749}
{"info/global_step": 750, "train_info/time_within_train_step": 34.178693771362305, "step": 750}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1734129411, "_runtime": 26185}, "step": 750}
{"logs": {"train/loss": 2.3755, "train/learning_rate": 0.00025, "train/epoch": 17.02, "_timestamp": 1734129411, "_runtime": 26185}, "step": 750}
{"train_info/time_between_train_steps": 0.013538360595703125, "step": 750}
{"info/global_step": 751, "train_info/time_within_train_step": 34.44726920127869, "step": 751}
{"train_info/time_between_train_steps": 0.010918855667114258, "step": 751}
{"info/global_step": 752, "train_info/time_within_train_step": 34.2265350818634, "step": 752}
{"train_info/time_between_train_steps": 0.006357908248901367, "step": 752}
{"info/global_step": 753, "train_info/time_within_train_step": 34.5440399646759, "step": 753}
{"train_info/time_between_train_steps": 0.016896724700927734, "step": 753}
{"info/global_step": 754, "train_info/time_within_train_step": 34.43767738342285, "step": 754}
{"train_info/time_between_train_steps": 0.009647369384765625, "step": 754}
{"info/global_step": 755, "train_info/time_within_train_step": 34.335477352142334, "step": 755}
{"train_info/time_between_train_steps": 0.0064733028411865234, "step": 755}
{"info/global_step": 756, "train_info/time_within_train_step": 34.26743960380554, "step": 756}
{"train_info/time_between_train_steps": 0.005986213684082031, "step": 756}
{"info/global_step": 757, "train_info/time_within_train_step": 34.332616090774536, "step": 757}
{"train_info/time_between_train_steps": 0.016659259796142578, "step": 757}
{"info/global_step": 758, "train_info/time_within_train_step": 34.23478293418884, "step": 758}
{"train_info/time_between_train_steps": 0.006974697113037109, "step": 758}
{"info/global_step": 759, "train_info/time_within_train_step": 34.1808602809906, "step": 759}
{"train_info/time_between_train_steps": 0.010489463806152344, "step": 759}
{"info/global_step": 760, "train_info/time_within_train_step": 34.252479553222656, "step": 760}
{"train_info/time_between_train_steps": 0.006763935089111328, "step": 760}
{"info/global_step": 761, "train_info/time_within_train_step": 34.30576276779175, "step": 761}
{"train_info/time_between_train_steps": 0.01410531997680664, "step": 761}
{"info/global_step": 762, "train_info/time_within_train_step": 34.28077006340027, "step": 762}
{"train_info/time_between_train_steps": 0.00868535041809082, "step": 762}
{"info/global_step": 763, "train_info/time_within_train_step": 34.36265587806702, "step": 763}
{"train_info/time_between_train_steps": 0.00618743896484375, "step": 763}
{"info/global_step": 764, "train_info/time_within_train_step": 34.31991362571716, "step": 764}
{"train_info/time_between_train_steps": 0.010406732559204102, "step": 764}
{"info/global_step": 765, "train_info/time_within_train_step": 34.12204074859619, "step": 765}
{"train_info/time_between_train_steps": 0.016292810440063477, "step": 765}
{"info/global_step": 766, "train_info/time_within_train_step": 34.16937232017517, "step": 766}
{"train_info/time_between_train_steps": 0.00851130485534668, "step": 766}
{"info/global_step": 767, "train_info/time_within_train_step": 34.22804284095764, "step": 767}
{"train_info/time_between_train_steps": 0.006065845489501953, "step": 767}
{"info/global_step": 768, "train_info/time_within_train_step": 34.25669455528259, "step": 768}
{"train_info/time_between_train_steps": 0.00786137580871582, "step": 768}
{"info/global_step": 769, "train_info/time_within_train_step": 34.29105854034424, "step": 769}
{"train_info/time_between_train_steps": 0.011569976806640625, "step": 769}
{"info/global_step": 770, "train_info/time_within_train_step": 34.46993923187256, "step": 770}
{"train_info/time_between_train_steps": 0.011670827865600586, "step": 770}
{"info/global_step": 771, "train_info/time_within_train_step": 34.175307750701904, "step": 771}
{"train_info/time_between_train_steps": 0.007555723190307617, "step": 771}
{"info/global_step": 772, "train_info/time_within_train_step": 34.20494055747986, "step": 772}
{"train_info/time_between_train_steps": 0.0064470767974853516, "step": 772}
{"info/global_step": 773, "train_info/time_within_train_step": 34.17780542373657, "step": 773}
{"train_info/time_between_train_steps": 0.010807037353515625, "step": 773}
{"info/global_step": 774, "train_info/time_within_train_step": 34.30143475532532, "step": 774}
{"train_info/time_between_train_steps": 0.016083240509033203, "step": 774}
{"train_info/time_between_train_steps": 26.959977626800537, "step": 774}
{"info/global_step": 775, "train_info/time_within_train_step": 34.3423056602478, "step": 775}
{"train_info/time_between_train_steps": 0.006146669387817383, "step": 775}
{"info/global_step": 776, "train_info/time_within_train_step": 34.16590070724487, "step": 776}
{"train_info/time_between_train_steps": 0.006022453308105469, "step": 776}
{"info/global_step": 777, "train_info/time_within_train_step": 34.01650857925415, "step": 777}
{"train_info/time_between_train_steps": 0.006914377212524414, "step": 777}
{"info/global_step": 778, "train_info/time_within_train_step": 34.39302182197571, "step": 778}
{"train_info/time_between_train_steps": 0.00604701042175293, "step": 778}
{"info/global_step": 779, "train_info/time_within_train_step": 34.271909952163696, "step": 779}
{"train_info/time_between_train_steps": 0.0058858394622802734, "step": 779}
{"info/global_step": 780, "train_info/time_within_train_step": 34.38509511947632, "step": 780}
{"train_info/time_between_train_steps": 0.010360956192016602, "step": 780}
{"info/global_step": 781, "train_info/time_within_train_step": 34.09158778190613, "step": 781}
{"train_info/time_between_train_steps": 0.007579326629638672, "step": 781}
{"info/global_step": 782, "train_info/time_within_train_step": 34.342446088790894, "step": 782}
{"train_info/time_between_train_steps": 0.010389328002929688, "step": 782}
{"info/global_step": 783, "train_info/time_within_train_step": 34.23660850524902, "step": 783}
{"train_info/time_between_train_steps": 0.016112327575683594, "step": 783}
{"info/global_step": 784, "train_info/time_within_train_step": 34.453094720840454, "step": 784}
{"train_info/time_between_train_steps": 0.016469478607177734, "step": 784}
{"info/global_step": 785, "train_info/time_within_train_step": 34.347872734069824, "step": 785}
{"train_info/time_between_train_steps": 0.017347097396850586, "step": 785}
{"info/global_step": 786, "train_info/time_within_train_step": 34.45007061958313, "step": 786}
{"train_info/time_between_train_steps": 0.006096363067626953, "step": 786}
{"info/global_step": 787, "train_info/time_within_train_step": 34.244505167007446, "step": 787}
{"train_info/time_between_train_steps": 0.007980108261108398, "step": 787}
{"info/global_step": 788, "train_info/time_within_train_step": 34.43627119064331, "step": 788}
{"train_info/time_between_train_steps": 0.0074329376220703125, "step": 788}
{"info/global_step": 789, "train_info/time_within_train_step": 34.24014949798584, "step": 789}
{"train_info/time_between_train_steps": 0.019849300384521484, "step": 789}
{"info/global_step": 790, "train_info/time_within_train_step": 34.54691696166992, "step": 790}
{"train_info/time_between_train_steps": 0.01735091209411621, "step": 790}
{"info/global_step": 791, "train_info/time_within_train_step": 34.28130578994751, "step": 791}
{"train_info/time_between_train_steps": 0.0066967010498046875, "step": 791}
{"info/global_step": 792, "train_info/time_within_train_step": 34.42360043525696, "step": 792}
{"train_info/time_between_train_steps": 0.006651878356933594, "step": 792}
{"info/global_step": 793, "train_info/time_within_train_step": 34.26382064819336, "step": 793}
{"train_info/time_between_train_steps": 0.016466379165649414, "step": 793}
{"info/global_step": 794, "train_info/time_within_train_step": 34.84013533592224, "step": 794}
{"train_info/time_between_train_steps": 0.016775846481323242, "step": 794}
{"info/global_step": 795, "train_info/time_within_train_step": 34.30044913291931, "step": 795}
{"train_info/time_between_train_steps": 0.0066661834716796875, "step": 795}
{"info/global_step": 796, "train_info/time_within_train_step": 34.41482853889465, "step": 796}
{"train_info/time_between_train_steps": 0.006533384323120117, "step": 796}
{"info/global_step": 797, "train_info/time_within_train_step": 34.336069107055664, "step": 797}
{"train_info/time_between_train_steps": 0.016272306442260742, "step": 797}
{"info/global_step": 798, "train_info/time_within_train_step": 34.350369930267334, "step": 798}
{"train_info/time_between_train_steps": 0.012516260147094727, "step": 798}
{"info/global_step": 799, "train_info/time_within_train_step": 34.276323556900024, "step": 799}
{"train_info/time_between_train_steps": 0.011663198471069336, "step": 799}
{"info/global_step": 800, "train_info/time_within_train_step": 34.29197287559509, "step": 800}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1734131154, "_runtime": 27928}, "step": 800}
{"logs": {"train/loss": 2.3405, "train/learning_rate": 0.00022222222222222218, "train/epoch": 18.02, "_timestamp": 1734131154, "_runtime": 27928}, "step": 800}
{"train_info/time_between_train_steps": 2.340656280517578, "step": 800}
{"info/global_step": 801, "train_info/time_within_train_step": 34.49958848953247, "step": 801}
{"train_info/time_between_train_steps": 0.006017208099365234, "step": 801}
{"info/global_step": 802, "train_info/time_within_train_step": 34.17701816558838, "step": 802}
{"train_info/time_between_train_steps": 0.01611185073852539, "step": 802}
{"info/global_step": 803, "train_info/time_within_train_step": 34.191428422927856, "step": 803}
{"train_info/time_between_train_steps": 0.005883455276489258, "step": 803}
{"info/global_step": 804, "train_info/time_within_train_step": 34.26623845100403, "step": 804}
{"train_info/time_between_train_steps": 0.011721134185791016, "step": 804}
{"info/global_step": 805, "train_info/time_within_train_step": 34.06249165534973, "step": 805}
{"train_info/time_between_train_steps": 0.007919073104858398, "step": 805}
{"info/global_step": 806, "train_info/time_within_train_step": 34.16015291213989, "step": 806}
{"train_info/time_between_train_steps": 0.005609273910522461, "step": 806}
{"info/global_step": 807, "train_info/time_within_train_step": 34.08658266067505, "step": 807}
{"train_info/time_between_train_steps": 0.005779266357421875, "step": 807}
{"info/global_step": 808, "train_info/time_within_train_step": 34.140838861465454, "step": 808}
{"train_info/time_between_train_steps": 0.015404701232910156, "step": 808}
{"info/global_step": 809, "train_info/time_within_train_step": 34.26502299308777, "step": 809}
{"train_info/time_between_train_steps": 0.008978605270385742, "step": 809}
{"info/global_step": 810, "train_info/time_within_train_step": 34.36869478225708, "step": 810}
{"train_info/time_between_train_steps": 0.009534835815429688, "step": 810}
{"info/global_step": 811, "train_info/time_within_train_step": 34.132169246673584, "step": 811}
{"train_info/time_between_train_steps": 0.007456541061401367, "step": 811}
{"info/global_step": 812, "train_info/time_within_train_step": 34.246402740478516, "step": 812}
{"train_info/time_between_train_steps": 0.005877971649169922, "step": 812}
{"info/global_step": 813, "train_info/time_within_train_step": 34.18831276893616, "step": 813}
{"train_info/time_between_train_steps": 0.007258176803588867, "step": 813}
{"info/global_step": 814, "train_info/time_within_train_step": 34.23479700088501, "step": 814}
{"train_info/time_between_train_steps": 0.0058078765869140625, "step": 814}
{"info/global_step": 815, "train_info/time_within_train_step": 34.215495109558105, "step": 815}
{"train_info/time_between_train_steps": 0.010158777236938477, "step": 815}
{"info/global_step": 816, "train_info/time_within_train_step": 34.4714457988739, "step": 816}
{"train_info/time_between_train_steps": 0.006810665130615234, "step": 816}
{"info/global_step": 817, "train_info/time_within_train_step": 34.23707818984985, "step": 817}
{"train_info/time_between_train_steps": 0.017767906188964844, "step": 817}
{"train_info/time_between_train_steps": 26.748002767562866, "step": 817}
{"info/global_step": 818, "train_info/time_within_train_step": 34.286834955215454, "step": 818}
{"train_info/time_between_train_steps": 0.0070896148681640625, "step": 818}
{"info/global_step": 819, "train_info/time_within_train_step": 34.39852285385132, "step": 819}
{"train_info/time_between_train_steps": 0.014820098876953125, "step": 819}
{"info/global_step": 820, "train_info/time_within_train_step": 34.19866108894348, "step": 820}
{"train_info/time_between_train_steps": 0.0105438232421875, "step": 820}
{"info/global_step": 821, "train_info/time_within_train_step": 34.366469383239746, "step": 821}
{"train_info/time_between_train_steps": 0.01496267318725586, "step": 821}
{"info/global_step": 822, "train_info/time_within_train_step": 34.274616956710815, "step": 822}
{"train_info/time_between_train_steps": 0.017456769943237305, "step": 822}
{"info/global_step": 823, "train_info/time_within_train_step": 34.33998394012451, "step": 823}
{"train_info/time_between_train_steps": 0.010463953018188477, "step": 823}
{"info/global_step": 824, "train_info/time_within_train_step": 34.311384201049805, "step": 824}
{"train_info/time_between_train_steps": 0.009581804275512695, "step": 824}
{"info/global_step": 825, "train_info/time_within_train_step": 34.53688979148865, "step": 825}
{"train_info/time_between_train_steps": 0.01499176025390625, "step": 825}
{"info/global_step": 826, "train_info/time_within_train_step": 34.23944711685181, "step": 826}
{"train_info/time_between_train_steps": 0.006349325180053711, "step": 826}
{"info/global_step": 827, "train_info/time_within_train_step": 34.42324447631836, "step": 827}
{"train_info/time_between_train_steps": 0.005951642990112305, "step": 827}
{"info/global_step": 828, "train_info/time_within_train_step": 34.27533221244812, "step": 828}
{"train_info/time_between_train_steps": 0.010276079177856445, "step": 828}
{"info/global_step": 829, "train_info/time_within_train_step": 34.41749405860901, "step": 829}
{"train_info/time_between_train_steps": 0.010544776916503906, "step": 829}
{"info/global_step": 830, "train_info/time_within_train_step": 34.259504556655884, "step": 830}
{"train_info/time_between_train_steps": 0.012143611907958984, "step": 830}
{"info/global_step": 831, "train_info/time_within_train_step": 34.69096612930298, "step": 831}
{"train_info/time_between_train_steps": 0.01191258430480957, "step": 831}
{"info/global_step": 832, "train_info/time_within_train_step": 34.32181906700134, "step": 832}
{"train_info/time_between_train_steps": 0.016254425048828125, "step": 832}
{"info/global_step": 833, "train_info/time_within_train_step": 34.58566212654114, "step": 833}
{"train_info/time_between_train_steps": 0.006639003753662109, "step": 833}
{"info/global_step": 834, "train_info/time_within_train_step": 34.21125674247742, "step": 834}
{"train_info/time_between_train_steps": 0.01635289192199707, "step": 834}
{"info/global_step": 835, "train_info/time_within_train_step": 34.375266313552856, "step": 835}
{"train_info/time_between_train_steps": 0.006385087966918945, "step": 835}
{"info/global_step": 836, "train_info/time_within_train_step": 34.22850251197815, "step": 836}
{"train_info/time_between_train_steps": 0.010747194290161133, "step": 836}
{"info/global_step": 837, "train_info/time_within_train_step": 34.281336545944214, "step": 837}
{"train_info/time_between_train_steps": 0.006486177444458008, "step": 837}
{"info/global_step": 838, "train_info/time_within_train_step": 34.114501953125, "step": 838}
{"train_info/time_between_train_steps": 0.006327152252197266, "step": 838}
{"info/global_step": 839, "train_info/time_within_train_step": 34.52745270729065, "step": 839}
{"train_info/time_between_train_steps": 0.006459951400756836, "step": 839}
{"info/global_step": 840, "train_info/time_within_train_step": 34.09563183784485, "step": 840}
{"train_info/time_between_train_steps": 0.0063512325286865234, "step": 840}
{"info/global_step": 841, "train_info/time_within_train_step": 34.307016372680664, "step": 841}
{"train_info/time_between_train_steps": 0.010487556457519531, "step": 841}
{"info/global_step": 842, "train_info/time_within_train_step": 34.154725313186646, "step": 842}
{"train_info/time_between_train_steps": 0.009968280792236328, "step": 842}
{"info/global_step": 843, "train_info/time_within_train_step": 34.05165982246399, "step": 843}
{"train_info/time_between_train_steps": 0.005986213684082031, "step": 843}
{"info/global_step": 844, "train_info/time_within_train_step": 34.0968074798584, "step": 844}
{"train_info/time_between_train_steps": 0.005984067916870117, "step": 844}
{"info/global_step": 845, "train_info/time_within_train_step": 34.08921480178833, "step": 845}
{"train_info/time_between_train_steps": 0.010230064392089844, "step": 845}
{"info/global_step": 846, "train_info/time_within_train_step": 34.141289472579956, "step": 846}
{"train_info/time_between_train_steps": 0.010730743408203125, "step": 846}
{"info/global_step": 847, "train_info/time_within_train_step": 34.466209411621094, "step": 847}
{"train_info/time_between_train_steps": 0.011311054229736328, "step": 847}
{"info/global_step": 848, "train_info/time_within_train_step": 34.19258642196655, "step": 848}
{"train_info/time_between_train_steps": 0.010233640670776367, "step": 848}
{"info/global_step": 849, "train_info/time_within_train_step": 34.20340347290039, "step": 849}
{"train_info/time_between_train_steps": 0.015459060668945312, "step": 849}
{"info/global_step": 850, "train_info/time_within_train_step": 34.27547001838684, "step": 850}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1734132897, "_runtime": 29671}, "step": 850}
{"logs": {"train/loss": 2.3063, "train/learning_rate": 0.00019444444444444443, "train/epoch": 19.03, "_timestamp": 1734132897, "_runtime": 29671}, "step": 850}
{"train_info/time_between_train_steps": 0.008060216903686523, "step": 850}
{"info/global_step": 851, "train_info/time_within_train_step": 34.117738485336304, "step": 851}
{"train_info/time_between_train_steps": 0.005760669708251953, "step": 851}
{"info/global_step": 852, "train_info/time_within_train_step": 34.21535611152649, "step": 852}
{"train_info/time_between_train_steps": 0.010104894638061523, "step": 852}
{"info/global_step": 853, "train_info/time_within_train_step": 34.22442841529846, "step": 853}
{"train_info/time_between_train_steps": 0.009912490844726562, "step": 853}
{"info/global_step": 854, "train_info/time_within_train_step": 34.17896246910095, "step": 854}
{"train_info/time_between_train_steps": 0.012707710266113281, "step": 854}
{"info/global_step": 855, "train_info/time_within_train_step": 34.175692319869995, "step": 855}
{"train_info/time_between_train_steps": 0.006331443786621094, "step": 855}
{"info/global_step": 856, "train_info/time_within_train_step": 34.17099738121033, "step": 856}
{"train_info/time_between_train_steps": 0.0064525604248046875, "step": 856}
{"info/global_step": 857, "train_info/time_within_train_step": 34.20733618736267, "step": 857}
{"train_info/time_between_train_steps": 0.01040339469909668, "step": 857}
{"info/global_step": 858, "train_info/time_within_train_step": 34.23507523536682, "step": 858}
{"train_info/time_between_train_steps": 0.015470504760742188, "step": 858}
{"info/global_step": 859, "train_info/time_within_train_step": 34.217199087142944, "step": 859}
{"train_info/time_between_train_steps": 0.0059854984283447266, "step": 859}
{"info/global_step": 860, "train_info/time_within_train_step": 34.0879008769989, "step": 860}
{"train_info/time_between_train_steps": 0.006984710693359375, "step": 860}
{"train_info/time_between_train_steps": 27.06364369392395, "step": 860}
{"info/global_step": 861, "train_info/time_within_train_step": 34.23546624183655, "step": 861}
{"train_info/time_between_train_steps": 0.006369113922119141, "step": 861}
{"info/global_step": 862, "train_info/time_within_train_step": 34.58522844314575, "step": 862}
{"train_info/time_between_train_steps": 0.011569499969482422, "step": 862}
{"info/global_step": 863, "train_info/time_within_train_step": 34.43185329437256, "step": 863}
{"train_info/time_between_train_steps": 0.006426572799682617, "step": 863}
{"info/global_step": 864, "train_info/time_within_train_step": 34.565324544906616, "step": 864}
{"train_info/time_between_train_steps": 0.0070497989654541016, "step": 864}
{"info/global_step": 865, "train_info/time_within_train_step": 34.20892572402954, "step": 865}
{"train_info/time_between_train_steps": 0.013046741485595703, "step": 865}
{"info/global_step": 866, "train_info/time_within_train_step": 34.36424446105957, "step": 866}
{"train_info/time_between_train_steps": 0.0069122314453125, "step": 866}
{"info/global_step": 867, "train_info/time_within_train_step": 34.20874881744385, "step": 867}
{"train_info/time_between_train_steps": 0.006027936935424805, "step": 867}
{"info/global_step": 868, "train_info/time_within_train_step": 34.353673696517944, "step": 868}
{"train_info/time_between_train_steps": 0.017554759979248047, "step": 868}
{"info/global_step": 869, "train_info/time_within_train_step": 34.21751379966736, "step": 869}
{"train_info/time_between_train_steps": 0.008165597915649414, "step": 869}
{"info/global_step": 870, "train_info/time_within_train_step": 34.33793759346008, "step": 870}
{"train_info/time_between_train_steps": 0.0062160491943359375, "step": 870}
{"info/global_step": 871, "train_info/time_within_train_step": 34.23542928695679, "step": 871}
{"train_info/time_between_train_steps": 0.006586313247680664, "step": 871}
{"info/global_step": 872, "train_info/time_within_train_step": 34.44032096862793, "step": 872}
{"train_info/time_between_train_steps": 0.0061359405517578125, "step": 872}
{"info/global_step": 873, "train_info/time_within_train_step": 34.2692232131958, "step": 873}
{"train_info/time_between_train_steps": 0.015711307525634766, "step": 873}
{"info/global_step": 874, "train_info/time_within_train_step": 34.40834641456604, "step": 874}
{"train_info/time_between_train_steps": 0.009416341781616211, "step": 874}
{"info/global_step": 875, "train_info/time_within_train_step": 34.337443351745605, "step": 875}
{"train_info/time_between_train_steps": 0.010382890701293945, "step": 875}
{"info/global_step": 876, "train_info/time_within_train_step": 34.49380445480347, "step": 876}
{"train_info/time_between_train_steps": 0.006403207778930664, "step": 876}
{"info/global_step": 877, "train_info/time_within_train_step": 34.370619773864746, "step": 877}
{"train_info/time_between_train_steps": 0.010065078735351562, "step": 877}
{"info/global_step": 878, "train_info/time_within_train_step": 34.3796591758728, "step": 878}
{"train_info/time_between_train_steps": 0.006142377853393555, "step": 878}
{"info/global_step": 879, "train_info/time_within_train_step": 34.11621856689453, "step": 879}
{"train_info/time_between_train_steps": 0.0064487457275390625, "step": 879}
{"info/global_step": 880, "train_info/time_within_train_step": 34.450990438461304, "step": 880}
{"train_info/time_between_train_steps": 0.015514612197875977, "step": 880}
{"info/global_step": 881, "train_info/time_within_train_step": 34.17484903335571, "step": 881}
{"train_info/time_between_train_steps": 0.011541128158569336, "step": 881}
{"info/global_step": 882, "train_info/time_within_train_step": 34.322531938552856, "step": 882}
{"train_info/time_between_train_steps": 0.005950212478637695, "step": 882}
{"info/global_step": 883, "train_info/time_within_train_step": 34.53112006187439, "step": 883}
{"train_info/time_between_train_steps": 0.01177072525024414, "step": 883}
{"info/global_step": 884, "train_info/time_within_train_step": 34.266932010650635, "step": 884}
{"train_info/time_between_train_steps": 0.011919260025024414, "step": 884}
{"info/global_step": 885, "train_info/time_within_train_step": 34.17420983314514, "step": 885}
{"train_info/time_between_train_steps": 0.01590442657470703, "step": 885}
{"info/global_step": 886, "train_info/time_within_train_step": 34.16612982749939, "step": 886}
{"train_info/time_between_train_steps": 0.006650686264038086, "step": 886}
{"info/global_step": 887, "train_info/time_within_train_step": 34.12562966346741, "step": 887}
{"train_info/time_between_train_steps": 0.007907390594482422, "step": 887}
{"info/global_step": 888, "train_info/time_within_train_step": 34.15193963050842, "step": 888}
{"train_info/time_between_train_steps": 0.005717754364013672, "step": 888}
{"info/global_step": 889, "train_info/time_within_train_step": 34.048280477523804, "step": 889}
{"train_info/time_between_train_steps": 0.015403509140014648, "step": 889}
{"info/global_step": 890, "train_info/time_within_train_step": 34.14579129219055, "step": 890}
{"train_info/time_between_train_steps": 0.015247106552124023, "step": 890}
{"info/global_step": 891, "train_info/time_within_train_step": 34.17950940132141, "step": 891}
{"train_info/time_between_train_steps": 0.006099224090576172, "step": 891}
{"info/global_step": 892, "train_info/time_within_train_step": 34.28196144104004, "step": 892}
{"train_info/time_between_train_steps": 0.009073972702026367, "step": 892}
{"info/global_step": 893, "train_info/time_within_train_step": 34.43348431587219, "step": 893}
{"train_info/time_between_train_steps": 0.015609979629516602, "step": 893}
{"info/global_step": 894, "train_info/time_within_train_step": 34.22318410873413, "step": 894}
{"train_info/time_between_train_steps": 0.006026744842529297, "step": 894}
{"info/global_step": 895, "train_info/time_within_train_step": 34.15696382522583, "step": 895}
{"train_info/time_between_train_steps": 0.006148338317871094, "step": 895}
{"info/global_step": 896, "train_info/time_within_train_step": 34.14887619018555, "step": 896}
{"train_info/time_between_train_steps": 0.005994558334350586, "step": 896}
{"info/global_step": 897, "train_info/time_within_train_step": 34.28132510185242, "step": 897}
{"train_info/time_between_train_steps": 0.006193637847900391, "step": 897}
{"info/global_step": 898, "train_info/time_within_train_step": 34.249462366104126, "step": 898}
{"train_info/time_between_train_steps": 0.010420799255371094, "step": 898}
{"info/global_step": 899, "train_info/time_within_train_step": 34.37227773666382, "step": 899}
{"train_info/time_between_train_steps": 0.006260871887207031, "step": 899}
{"info/global_step": 900, "train_info/time_within_train_step": 34.196027994155884, "step": 900}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1734134639, "_runtime": 31413}, "step": 900}
{"logs": {"train/loss": 2.2768, "train/learning_rate": 0.00016666666666666666, "train/epoch": 20.03, "_timestamp": 1734134639, "_runtime": 31413}, "step": 900}
{"train_info/time_between_train_steps": 2.4828743934631348, "step": 900}
{"info/global_step": 901, "train_info/time_within_train_step": 34.17523980140686, "step": 901}
{"train_info/time_between_train_steps": 0.007928133010864258, "step": 901}
{"info/global_step": 902, "train_info/time_within_train_step": 34.269044160842896, "step": 902}
{"train_info/time_between_train_steps": 0.011545181274414062, "step": 902}
{"info/global_step": 903, "train_info/time_within_train_step": 34.1886510848999, "step": 903}
{"train_info/time_between_train_steps": 0.007131814956665039, "step": 903}
{"train_info/time_between_train_steps": 27.10485291481018, "step": 903}
{"info/global_step": 904, "train_info/time_within_train_step": 34.19366526603699, "step": 904}
{"train_info/time_between_train_steps": 0.010761499404907227, "step": 904}
{"info/global_step": 905, "train_info/time_within_train_step": 34.20948624610901, "step": 905}
{"train_info/time_between_train_steps": 0.005715131759643555, "step": 905}
{"info/global_step": 906, "train_info/time_within_train_step": 34.189494371414185, "step": 906}
{"train_info/time_between_train_steps": 0.011523962020874023, "step": 906}
{"info/global_step": 907, "train_info/time_within_train_step": 34.2526171207428, "step": 907}
{"train_info/time_between_train_steps": 0.005902767181396484, "step": 907}
{"info/global_step": 908, "train_info/time_within_train_step": 34.42653751373291, "step": 908}
{"train_info/time_between_train_steps": 0.015253067016601562, "step": 908}
{"info/global_step": 909, "train_info/time_within_train_step": 34.3089542388916, "step": 909}
{"train_info/time_between_train_steps": 0.00635981559753418, "step": 909}
{"info/global_step": 910, "train_info/time_within_train_step": 34.22803497314453, "step": 910}
{"train_info/time_between_train_steps": 0.008904218673706055, "step": 910}
{"info/global_step": 911, "train_info/time_within_train_step": 34.138240575790405, "step": 911}
{"train_info/time_between_train_steps": 0.010040044784545898, "step": 911}
{"info/global_step": 912, "train_info/time_within_train_step": 34.08813118934631, "step": 912}
{"train_info/time_between_train_steps": 0.012991666793823242, "step": 912}
{"info/global_step": 913, "train_info/time_within_train_step": 34.362653732299805, "step": 913}
{"train_info/time_between_train_steps": 0.005877256393432617, "step": 913}
{"info/global_step": 914, "train_info/time_within_train_step": 34.10465431213379, "step": 914}
{"train_info/time_between_train_steps": 0.016505956649780273, "step": 914}
{"info/global_step": 915, "train_info/time_within_train_step": 34.34658169746399, "step": 915}
{"train_info/time_between_train_steps": 0.0057451725006103516, "step": 915}
{"info/global_step": 916, "train_info/time_within_train_step": 34.132941007614136, "step": 916}
{"train_info/time_between_train_steps": 0.005562305450439453, "step": 916}
{"info/global_step": 917, "train_info/time_within_train_step": 34.21564555168152, "step": 917}
{"train_info/time_between_train_steps": 0.005716800689697266, "step": 917}
{"info/global_step": 918, "train_info/time_within_train_step": 34.112443685531616, "step": 918}
{"train_info/time_between_train_steps": 0.0064890384674072266, "step": 918}
{"info/global_step": 919, "train_info/time_within_train_step": 34.340616941452026, "step": 919}
{"train_info/time_between_train_steps": 0.006421089172363281, "step": 919}
{"info/global_step": 920, "train_info/time_within_train_step": 34.13861060142517, "step": 920}
{"train_info/time_between_train_steps": 0.006272077560424805, "step": 920}
{"info/global_step": 921, "train_info/time_within_train_step": 34.412436962127686, "step": 921}
{"train_info/time_between_train_steps": 0.015813112258911133, "step": 921}
{"info/global_step": 922, "train_info/time_within_train_step": 34.11564517021179, "step": 922}
{"train_info/time_between_train_steps": 0.010760307312011719, "step": 922}
{"info/global_step": 923, "train_info/time_within_train_step": 34.27817988395691, "step": 923}
{"train_info/time_between_train_steps": 0.007055521011352539, "step": 923}
{"info/global_step": 924, "train_info/time_within_train_step": 34.32755756378174, "step": 924}
{"train_info/time_between_train_steps": 0.006166219711303711, "step": 924}
{"info/global_step": 925, "train_info/time_within_train_step": 34.17571496963501, "step": 925}
{"train_info/time_between_train_steps": 0.0125274658203125, "step": 925}
{"info/global_step": 926, "train_info/time_within_train_step": 34.160751819610596, "step": 926}
{"train_info/time_between_train_steps": 0.0069522857666015625, "step": 926}
{"info/global_step": 927, "train_info/time_within_train_step": 34.21443796157837, "step": 927}
{"train_info/time_between_train_steps": 0.010837554931640625, "step": 927}
{"info/global_step": 928, "train_info/time_within_train_step": 34.07856607437134, "step": 928}
{"train_info/time_between_train_steps": 0.010877132415771484, "step": 928}
{"info/global_step": 929, "train_info/time_within_train_step": 34.11731815338135, "step": 929}
{"train_info/time_between_train_steps": 0.0057561397552490234, "step": 929}
{"info/global_step": 930, "train_info/time_within_train_step": 34.0112783908844, "step": 930}
{"train_info/time_between_train_steps": 0.013057231903076172, "step": 930}
{"info/global_step": 931, "train_info/time_within_train_step": 34.12925696372986, "step": 931}
{"train_info/time_between_train_steps": 0.01034855842590332, "step": 931}
{"info/global_step": 932, "train_info/time_within_train_step": 34.01408767700195, "step": 932}
{"train_info/time_between_train_steps": 0.0058557987213134766, "step": 932}
{"info/global_step": 933, "train_info/time_within_train_step": 34.12556290626526, "step": 933}
{"train_info/time_between_train_steps": 0.007503509521484375, "step": 933}
{"info/global_step": 934, "train_info/time_within_train_step": 34.07360863685608, "step": 934}
{"train_info/time_between_train_steps": 0.0062541961669921875, "step": 934}
{"info/global_step": 935, "train_info/time_within_train_step": 34.111966371536255, "step": 935}
{"train_info/time_between_train_steps": 0.006078004837036133, "step": 935}
{"info/global_step": 936, "train_info/time_within_train_step": 34.15686845779419, "step": 936}
{"train_info/time_between_train_steps": 0.005871772766113281, "step": 936}
{"info/global_step": 937, "train_info/time_within_train_step": 34.08384108543396, "step": 937}
{"train_info/time_between_train_steps": 0.0060749053955078125, "step": 937}
{"info/global_step": 938, "train_info/time_within_train_step": 34.07208728790283, "step": 938}
{"train_info/time_between_train_steps": 0.016588687896728516, "step": 938}
{"info/global_step": 939, "train_info/time_within_train_step": 34.35982298851013, "step": 939}
{"train_info/time_between_train_steps": 0.005881547927856445, "step": 939}
{"info/global_step": 940, "train_info/time_within_train_step": 34.107320070266724, "step": 940}
{"train_info/time_between_train_steps": 0.010849237442016602, "step": 940}
{"info/global_step": 941, "train_info/time_within_train_step": 34.07608675956726, "step": 941}
{"train_info/time_between_train_steps": 0.010972023010253906, "step": 941}
{"info/global_step": 942, "train_info/time_within_train_step": 34.0812246799469, "step": 942}
{"train_info/time_between_train_steps": 0.005838155746459961, "step": 942}
{"info/global_step": 943, "train_info/time_within_train_step": 33.92925524711609, "step": 943}
{"train_info/time_between_train_steps": 0.0058667659759521484, "step": 943}
{"info/global_step": 944, "train_info/time_within_train_step": 33.9324836730957, "step": 944}
{"train_info/time_between_train_steps": 0.006687164306640625, "step": 944}
{"info/global_step": 945, "train_info/time_within_train_step": 33.94490051269531, "step": 945}
{"train_info/time_between_train_steps": 0.0058438777923583984, "step": 945}
{"info/global_step": 946, "train_info/time_within_train_step": 33.99585509300232, "step": 946}
{"train_info/time_between_train_steps": 0.0072765350341796875, "step": 946}
{"train_info/time_between_train_steps": 26.40818738937378, "step": 946}
{"info/global_step": 947, "train_info/time_within_train_step": 33.937848806381226, "step": 947}
{"train_info/time_between_train_steps": 0.005491495132446289, "step": 947}
{"info/global_step": 948, "train_info/time_within_train_step": 34.07169198989868, "step": 948}
{"train_info/time_between_train_steps": 0.01093602180480957, "step": 948}
{"info/global_step": 949, "train_info/time_within_train_step": 34.027287006378174, "step": 949}
{"train_info/time_between_train_steps": 0.00585174560546875, "step": 949}
{"info/global_step": 950, "train_info/time_within_train_step": 34.172181129455566, "step": 950}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1734136403, "_runtime": 33177}, "step": 950}
{"logs": {"train/loss": 2.2799, "train/learning_rate": 0.0001388888888888889, "train/epoch": 22.0, "_timestamp": 1734136403, "_runtime": 33177}, "step": 950}
{"train_info/time_between_train_steps": 0.007848978042602539, "step": 950}
{"info/global_step": 951, "train_info/time_within_train_step": 33.9336838722229, "step": 951}
{"train_info/time_between_train_steps": 0.010345697402954102, "step": 951}
{"info/global_step": 952, "train_info/time_within_train_step": 34.07649207115173, "step": 952}
{"train_info/time_between_train_steps": 0.00563502311706543, "step": 952}
{"info/global_step": 953, "train_info/time_within_train_step": 33.915390491485596, "step": 953}
{"train_info/time_between_train_steps": 0.005829334259033203, "step": 953}
{"info/global_step": 954, "train_info/time_within_train_step": 34.34664702415466, "step": 954}
{"train_info/time_between_train_steps": 0.005751371383666992, "step": 954}
{"info/global_step": 955, "train_info/time_within_train_step": 33.90649938583374, "step": 955}
{"train_info/time_between_train_steps": 0.005768299102783203, "step": 955}
{"info/global_step": 956, "train_info/time_within_train_step": 34.05367159843445, "step": 956}
{"train_info/time_between_train_steps": 0.009830474853515625, "step": 956}
{"info/global_step": 957, "train_info/time_within_train_step": 34.144235610961914, "step": 957}
{"train_info/time_between_train_steps": 0.005796194076538086, "step": 957}
{"info/global_step": 958, "train_info/time_within_train_step": 34.13447833061218, "step": 958}
{"train_info/time_between_train_steps": 0.011500358581542969, "step": 958}
{"info/global_step": 959, "train_info/time_within_train_step": 34.0697705745697, "step": 959}
{"train_info/time_between_train_steps": 0.00616455078125, "step": 959}
{"info/global_step": 960, "train_info/time_within_train_step": 34.072986364364624, "step": 960}
{"train_info/time_between_train_steps": 0.0074002742767333984, "step": 960}
{"info/global_step": 961, "train_info/time_within_train_step": 33.93251585960388, "step": 961}
{"train_info/time_between_train_steps": 0.005615234375, "step": 961}
{"info/global_step": 962, "train_info/time_within_train_step": 34.057374715805054, "step": 962}
{"train_info/time_between_train_steps": 0.005877494812011719, "step": 962}
{"info/global_step": 963, "train_info/time_within_train_step": 33.99641823768616, "step": 963}
{"train_info/time_between_train_steps": 0.005975484848022461, "step": 963}
{"info/global_step": 964, "train_info/time_within_train_step": 34.191415309906006, "step": 964}
{"train_info/time_between_train_steps": 0.009399175643920898, "step": 964}
{"info/global_step": 965, "train_info/time_within_train_step": 33.94884443283081, "step": 965}
{"train_info/time_between_train_steps": 0.0057528018951416016, "step": 965}
{"info/global_step": 966, "train_info/time_within_train_step": 34.05805063247681, "step": 966}
{"train_info/time_between_train_steps": 0.00579524040222168, "step": 966}
{"info/global_step": 967, "train_info/time_within_train_step": 33.966967821121216, "step": 967}
{"train_info/time_between_train_steps": 0.005886554718017578, "step": 967}
{"info/global_step": 968, "train_info/time_within_train_step": 34.405919551849365, "step": 968}
{"train_info/time_between_train_steps": 0.012041091918945312, "step": 968}
{"info/global_step": 969, "train_info/time_within_train_step": 34.04548954963684, "step": 969}
{"train_info/time_between_train_steps": 0.00591278076171875, "step": 969}
{"info/global_step": 970, "train_info/time_within_train_step": 34.27181148529053, "step": 970}
{"train_info/time_between_train_steps": 0.005667209625244141, "step": 970}
{"info/global_step": 971, "train_info/time_within_train_step": 33.91901779174805, "step": 971}
{"train_info/time_between_train_steps": 0.005566120147705078, "step": 971}
{"info/global_step": 972, "train_info/time_within_train_step": 33.90877437591553, "step": 972}
{"train_info/time_between_train_steps": 0.005680561065673828, "step": 972}
{"info/global_step": 973, "train_info/time_within_train_step": 34.00944709777832, "step": 973}
{"train_info/time_between_train_steps": 0.005750894546508789, "step": 973}
{"info/global_step": 974, "train_info/time_within_train_step": 33.94278860092163, "step": 974}
{"train_info/time_between_train_steps": 0.005898475646972656, "step": 974}
{"info/global_step": 975, "train_info/time_within_train_step": 33.92260503768921, "step": 975}
{"train_info/time_between_train_steps": 0.0058536529541015625, "step": 975}
{"info/global_step": 976, "train_info/time_within_train_step": 33.95765423774719, "step": 976}
{"train_info/time_between_train_steps": 0.005659341812133789, "step": 976}
{"info/global_step": 977, "train_info/time_within_train_step": 34.13049364089966, "step": 977}
{"train_info/time_between_train_steps": 0.005768775939941406, "step": 977}
{"info/global_step": 978, "train_info/time_within_train_step": 34.0544798374176, "step": 978}
{"train_info/time_between_train_steps": 0.005557060241699219, "step": 978}
{"info/global_step": 979, "train_info/time_within_train_step": 33.9323194026947, "step": 979}
{"train_info/time_between_train_steps": 0.005556821823120117, "step": 979}
{"info/global_step": 980, "train_info/time_within_train_step": 33.99165749549866, "step": 980}
{"train_info/time_between_train_steps": 0.010528326034545898, "step": 980}
{"info/global_step": 981, "train_info/time_within_train_step": 33.93170189857483, "step": 981}
{"train_info/time_between_train_steps": 0.009847402572631836, "step": 981}
{"info/global_step": 982, "train_info/time_within_train_step": 34.26586651802063, "step": 982}
{"train_info/time_between_train_steps": 0.009850263595581055, "step": 982}
{"info/global_step": 983, "train_info/time_within_train_step": 33.97601628303528, "step": 983}
{"train_info/time_between_train_steps": 0.006260871887207031, "step": 983}
{"info/global_step": 984, "train_info/time_within_train_step": 33.917027711868286, "step": 984}
{"train_info/time_between_train_steps": 0.0056896209716796875, "step": 984}
{"info/global_step": 985, "train_info/time_within_train_step": 34.110342502593994, "step": 985}
{"train_info/time_between_train_steps": 0.005809307098388672, "step": 985}
{"info/global_step": 986, "train_info/time_within_train_step": 33.92935824394226, "step": 986}
{"train_info/time_between_train_steps": 0.005705595016479492, "step": 986}
{"info/global_step": 987, "train_info/time_within_train_step": 33.925607442855835, "step": 987}
{"train_info/time_between_train_steps": 0.009957313537597656, "step": 987}
{"info/global_step": 988, "train_info/time_within_train_step": 33.954437494277954, "step": 988}
{"train_info/time_between_train_steps": 0.010384798049926758, "step": 988}
{"info/global_step": 989, "train_info/time_within_train_step": 33.9338116645813, "step": 989}
{"train_info/time_between_train_steps": 0.0071485042572021484, "step": 989}
{"train_info/time_between_train_steps": 26.493628978729248, "step": 989}
{"info/global_step": 990, "train_info/time_within_train_step": 33.91390657424927, "step": 990}
{"train_info/time_between_train_steps": 0.005485057830810547, "step": 990}
{"info/global_step": 991, "train_info/time_within_train_step": 34.02641773223877, "step": 991}
{"train_info/time_between_train_steps": 0.005513429641723633, "step": 991}
{"info/global_step": 992, "train_info/time_within_train_step": 34.0487380027771, "step": 992}
{"train_info/time_between_train_steps": 0.009821891784667969, "step": 992}
{"info/global_step": 993, "train_info/time_within_train_step": 34.33652663230896, "step": 993}
{"train_info/time_between_train_steps": 0.005834341049194336, "step": 993}
{"info/global_step": 994, "train_info/time_within_train_step": 33.9742157459259, "step": 994}
{"train_info/time_between_train_steps": 0.00578618049621582, "step": 994}
{"info/global_step": 995, "train_info/time_within_train_step": 34.07072305679321, "step": 995}
{"train_info/time_between_train_steps": 0.005777835845947266, "step": 995}
{"info/global_step": 996, "train_info/time_within_train_step": 33.913206577301025, "step": 996}
{"train_info/time_between_train_steps": 0.005757331848144531, "step": 996}
{"info/global_step": 997, "train_info/time_within_train_step": 34.07409954071045, "step": 997}
{"train_info/time_between_train_steps": 0.005761623382568359, "step": 997}
{"info/global_step": 998, "train_info/time_within_train_step": 33.99646067619324, "step": 998}
{"train_info/time_between_train_steps": 0.005601644515991211, "step": 998}
{"info/global_step": 999, "train_info/time_within_train_step": 34.0934157371521, "step": 999}
{"train_info/time_between_train_steps": 0.006064653396606445, "step": 999}
{"info/global_step": 1000, "train_info/time_within_train_step": 34.15969514846802, "step": 1000}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1734138131, "_runtime": 34905}, "step": 1000}
{"logs": {"train/loss": 2.2247, "train/learning_rate": 0.00011111111111111109, "train/epoch": 23.01, "_timestamp": 1734138131, "_runtime": 34905}, "step": 1000}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1734138135, "_runtime": 34909}, "step": 1000}
{"logs": {"eval/loss": 2.6665191650390625, "eval/runtime": 3.9154, "eval/samples_per_second": 41.631, "eval/steps_per_second": 2.809, "train/epoch": 23.01, "_timestamp": 1734138135, "_runtime": 34909}, "step": 1000}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1734138135, "_runtime": 34909}, "step": 1000}
{"logs": {"eval//local/xiulyang/mission-impossible-language-models/training/babylm_dataset.py_loss": 2.6665191650390625, "eval//local/xiulyang/mission-impossible-language-models/training/babylm_dataset.py_ppl": 14.389793420654337, "eval//local/xiulyang/mission-impossible-language-models/training/babylm_dataset.py_runtime": 3.9154, "eval//local/xiulyang/mission-impossible-language-models/training/babylm_dataset.py_samples_per_second": 41.631, "train/epoch": 23.01, "_timestamp": 1734138135, "_runtime": 34909}, "step": 1000}
{"train_info/time_between_train_steps": 6.326541185379028, "step": 1000}
{"info/global_step": 1001, "train_info/time_within_train_step": 34.070326805114746, "step": 1001}
{"train_info/time_between_train_steps": 0.005808830261230469, "step": 1001}
{"info/global_step": 1002, "train_info/time_within_train_step": 34.059762477874756, "step": 1002}
{"train_info/time_between_train_steps": 0.01061558723449707, "step": 1002}
{"info/global_step": 1003, "train_info/time_within_train_step": 34.19774031639099, "step": 1003}
{"train_info/time_between_train_steps": 0.005789995193481445, "step": 1003}
{"info/global_step": 1004, "train_info/time_within_train_step": 34.032607555389404, "step": 1004}
{"train_info/time_between_train_steps": 0.005682945251464844, "step": 1004}
{"info/global_step": 1005, "train_info/time_within_train_step": 34.026185274124146, "step": 1005}
{"train_info/time_between_train_steps": 0.005745649337768555, "step": 1005}
{"info/global_step": 1006, "train_info/time_within_train_step": 33.92703032493591, "step": 1006}
{"train_info/time_between_train_steps": 0.006201267242431641, "step": 1006}
{"info/global_step": 1007, "train_info/time_within_train_step": 34.148635387420654, "step": 1007}
{"train_info/time_between_train_steps": 0.006073713302612305, "step": 1007}
{"info/global_step": 1008, "train_info/time_within_train_step": 33.922956466674805, "step": 1008}
{"train_info/time_between_train_steps": 0.00607752799987793, "step": 1008}
{"info/global_step": 1009, "train_info/time_within_train_step": 34.15241599082947, "step": 1009}
{"train_info/time_between_train_steps": 0.005766868591308594, "step": 1009}
{"info/global_step": 1010, "train_info/time_within_train_step": 33.97430992126465, "step": 1010}
{"train_info/time_between_train_steps": 0.005704402923583984, "step": 1010}
{"info/global_step": 1011, "train_info/time_within_train_step": 34.14553356170654, "step": 1011}
{"train_info/time_between_train_steps": 0.005882978439331055, "step": 1011}
{"info/global_step": 1012, "train_info/time_within_train_step": 34.042195558547974, "step": 1012}
{"train_info/time_between_train_steps": 0.006098747253417969, "step": 1012}
{"info/global_step": 1013, "train_info/time_within_train_step": 34.0646288394928, "step": 1013}
{"train_info/time_between_train_steps": 0.006937980651855469, "step": 1013}
{"info/global_step": 1014, "train_info/time_within_train_step": 34.01616907119751, "step": 1014}
{"train_info/time_between_train_steps": 0.005794048309326172, "step": 1014}
{"info/global_step": 1015, "train_info/time_within_train_step": 33.97951126098633, "step": 1015}
{"train_info/time_between_train_steps": 0.0057604312896728516, "step": 1015}
{"info/global_step": 1016, "train_info/time_within_train_step": 34.25823616981506, "step": 1016}
{"train_info/time_between_train_steps": 0.010168313980102539, "step": 1016}
{"info/global_step": 1017, "train_info/time_within_train_step": 34.03421068191528, "step": 1017}
{"train_info/time_between_train_steps": 0.0058689117431640625, "step": 1017}
{"info/global_step": 1018, "train_info/time_within_train_step": 33.995872259140015, "step": 1018}
{"train_info/time_between_train_steps": 0.005963563919067383, "step": 1018}
{"info/global_step": 1019, "train_info/time_within_train_step": 34.05829405784607, "step": 1019}
{"train_info/time_between_train_steps": 0.006232500076293945, "step": 1019}
{"info/global_step": 1020, "train_info/time_within_train_step": 33.99742579460144, "step": 1020}
{"train_info/time_between_train_steps": 0.0056304931640625, "step": 1020}
{"info/global_step": 1021, "train_info/time_within_train_step": 34.054168462753296, "step": 1021}
{"train_info/time_between_train_steps": 0.005605936050415039, "step": 1021}
{"info/global_step": 1022, "train_info/time_within_train_step": 33.9277925491333, "step": 1022}
{"train_info/time_between_train_steps": 0.010802745819091797, "step": 1022}
{"info/global_step": 1023, "train_info/time_within_train_step": 33.970675230026245, "step": 1023}
{"train_info/time_between_train_steps": 0.010020971298217773, "step": 1023}
{"info/global_step": 1024, "train_info/time_within_train_step": 34.07091569900513, "step": 1024}
{"train_info/time_between_train_steps": 0.005634307861328125, "step": 1024}
{"info/global_step": 1025, "train_info/time_within_train_step": 33.924468994140625, "step": 1025}
{"train_info/time_between_train_steps": 0.005610942840576172, "step": 1025}
{"info/global_step": 1026, "train_info/time_within_train_step": 33.96419954299927, "step": 1026}
{"train_info/time_between_train_steps": 0.005930662155151367, "step": 1026}
{"info/global_step": 1027, "train_info/time_within_train_step": 33.94988656044006, "step": 1027}
{"train_info/time_between_train_steps": 0.005807161331176758, "step": 1027}
{"info/global_step": 1028, "train_info/time_within_train_step": 33.917275190353394, "step": 1028}
{"train_info/time_between_train_steps": 0.005572319030761719, "step": 1028}
{"info/global_step": 1029, "train_info/time_within_train_step": 33.93394088745117, "step": 1029}
{"train_info/time_between_train_steps": 0.0055980682373046875, "step": 1029}
{"info/global_step": 1030, "train_info/time_within_train_step": 33.96735882759094, "step": 1030}
{"train_info/time_between_train_steps": 0.005948543548583984, "step": 1030}
{"info/global_step": 1031, "train_info/time_within_train_step": 33.9425904750824, "step": 1031}
{"train_info/time_between_train_steps": 0.005642414093017578, "step": 1031}
{"info/global_step": 1032, "train_info/time_within_train_step": 34.254334688186646, "step": 1032}
{"train_info/time_between_train_steps": 0.0065424442291259766, "step": 1032}
{"train_info/time_between_train_steps": 26.717602014541626, "step": 1032}
{"info/global_step": 1033, "train_info/time_within_train_step": 33.91817665100098, "step": 1033}
{"train_info/time_between_train_steps": 0.005706310272216797, "step": 1033}
{"info/global_step": 1034, "train_info/time_within_train_step": 34.193055629730225, "step": 1034}
{"train_info/time_between_train_steps": 0.0056972503662109375, "step": 1034}
{"info/global_step": 1035, "train_info/time_within_train_step": 33.97995066642761, "step": 1035}
{"train_info/time_between_train_steps": 0.010203361511230469, "step": 1035}
{"info/global_step": 1036, "train_info/time_within_train_step": 34.08863401412964, "step": 1036}
{"train_info/time_between_train_steps": 0.011229276657104492, "step": 1036}
{"info/global_step": 1037, "train_info/time_within_train_step": 33.909584045410156, "step": 1037}
{"train_info/time_between_train_steps": 0.005598306655883789, "step": 1037}
{"info/global_step": 1038, "train_info/time_within_train_step": 34.37515687942505, "step": 1038}
{"train_info/time_between_train_steps": 0.005750417709350586, "step": 1038}
{"info/global_step": 1039, "train_info/time_within_train_step": 33.99901103973389, "step": 1039}
{"train_info/time_between_train_steps": 0.005883693695068359, "step": 1039}
{"info/global_step": 1040, "train_info/time_within_train_step": 34.11225247383118, "step": 1040}
{"train_info/time_between_train_steps": 0.00560760498046875, "step": 1040}
{"info/global_step": 1041, "train_info/time_within_train_step": 33.992757081985474, "step": 1041}
{"train_info/time_between_train_steps": 0.010509967803955078, "step": 1041}
{"info/global_step": 1042, "train_info/time_within_train_step": 34.16673231124878, "step": 1042}
{"train_info/time_between_train_steps": 0.010033845901489258, "step": 1042}
{"info/global_step": 1043, "train_info/time_within_train_step": 33.93798303604126, "step": 1043}
{"train_info/time_between_train_steps": 0.006925344467163086, "step": 1043}
{"info/global_step": 1044, "train_info/time_within_train_step": 34.32095789909363, "step": 1044}
{"train_info/time_between_train_steps": 0.010180473327636719, "step": 1044}
{"info/global_step": 1045, "train_info/time_within_train_step": 34.136717796325684, "step": 1045}
{"train_info/time_between_train_steps": 0.005851030349731445, "step": 1045}
{"info/global_step": 1046, "train_info/time_within_train_step": 34.27866220474243, "step": 1046}
{"train_info/time_between_train_steps": 0.005891084671020508, "step": 1046}
{"info/global_step": 1047, "train_info/time_within_train_step": 34.2420289516449, "step": 1047}
{"train_info/time_between_train_steps": 0.009700775146484375, "step": 1047}
{"info/global_step": 1048, "train_info/time_within_train_step": 34.06551742553711, "step": 1048}
{"train_info/time_between_train_steps": 0.005887269973754883, "step": 1048}
{"info/global_step": 1049, "train_info/time_within_train_step": 33.972641944885254, "step": 1049}
{"train_info/time_between_train_steps": 0.008360862731933594, "step": 1049}
{"info/global_step": 1050, "train_info/time_within_train_step": 34.10671949386597, "step": 1050}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1734139868, "_runtime": 36642}, "step": 1050}
{"logs": {"train/loss": 2.202, "train/learning_rate": 8.333333333333333e-05, "train/epoch": 24.02, "_timestamp": 1734139868, "_runtime": 36642}, "step": 1050}
{"train_info/time_between_train_steps": 0.007729768753051758, "step": 1050}
{"info/global_step": 1051, "train_info/time_within_train_step": 33.987746238708496, "step": 1051}
{"train_info/time_between_train_steps": 0.011051654815673828, "step": 1051}
{"info/global_step": 1052, "train_info/time_within_train_step": 34.156229734420776, "step": 1052}
{"train_info/time_between_train_steps": 0.00643610954284668, "step": 1052}
{"info/global_step": 1053, "train_info/time_within_train_step": 34.076088428497314, "step": 1053}
{"train_info/time_between_train_steps": 0.010221481323242188, "step": 1053}
{"info/global_step": 1054, "train_info/time_within_train_step": 34.0594208240509, "step": 1054}
{"train_info/time_between_train_steps": 0.005877017974853516, "step": 1054}
{"info/global_step": 1055, "train_info/time_within_train_step": 33.93663454055786, "step": 1055}
{"train_info/time_between_train_steps": 0.0060694217681884766, "step": 1055}
{"info/global_step": 1056, "train_info/time_within_train_step": 34.04137325286865, "step": 1056}
{"train_info/time_between_train_steps": 0.011309623718261719, "step": 1056}
{"info/global_step": 1057, "train_info/time_within_train_step": 33.99544835090637, "step": 1057}
{"train_info/time_between_train_steps": 0.005651950836181641, "step": 1057}
{"info/global_step": 1058, "train_info/time_within_train_step": 33.938379764556885, "step": 1058}
{"train_info/time_between_train_steps": 0.0054340362548828125, "step": 1058}
{"info/global_step": 1059, "train_info/time_within_train_step": 33.90923023223877, "step": 1059}
{"train_info/time_between_train_steps": 0.005587339401245117, "step": 1059}
{"info/global_step": 1060, "train_info/time_within_train_step": 33.92139434814453, "step": 1060}
{"train_info/time_between_train_steps": 0.0057373046875, "step": 1060}
{"info/global_step": 1061, "train_info/time_within_train_step": 34.18470120429993, "step": 1061}
{"train_info/time_between_train_steps": 0.005749225616455078, "step": 1061}
{"info/global_step": 1062, "train_info/time_within_train_step": 34.14124131202698, "step": 1062}
{"train_info/time_between_train_steps": 0.007133007049560547, "step": 1062}
{"info/global_step": 1063, "train_info/time_within_train_step": 33.92502164840698, "step": 1063}
{"train_info/time_between_train_steps": 0.010812520980834961, "step": 1063}
{"info/global_step": 1064, "train_info/time_within_train_step": 34.000664472579956, "step": 1064}
{"train_info/time_between_train_steps": 0.006394863128662109, "step": 1064}
{"info/global_step": 1065, "train_info/time_within_train_step": 33.980124950408936, "step": 1065}
{"train_info/time_between_train_steps": 0.005570888519287109, "step": 1065}
{"info/global_step": 1066, "train_info/time_within_train_step": 33.92186260223389, "step": 1066}
{"train_info/time_between_train_steps": 0.005797386169433594, "step": 1066}
{"info/global_step": 1067, "train_info/time_within_train_step": 33.963494062423706, "step": 1067}
{"train_info/time_between_train_steps": 0.0058422088623046875, "step": 1067}
{"info/global_step": 1068, "train_info/time_within_train_step": 33.96771287918091, "step": 1068}
{"train_info/time_between_train_steps": 0.005781888961791992, "step": 1068}
{"info/global_step": 1069, "train_info/time_within_train_step": 33.91128492355347, "step": 1069}
{"train_info/time_between_train_steps": 0.005574226379394531, "step": 1069}
{"info/global_step": 1070, "train_info/time_within_train_step": 33.95173001289368, "step": 1070}
{"train_info/time_between_train_steps": 0.01025533676147461, "step": 1070}
{"info/global_step": 1071, "train_info/time_within_train_step": 33.920140504837036, "step": 1071}
{"train_info/time_between_train_steps": 0.0060460567474365234, "step": 1071}
{"info/global_step": 1072, "train_info/time_within_train_step": 33.92554974555969, "step": 1072}
{"train_info/time_between_train_steps": 0.005692005157470703, "step": 1072}
{"info/global_step": 1073, "train_info/time_within_train_step": 34.03243803977966, "step": 1073}
{"train_info/time_between_train_steps": 0.005765676498413086, "step": 1073}
{"info/global_step": 1074, "train_info/time_within_train_step": 34.135080099105835, "step": 1074}
{"train_info/time_between_train_steps": 0.010108709335327148, "step": 1074}
{"info/global_step": 1075, "train_info/time_within_train_step": 33.98382353782654, "step": 1075}
{"train_info/time_between_train_steps": 0.007024288177490234, "step": 1075}
{"train_info/time_between_train_steps": 26.74669051170349, "step": 1075}
{"info/global_step": 1076, "train_info/time_within_train_step": 33.976805210113525, "step": 1076}
{"train_info/time_between_train_steps": 0.005487203598022461, "step": 1076}
{"info/global_step": 1077, "train_info/time_within_train_step": 34.25062680244446, "step": 1077}
{"train_info/time_between_train_steps": 0.005434513092041016, "step": 1077}
{"info/global_step": 1078, "train_info/time_within_train_step": 33.94887924194336, "step": 1078}
{"train_info/time_between_train_steps": 0.015048503875732422, "step": 1078}
{"info/global_step": 1079, "train_info/time_within_train_step": 34.09612059593201, "step": 1079}
{"train_info/time_between_train_steps": 0.005859851837158203, "step": 1079}
{"info/global_step": 1080, "train_info/time_within_train_step": 33.94880175590515, "step": 1080}
{"train_info/time_between_train_steps": 0.005929708480834961, "step": 1080}
{"info/global_step": 1081, "train_info/time_within_train_step": 34.0843620300293, "step": 1081}
{"train_info/time_between_train_steps": 0.005727052688598633, "step": 1081}
{"info/global_step": 1082, "train_info/time_within_train_step": 33.96199369430542, "step": 1082}
{"train_info/time_between_train_steps": 0.005880832672119141, "step": 1082}
{"info/global_step": 1083, "train_info/time_within_train_step": 34.1620237827301, "step": 1083}
{"train_info/time_between_train_steps": 0.011062383651733398, "step": 1083}
{"info/global_step": 1084, "train_info/time_within_train_step": 33.95333695411682, "step": 1084}
{"train_info/time_between_train_steps": 0.010466575622558594, "step": 1084}
{"info/global_step": 1085, "train_info/time_within_train_step": 34.052128314971924, "step": 1085}
{"train_info/time_between_train_steps": 0.005671024322509766, "step": 1085}
{"info/global_step": 1086, "train_info/time_within_train_step": 33.92511057853699, "step": 1086}
{"train_info/time_between_train_steps": 0.0058519840240478516, "step": 1086}
{"info/global_step": 1087, "train_info/time_within_train_step": 34.08294343948364, "step": 1087}
{"train_info/time_between_train_steps": 0.005974531173706055, "step": 1087}
{"info/global_step": 1088, "train_info/time_within_train_step": 33.93109059333801, "step": 1088}
{"train_info/time_between_train_steps": 0.005727052688598633, "step": 1088}
{"info/global_step": 1089, "train_info/time_within_train_step": 34.061625242233276, "step": 1089}
{"train_info/time_between_train_steps": 0.005684614181518555, "step": 1089}
{"info/global_step": 1090, "train_info/time_within_train_step": 33.94662809371948, "step": 1090}
{"train_info/time_between_train_steps": 0.0059261322021484375, "step": 1090}
{"info/global_step": 1091, "train_info/time_within_train_step": 34.09079170227051, "step": 1091}
{"train_info/time_between_train_steps": 0.006386995315551758, "step": 1091}
{"info/global_step": 1092, "train_info/time_within_train_step": 33.97335076332092, "step": 1092}
{"train_info/time_between_train_steps": 0.005837440490722656, "step": 1092}
{"info/global_step": 1093, "train_info/time_within_train_step": 34.260239601135254, "step": 1093}
{"train_info/time_between_train_steps": 0.010686397552490234, "step": 1093}
{"info/global_step": 1094, "train_info/time_within_train_step": 34.03615856170654, "step": 1094}
{"train_info/time_between_train_steps": 0.010545730590820312, "step": 1094}
{"info/global_step": 1095, "train_info/time_within_train_step": 34.4882550239563, "step": 1095}
{"train_info/time_between_train_steps": 0.00928044319152832, "step": 1095}
{"info/global_step": 1096, "train_info/time_within_train_step": 33.958274364471436, "step": 1096}
{"train_info/time_between_train_steps": 0.0055713653564453125, "step": 1096}
{"info/global_step": 1097, "train_info/time_within_train_step": 34.06031155586243, "step": 1097}
{"train_info/time_between_train_steps": 0.005835771560668945, "step": 1097}
{"info/global_step": 1098, "train_info/time_within_train_step": 34.070141553878784, "step": 1098}
{"train_info/time_between_train_steps": 0.007073879241943359, "step": 1098}
{"info/global_step": 1099, "train_info/time_within_train_step": 34.243091106414795, "step": 1099}
{"train_info/time_between_train_steps": 0.006014347076416016, "step": 1099}
{"info/global_step": 1100, "train_info/time_within_train_step": 33.97498536109924, "step": 1100}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1734141596, "_runtime": 38370}, "step": 1100}
{"logs": {"train/loss": 2.1818, "train/learning_rate": 5.5555555555555545e-05, "train/epoch": 25.02, "_timestamp": 1734141596, "_runtime": 38370}, "step": 1100}
{"train_info/time_between_train_steps": 2.421398162841797, "step": 1100}
{"info/global_step": 1101, "train_info/time_within_train_step": 33.93361473083496, "step": 1101}
{"train_info/time_between_train_steps": 0.010723114013671875, "step": 1101}
{"info/global_step": 1102, "train_info/time_within_train_step": 33.966546058654785, "step": 1102}
{"train_info/time_between_train_steps": 0.005817890167236328, "step": 1102}
{"info/global_step": 1103, "train_info/time_within_train_step": 33.944666147232056, "step": 1103}
{"train_info/time_between_train_steps": 0.006685733795166016, "step": 1103}
{"info/global_step": 1104, "train_info/time_within_train_step": 33.96061849594116, "step": 1104}
{"train_info/time_between_train_steps": 0.005834102630615234, "step": 1104}
{"info/global_step": 1105, "train_info/time_within_train_step": 33.96911549568176, "step": 1105}
{"train_info/time_between_train_steps": 0.005860328674316406, "step": 1105}
{"info/global_step": 1106, "train_info/time_within_train_step": 33.93296241760254, "step": 1106}
{"train_info/time_between_train_steps": 0.0059452056884765625, "step": 1106}
{"info/global_step": 1107, "train_info/time_within_train_step": 33.95451998710632, "step": 1107}
{"train_info/time_between_train_steps": 0.005558967590332031, "step": 1107}
{"info/global_step": 1108, "train_info/time_within_train_step": 34.24998998641968, "step": 1108}
{"train_info/time_between_train_steps": 0.005654096603393555, "step": 1108}
{"info/global_step": 1109, "train_info/time_within_train_step": 33.949851512908936, "step": 1109}
{"train_info/time_between_train_steps": 0.006324291229248047, "step": 1109}
{"info/global_step": 1110, "train_info/time_within_train_step": 33.934459924697876, "step": 1110}
{"train_info/time_between_train_steps": 0.010651111602783203, "step": 1110}
{"info/global_step": 1111, "train_info/time_within_train_step": 34.0303897857666, "step": 1111}
{"train_info/time_between_train_steps": 0.010488748550415039, "step": 1111}
{"info/global_step": 1112, "train_info/time_within_train_step": 33.925400257110596, "step": 1112}
{"train_info/time_between_train_steps": 0.0057713985443115234, "step": 1112}
{"info/global_step": 1113, "train_info/time_within_train_step": 33.985668659210205, "step": 1113}
{"train_info/time_between_train_steps": 0.011486530303955078, "step": 1113}
{"info/global_step": 1114, "train_info/time_within_train_step": 33.93440628051758, "step": 1114}
{"train_info/time_between_train_steps": 0.005741119384765625, "step": 1114}
{"info/global_step": 1115, "train_info/time_within_train_step": 33.92906069755554, "step": 1115}
{"train_info/time_between_train_steps": 0.0055162906646728516, "step": 1115}
{"info/global_step": 1116, "train_info/time_within_train_step": 33.9394326210022, "step": 1116}
{"train_info/time_between_train_steps": 0.005952596664428711, "step": 1116}
{"info/global_step": 1117, "train_info/time_within_train_step": 34.193798303604126, "step": 1117}
{"train_info/time_between_train_steps": 0.006186723709106445, "step": 1117}
{"info/global_step": 1118, "train_info/time_within_train_step": 33.98376250267029, "step": 1118}
{"train_info/time_between_train_steps": 0.006599903106689453, "step": 1118}
{"train_info/time_between_train_steps": 26.4100821018219, "step": 1118}
{"info/global_step": 1119, "train_info/time_within_train_step": 33.92854309082031, "step": 1119}
{"train_info/time_between_train_steps": 0.0061609745025634766, "step": 1119}
{"info/global_step": 1120, "train_info/time_within_train_step": 34.22250413894653, "step": 1120}
{"train_info/time_between_train_steps": 0.010968685150146484, "step": 1120}
{"info/global_step": 1121, "train_info/time_within_train_step": 33.98474478721619, "step": 1121}
{"train_info/time_between_train_steps": 0.006304025650024414, "step": 1121}
{"info/global_step": 1122, "train_info/time_within_train_step": 34.155330181121826, "step": 1122}
{"train_info/time_between_train_steps": 0.005757570266723633, "step": 1122}
{"info/global_step": 1123, "train_info/time_within_train_step": 34.41145610809326, "step": 1123}
{"train_info/time_between_train_steps": 0.010128498077392578, "step": 1123}
{"info/global_step": 1124, "train_info/time_within_train_step": 34.10151147842407, "step": 1124}
{"train_info/time_between_train_steps": 0.011728525161743164, "step": 1124}
{"info/global_step": 1125, "train_info/time_within_train_step": 33.98994016647339, "step": 1125}
{"train_info/time_between_train_steps": 0.005980968475341797, "step": 1125}
{"info/global_step": 1126, "train_info/time_within_train_step": 34.14987254142761, "step": 1126}
{"train_info/time_between_train_steps": 0.005822658538818359, "step": 1126}
{"info/global_step": 1127, "train_info/time_within_train_step": 33.9594190120697, "step": 1127}
{"train_info/time_between_train_steps": 0.005812168121337891, "step": 1127}
{"info/global_step": 1128, "train_info/time_within_train_step": 34.06180381774902, "step": 1128}
{"train_info/time_between_train_steps": 0.005641937255859375, "step": 1128}
{"info/global_step": 1129, "train_info/time_within_train_step": 33.98486351966858, "step": 1129}
{"train_info/time_between_train_steps": 0.00588679313659668, "step": 1129}
{"info/global_step": 1130, "train_info/time_within_train_step": 34.1574866771698, "step": 1130}
{"train_info/time_between_train_steps": 0.005916118621826172, "step": 1130}
{"info/global_step": 1131, "train_info/time_within_train_step": 33.91718077659607, "step": 1131}
{"train_info/time_between_train_steps": 0.0058858394622802734, "step": 1131}
{"info/global_step": 1132, "train_info/time_within_train_step": 34.086122274398804, "step": 1132}
{"train_info/time_between_train_steps": 0.0056667327880859375, "step": 1132}
{"info/global_step": 1133, "train_info/time_within_train_step": 33.99027967453003, "step": 1133}
{"train_info/time_between_train_steps": 0.006078481674194336, "step": 1133}
{"info/global_step": 1134, "train_info/time_within_train_step": 34.124074935913086, "step": 1134}
{"train_info/time_between_train_steps": 0.005882978439331055, "step": 1134}
{"info/global_step": 1135, "train_info/time_within_train_step": 33.91106462478638, "step": 1135}
{"train_info/time_between_train_steps": 0.0056836605072021484, "step": 1135}
{"info/global_step": 1136, "train_info/time_within_train_step": 34.05653119087219, "step": 1136}
{"train_info/time_between_train_steps": 0.006300687789916992, "step": 1136}
{"info/global_step": 1137, "train_info/time_within_train_step": 33.943588972091675, "step": 1137}
{"train_info/time_between_train_steps": 0.006128549575805664, "step": 1137}
{"info/global_step": 1138, "train_info/time_within_train_step": 34.09567618370056, "step": 1138}
{"train_info/time_between_train_steps": 0.005890846252441406, "step": 1138}
{"info/global_step": 1139, "train_info/time_within_train_step": 34.17840504646301, "step": 1139}
{"train_info/time_between_train_steps": 0.005949258804321289, "step": 1139}
{"info/global_step": 1140, "train_info/time_within_train_step": 34.06473994255066, "step": 1140}
{"train_info/time_between_train_steps": 0.006079673767089844, "step": 1140}
{"info/global_step": 1141, "train_info/time_within_train_step": 33.952765703201294, "step": 1141}
{"train_info/time_between_train_steps": 0.006175041198730469, "step": 1141}
{"info/global_step": 1142, "train_info/time_within_train_step": 34.00036835670471, "step": 1142}
{"train_info/time_between_train_steps": 0.010681390762329102, "step": 1142}
{"info/global_step": 1143, "train_info/time_within_train_step": 33.96709132194519, "step": 1143}
{"train_info/time_between_train_steps": 0.005591154098510742, "step": 1143}
{"info/global_step": 1144, "train_info/time_within_train_step": 33.91551089286804, "step": 1144}
{"train_info/time_between_train_steps": 0.00554203987121582, "step": 1144}
{"info/global_step": 1145, "train_info/time_within_train_step": 33.92208385467529, "step": 1145}
{"train_info/time_between_train_steps": 0.005677938461303711, "step": 1145}
{"info/global_step": 1146, "train_info/time_within_train_step": 33.957175493240356, "step": 1146}
{"train_info/time_between_train_steps": 0.010330915451049805, "step": 1146}
{"info/global_step": 1147, "train_info/time_within_train_step": 33.91388916969299, "step": 1147}
{"train_info/time_between_train_steps": 0.01036381721496582, "step": 1147}
{"info/global_step": 1148, "train_info/time_within_train_step": 33.943175077438354, "step": 1148}
{"train_info/time_between_train_steps": 0.005673408508300781, "step": 1148}
{"info/global_step": 1149, "train_info/time_within_train_step": 33.96632194519043, "step": 1149}
{"train_info/time_between_train_steps": 0.006025075912475586, "step": 1149}
{"info/global_step": 1150, "train_info/time_within_train_step": 33.95074677467346, "step": 1150}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1734143326, "_runtime": 40100}, "step": 1150}
{"logs": {"train/loss": 2.1639, "train/learning_rate": 2.7777777777777772e-05, "train/epoch": 26.03, "_timestamp": 1734143326, "_runtime": 40100}, "step": 1150}
{"train_info/time_between_train_steps": 0.007605314254760742, "step": 1150}
{"info/global_step": 1151, "train_info/time_within_train_step": 33.91352295875549, "step": 1151}
{"train_info/time_between_train_steps": 0.0055501461029052734, "step": 1151}
{"info/global_step": 1152, "train_info/time_within_train_step": 33.97094655036926, "step": 1152}
{"train_info/time_between_train_steps": 0.006044149398803711, "step": 1152}
{"info/global_step": 1153, "train_info/time_within_train_step": 33.93713665008545, "step": 1153}
{"train_info/time_between_train_steps": 0.0055446624755859375, "step": 1153}
{"info/global_step": 1154, "train_info/time_within_train_step": 34.13758897781372, "step": 1154}
{"train_info/time_between_train_steps": 0.005766630172729492, "step": 1154}
{"info/global_step": 1155, "train_info/time_within_train_step": 33.94569778442383, "step": 1155}
{"train_info/time_between_train_steps": 0.005822658538818359, "step": 1155}
{"info/global_step": 1156, "train_info/time_within_train_step": 33.94386315345764, "step": 1156}
{"train_info/time_between_train_steps": 0.010448455810546875, "step": 1156}
{"info/global_step": 1157, "train_info/time_within_train_step": 33.963223934173584, "step": 1157}
{"train_info/time_between_train_steps": 0.010445356369018555, "step": 1157}
{"info/global_step": 1158, "train_info/time_within_train_step": 33.930869817733765, "step": 1158}
{"train_info/time_between_train_steps": 0.005746364593505859, "step": 1158}
{"info/global_step": 1159, "train_info/time_within_train_step": 33.95359396934509, "step": 1159}
{"train_info/time_between_train_steps": 0.00604701042175293, "step": 1159}
{"info/global_step": 1160, "train_info/time_within_train_step": 33.956098318099976, "step": 1160}
{"train_info/time_between_train_steps": 0.005871295928955078, "step": 1160}
{"info/global_step": 1161, "train_info/time_within_train_step": 33.982966899871826, "step": 1161}
{"train_info/time_between_train_steps": 0.006842136383056641, "step": 1161}
{"train_info/time_between_train_steps": 26.51215171813965, "step": 1161}
{"info/global_step": 1162, "train_info/time_within_train_step": 33.911837339401245, "step": 1162}
{"train_info/time_between_train_steps": 0.0054357051849365234, "step": 1162}
{"info/global_step": 1163, "train_info/time_within_train_step": 34.14310359954834, "step": 1163}
{"train_info/time_between_train_steps": 0.00691533088684082, "step": 1163}
{"info/global_step": 1164, "train_info/time_within_train_step": 34.07083296775818, "step": 1164}
{"train_info/time_between_train_steps": 0.011109352111816406, "step": 1164}
{"info/global_step": 1165, "train_info/time_within_train_step": 34.38593316078186, "step": 1165}
{"train_info/time_between_train_steps": 0.006134748458862305, "step": 1165}
{"info/global_step": 1166, "train_info/time_within_train_step": 33.97422981262207, "step": 1166}
{"train_info/time_between_train_steps": 0.005887746810913086, "step": 1166}
{"info/global_step": 1167, "train_info/time_within_train_step": 34.09808945655823, "step": 1167}
{"train_info/time_between_train_steps": 0.006094455718994141, "step": 1167}
{"info/global_step": 1168, "train_info/time_within_train_step": 33.97538781166077, "step": 1168}
{"train_info/time_between_train_steps": 0.0058345794677734375, "step": 1168}
{"info/global_step": 1169, "train_info/time_within_train_step": 34.44387674331665, "step": 1169}
{"train_info/time_between_train_steps": 0.0057926177978515625, "step": 1169}
{"info/global_step": 1170, "train_info/time_within_train_step": 33.943424224853516, "step": 1170}
{"train_info/time_between_train_steps": 0.00567936897277832, "step": 1170}
{"info/global_step": 1171, "train_info/time_within_train_step": 34.10338521003723, "step": 1171}
{"train_info/time_between_train_steps": 0.006022930145263672, "step": 1171}
{"info/global_step": 1172, "train_info/time_within_train_step": 33.93301320075989, "step": 1172}
{"train_info/time_between_train_steps": 0.005946159362792969, "step": 1172}
{"info/global_step": 1173, "train_info/time_within_train_step": 34.07112145423889, "step": 1173}
{"train_info/time_between_train_steps": 0.005932807922363281, "step": 1173}
{"info/global_step": 1174, "train_info/time_within_train_step": 34.13752484321594, "step": 1174}
{"train_info/time_between_train_steps": 0.011135101318359375, "step": 1174}
{"info/global_step": 1175, "train_info/time_within_train_step": 34.109928607940674, "step": 1175}
{"train_info/time_between_train_steps": 0.00574183464050293, "step": 1175}
{"info/global_step": 1176, "train_info/time_within_train_step": 33.967544078826904, "step": 1176}
{"train_info/time_between_train_steps": 0.005814313888549805, "step": 1176}
{"info/global_step": 1177, "train_info/time_within_train_step": 34.20954751968384, "step": 1177}
{"train_info/time_between_train_steps": 0.006097316741943359, "step": 1177}
{"info/global_step": 1178, "train_info/time_within_train_step": 33.95464873313904, "step": 1178}
{"train_info/time_between_train_steps": 0.005797624588012695, "step": 1178}
{"info/global_step": 1179, "train_info/time_within_train_step": 34.07373666763306, "step": 1179}
{"train_info/time_between_train_steps": 0.0058269500732421875, "step": 1179}
{"info/global_step": 1180, "train_info/time_within_train_step": 33.97344779968262, "step": 1180}
{"train_info/time_between_train_steps": 0.006049394607543945, "step": 1180}
{"info/global_step": 1181, "train_info/time_within_train_step": 34.23436999320984, "step": 1181}
{"train_info/time_between_train_steps": 0.010298728942871094, "step": 1181}
{"info/global_step": 1182, "train_info/time_within_train_step": 33.94318747520447, "step": 1182}
{"train_info/time_between_train_steps": 0.010552644729614258, "step": 1182}
{"info/global_step": 1183, "train_info/time_within_train_step": 34.08762717247009, "step": 1183}
{"train_info/time_between_train_steps": 0.005980253219604492, "step": 1183}
{"info/global_step": 1184, "train_info/time_within_train_step": 34.01844024658203, "step": 1184}
{"train_info/time_between_train_steps": 0.0064694881439208984, "step": 1184}
{"info/global_step": 1185, "train_info/time_within_train_step": 34.24541759490967, "step": 1185}
{"train_info/time_between_train_steps": 0.010681390762329102, "step": 1185}
{"info/global_step": 1186, "train_info/time_within_train_step": 34.007827043533325, "step": 1186}
{"train_info/time_between_train_steps": 0.005646467208862305, "step": 1186}
{"info/global_step": 1187, "train_info/time_within_train_step": 33.935630321502686, "step": 1187}
{"train_info/time_between_train_steps": 0.005785465240478516, "step": 1187}
{"info/global_step": 1188, "train_info/time_within_train_step": 33.94897747039795, "step": 1188}
{"train_info/time_between_train_steps": 0.009077787399291992, "step": 1188}
{"info/global_step": 1189, "train_info/time_within_train_step": 33.936394453048706, "step": 1189}
{"train_info/time_between_train_steps": 0.005663394927978516, "step": 1189}
{"info/global_step": 1190, "train_info/time_within_train_step": 33.942760705947876, "step": 1190}
{"train_info/time_between_train_steps": 0.005837678909301758, "step": 1190}
{"info/global_step": 1191, "train_info/time_within_train_step": 33.939635038375854, "step": 1191}
{"train_info/time_between_train_steps": 0.006777048110961914, "step": 1191}
{"info/global_step": 1192, "train_info/time_within_train_step": 33.94094133377075, "step": 1192}
{"train_info/time_between_train_steps": 0.00556492805480957, "step": 1192}
{"info/global_step": 1193, "train_info/time_within_train_step": 33.940455198287964, "step": 1193}
{"train_info/time_between_train_steps": 0.005598783493041992, "step": 1193}
{"info/global_step": 1194, "train_info/time_within_train_step": 33.965275287628174, "step": 1194}
{"train_info/time_between_train_steps": 0.005690097808837891, "step": 1194}
{"info/global_step": 1195, "train_info/time_within_train_step": 33.92872095108032, "step": 1195}
{"train_info/time_between_train_steps": 0.011001110076904297, "step": 1195}
{"info/global_step": 1196, "train_info/time_within_train_step": 33.919358015060425, "step": 1196}
{"train_info/time_between_train_steps": 0.005690574645996094, "step": 1196}
{"info/global_step": 1197, "train_info/time_within_train_step": 34.02172517776489, "step": 1197}
{"train_info/time_between_train_steps": 0.00576019287109375, "step": 1197}
{"info/global_step": 1198, "train_info/time_within_train_step": 33.94172286987305, "step": 1198}
{"train_info/time_between_train_steps": 0.005869865417480469, "step": 1198}
{"info/global_step": 1199, "train_info/time_within_train_step": 33.94505429267883, "step": 1199}
{"train_info/time_between_train_steps": 0.005688190460205078, "step": 1199}
{"info/global_step": 1200, "train_info/time_within_train_step": 33.93799662590027, "step": 1200}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1734145054, "_runtime": 41828}, "step": 1200}
{"logs": {"train/loss": 2.1505, "train/learning_rate": 0.0, "train/epoch": 27.03, "_timestamp": 1734145054, "_runtime": 41828}, "step": 1200}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1734145057, "_runtime": 41831}, "step": 1200}
{"logs": {"train/train_runtime": 41831.4796, "train/train_samples_per_second": 14.688, "train/train_steps_per_second": 0.029, "train/total_flos": 3.25971739017216e+17, "train/train_loss": 2.9837031372388205, "train/epoch": 27.03, "_timestamp": 1734145057, "_runtime": 41831}, "step": 1200}
{"train_info": {"train_info/memory_allocated": 1922.4453125, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1734145061, "_runtime": 41835}, "step": 1200}
{"logs": {"eval/loss": 2.6705334186553955, "eval/runtime": 3.9142, "eval/samples_per_second": 41.643, "eval/steps_per_second": 2.81, "train/epoch": 27.03, "_timestamp": 1734145061, "_runtime": 41835}, "step": 1200}
{"train_info": {"train_info/memory_allocated": 1922.4453125, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1734145061, "_runtime": 41835}, "step": 1200}
{"logs": {"eval//local/xiulyang/mission-impossible-language-models/training/babylm_dataset.py_loss": 2.6705334186553955, "eval//local/xiulyang/mission-impossible-language-models/training/babylm_dataset.py_ppl": 14.447673796460634, "eval//local/xiulyang/mission-impossible-language-models/training/babylm_dataset.py_runtime": 3.9142, "eval//local/xiulyang/mission-impossible-language-models/training/babylm_dataset.py_samples_per_second": 41.643, "train/epoch": 27.03, "_timestamp": 1734145061, "_runtime": 41835}, "step": 1200}