diff --git "a/metrics.json" "b/metrics.json" new file mode 100644--- /dev/null +++ "b/metrics.json" @@ -0,0 +1,6144 @@ +{"num_parameters": 108882432, "trainable_parameters": 108882432, "step": 0} +{"train_info/time_between_train_steps": 2.3095357418060303, "step": 0} +{"info/global_step": 1, "train_info/time_within_train_step": 4.7620849609375, "step": 1} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 4412.87744140625, "train_info/memory_reserved": 4642.0, "train_info/memory_max_reserved": 4642.0, "_timestamp": 1746203256, "_runtime": 28}, "step": 1} +{"logs": {"train/loss": 10.2942, "train/learning_rate": 2e-06, "train/epoch": 0.0, "_timestamp": 1746203256, "_runtime": 28}, "step": 1} +{"train_info/time_between_train_steps": 0.02449512481689453, "step": 1} +{"info/global_step": 2, "train_info/time_within_train_step": 2.4327449798583984, "step": 2} +{"train_info/time_between_train_steps": 0.0035254955291748047, "step": 2} +{"info/global_step": 3, "train_info/time_within_train_step": 2.4369704723358154, "step": 3} +{"train_info/time_between_train_steps": 0.0035636425018310547, "step": 3} +{"info/global_step": 4, "train_info/time_within_train_step": 2.440464973449707, "step": 4} +{"train_info/time_between_train_steps": 0.0035486221313476562, "step": 4} +{"info/global_step": 5, "train_info/time_within_train_step": 2.4436657428741455, "step": 5} +{"train_info/time_between_train_steps": 0.003805398941040039, "step": 5} +{"info/global_step": 6, "train_info/time_within_train_step": 2.44313645362854, "step": 6} +{"train_info/time_between_train_steps": 0.0038051605224609375, "step": 6} +{"info/global_step": 7, "train_info/time_within_train_step": 2.4456143379211426, "step": 7} +{"train_info/time_between_train_steps": 0.0037441253662109375, "step": 7} +{"info/global_step": 8, "train_info/time_within_train_step": 2.4601821899414062, "step": 8} +{"train_info/time_between_train_steps": 0.003785371780395508, "step": 8} +{"info/global_step": 9, "train_info/time_within_train_step": 2.457118511199951, "step": 9} +{"train_info/time_between_train_steps": 0.0037212371826171875, "step": 9} +{"info/global_step": 10, "train_info/time_within_train_step": 2.4583563804626465, "step": 10} +{"train_info/time_between_train_steps": 0.003732919692993164, "step": 10} +{"info/global_step": 11, "train_info/time_within_train_step": 2.458862781524658, "step": 11} +{"train_info/time_between_train_steps": 0.0037279129028320312, "step": 11} +{"info/global_step": 12, "train_info/time_within_train_step": 2.5850377082824707, "step": 12} +{"train_info/time_between_train_steps": 0.003770589828491211, "step": 12} +{"info/global_step": 13, "train_info/time_within_train_step": 2.6638383865356445, "step": 13} +{"train_info/time_between_train_steps": 0.0037260055541992188, "step": 13} +{"info/global_step": 14, "train_info/time_within_train_step": 2.662461757659912, "step": 14} +{"train_info/time_between_train_steps": 0.003740549087524414, "step": 14} +{"info/global_step": 15, "train_info/time_within_train_step": 2.6663665771484375, "step": 15} +{"train_info/time_between_train_steps": 0.003741025924682617, "step": 15} +{"info/global_step": 16, "train_info/time_within_train_step": 2.671712636947632, "step": 16} +{"train_info/time_between_train_steps": 0.00402069091796875, "step": 16} +{"info/global_step": 17, "train_info/time_within_train_step": 2.6782314777374268, "step": 17} +{"train_info/time_between_train_steps": 0.0038099288940429688, "step": 17} +{"info/global_step": 18, "train_info/time_within_train_step": 2.6749656200408936, "step": 18} +{"train_info/time_between_train_steps": 0.0037415027618408203, "step": 18} +{"info/global_step": 19, "train_info/time_within_train_step": 2.6738333702087402, "step": 19} +{"train_info/time_between_train_steps": 0.003767728805541992, "step": 19} +{"info/global_step": 20, "train_info/time_within_train_step": 2.6751608848571777, "step": 20} +{"train_info/time_between_train_steps": 0.0038280487060546875, "step": 20} +{"info/global_step": 21, "train_info/time_within_train_step": 2.675354480743408, "step": 21} +{"train_info/time_between_train_steps": 0.0037262439727783203, "step": 21} +{"info/global_step": 22, "train_info/time_within_train_step": 2.6766891479492188, "step": 22} +{"train_info/time_between_train_steps": 0.0037391185760498047, "step": 22} +{"info/global_step": 23, "train_info/time_within_train_step": 2.675642251968384, "step": 23} +{"train_info/time_between_train_steps": 0.0037441253662109375, "step": 23} +{"info/global_step": 24, "train_info/time_within_train_step": 2.6771345138549805, "step": 24} +{"train_info/time_between_train_steps": 0.0038764476776123047, "step": 24} +{"info/global_step": 25, "train_info/time_within_train_step": 2.6758639812469482, "step": 25} +{"train_info/time_between_train_steps": 0.0037326812744140625, "step": 25} +{"info/global_step": 26, "train_info/time_within_train_step": 2.674818277359009, "step": 26} +{"train_info/time_between_train_steps": 0.003694772720336914, "step": 26} +{"info/global_step": 27, "train_info/time_within_train_step": 2.673687696456909, "step": 27} +{"train_info/time_between_train_steps": 0.0037729740142822266, "step": 27} +{"info/global_step": 28, "train_info/time_within_train_step": 2.674609899520874, "step": 28} +{"train_info/time_between_train_steps": 0.003712892532348633, "step": 28} +{"info/global_step": 29, "train_info/time_within_train_step": 2.6759581565856934, "step": 29} +{"train_info/time_between_train_steps": 0.0037534236907958984, "step": 29} +{"info/global_step": 30, "train_info/time_within_train_step": 2.6742756366729736, "step": 30} +{"train_info/time_between_train_steps": 0.0038259029388427734, "step": 30} +{"info/global_step": 31, "train_info/time_within_train_step": 2.6743245124816895, "step": 31} +{"train_info/time_between_train_steps": 0.0037004947662353516, "step": 31} +{"info/global_step": 32, "train_info/time_within_train_step": 2.673260450363159, "step": 32} +{"train_info/time_between_train_steps": 0.003713846206665039, "step": 32} +{"info/global_step": 33, "train_info/time_within_train_step": 2.674147605895996, "step": 33} +{"train_info/time_between_train_steps": 0.003704071044921875, "step": 33} +{"info/global_step": 34, "train_info/time_within_train_step": 2.673579454421997, "step": 34} +{"train_info/time_between_train_steps": 0.003753662109375, "step": 34} +{"info/global_step": 35, "train_info/time_within_train_step": 2.67448091506958, "step": 35} +{"train_info/time_between_train_steps": 0.003812074661254883, "step": 35} +{"info/global_step": 36, "train_info/time_within_train_step": 2.6742849349975586, "step": 36} +{"train_info/time_between_train_steps": 0.0036551952362060547, "step": 36} +{"info/global_step": 37, "train_info/time_within_train_step": 2.674428701400757, "step": 37} +{"train_info/time_between_train_steps": 0.003710031509399414, "step": 37} +{"info/global_step": 38, "train_info/time_within_train_step": 2.6741087436676025, "step": 38} +{"train_info/time_between_train_steps": 0.0037305355072021484, "step": 38} +{"info/global_step": 39, "train_info/time_within_train_step": 2.6734626293182373, "step": 39} +{"train_info/time_between_train_steps": 0.0036983489990234375, "step": 39} +{"info/global_step": 40, "train_info/time_within_train_step": 2.674689292907715, "step": 40} +{"train_info/time_between_train_steps": 0.003752470016479492, "step": 40} +{"info/global_step": 41, "train_info/time_within_train_step": 2.6731157302856445, "step": 41} +{"train_info/time_between_train_steps": 0.003764629364013672, "step": 41} +{"info/global_step": 42, "train_info/time_within_train_step": 2.6732141971588135, "step": 42} +{"train_info/time_between_train_steps": 0.003650665283203125, "step": 42} +{"info/global_step": 43, "train_info/time_within_train_step": 2.6734602451324463, "step": 43} +{"train_info/time_between_train_steps": 0.0037086009979248047, "step": 43} +{"info/global_step": 44, "train_info/time_within_train_step": 2.673903703689575, "step": 44} +{"train_info/time_between_train_steps": 0.003713846206665039, "step": 44} +{"info/global_step": 45, "train_info/time_within_train_step": 2.673090934753418, "step": 45} +{"train_info/time_between_train_steps": 0.0037407875061035156, "step": 45} +{"info/global_step": 46, "train_info/time_within_train_step": 2.6740119457244873, "step": 46} +{"train_info/time_between_train_steps": 0.0036745071411132812, "step": 46} +{"info/global_step": 47, "train_info/time_within_train_step": 2.674269199371338, "step": 47} +{"train_info/time_between_train_steps": 0.003673076629638672, "step": 47} +{"info/global_step": 48, "train_info/time_within_train_step": 2.6740705966949463, "step": 48} +{"train_info/time_between_train_steps": 0.003756284713745117, "step": 48} +{"info/global_step": 49, "train_info/time_within_train_step": 2.674374580383301, "step": 49} +{"train_info/time_between_train_steps": 0.0036973953247070312, "step": 49} +{"info/global_step": 50, "train_info/time_within_train_step": 2.673729181289673, "step": 50} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746203386, "_runtime": 158}, "step": 50} +{"logs": {"train/loss": 8.3356, "train/learning_rate": 9.999999999999999e-05, "train/epoch": 0.02, "_timestamp": 1746203386, "_runtime": 158}, "step": 50} +{"train_info/time_between_train_steps": 0.02401137351989746, "step": 50} +{"info/global_step": 51, "train_info/time_within_train_step": 3.042022943496704, "step": 51} +{"train_info/time_between_train_steps": 0.003593921661376953, "step": 51} +{"info/global_step": 52, "train_info/time_within_train_step": 2.6738550662994385, "step": 52} +{"train_info/time_between_train_steps": 0.0034792423248291016, "step": 52} +{"info/global_step": 53, "train_info/time_within_train_step": 2.677279472351074, "step": 53} +{"train_info/time_between_train_steps": 0.0034465789794921875, "step": 53} +{"info/global_step": 54, "train_info/time_within_train_step": 2.67323637008667, "step": 54} +{"train_info/time_between_train_steps": 0.003474712371826172, "step": 54} +{"info/global_step": 55, "train_info/time_within_train_step": 2.6733579635620117, "step": 55} +{"train_info/time_between_train_steps": 0.0034084320068359375, "step": 55} +{"info/global_step": 56, "train_info/time_within_train_step": 2.672527313232422, "step": 56} +{"train_info/time_between_train_steps": 0.0034508705139160156, "step": 56} +{"info/global_step": 57, "train_info/time_within_train_step": 2.673602342605591, "step": 57} +{"train_info/time_between_train_steps": 0.003461122512817383, "step": 57} +{"info/global_step": 58, "train_info/time_within_train_step": 2.672050952911377, "step": 58} +{"train_info/time_between_train_steps": 0.0034666061401367188, "step": 58} +{"info/global_step": 59, "train_info/time_within_train_step": 2.672114849090576, "step": 59} +{"train_info/time_between_train_steps": 0.003421783447265625, "step": 59} +{"info/global_step": 60, "train_info/time_within_train_step": 2.6725659370422363, "step": 60} +{"train_info/time_between_train_steps": 0.003496885299682617, "step": 60} +{"info/global_step": 61, "train_info/time_within_train_step": 2.674790859222412, "step": 61} +{"train_info/time_between_train_steps": 0.003468751907348633, "step": 61} +{"info/global_step": 62, "train_info/time_within_train_step": 2.6732065677642822, "step": 62} +{"train_info/time_between_train_steps": 0.003482818603515625, "step": 62} +{"info/global_step": 63, "train_info/time_within_train_step": 2.8366661071777344, "step": 63} +{"train_info/time_between_train_steps": 0.0036983489990234375, "step": 63} +{"info/global_step": 64, "train_info/time_within_train_step": 2.6742806434631348, "step": 64} +{"train_info/time_between_train_steps": 0.003624439239501953, "step": 64} +{"info/global_step": 65, "train_info/time_within_train_step": 2.674879550933838, "step": 65} +{"train_info/time_between_train_steps": 0.0037300586700439453, "step": 65} +{"info/global_step": 66, "train_info/time_within_train_step": 2.6743862628936768, "step": 66} +{"train_info/time_between_train_steps": 0.0036890506744384766, "step": 66} +{"info/global_step": 67, "train_info/time_within_train_step": 2.674596071243286, "step": 67} +{"train_info/time_between_train_steps": 0.0036270618438720703, "step": 67} +{"info/global_step": 68, "train_info/time_within_train_step": 2.673957586288452, "step": 68} +{"train_info/time_between_train_steps": 0.0036590099334716797, "step": 68} +{"info/global_step": 69, "train_info/time_within_train_step": 2.6785480976104736, "step": 69} +{"train_info/time_between_train_steps": 0.0036225318908691406, "step": 69} +{"info/global_step": 70, "train_info/time_within_train_step": 2.6753551959991455, "step": 70} +{"train_info/time_between_train_steps": 0.003707408905029297, "step": 70} +{"info/global_step": 71, "train_info/time_within_train_step": 2.6741390228271484, "step": 71} +{"train_info/time_between_train_steps": 0.003637075424194336, "step": 71} +{"info/global_step": 72, "train_info/time_within_train_step": 2.6727652549743652, "step": 72} +{"train_info/time_between_train_steps": 0.0035839080810546875, "step": 72} +{"info/global_step": 73, "train_info/time_within_train_step": 2.67364239692688, "step": 73} +{"train_info/time_between_train_steps": 0.003718137741088867, "step": 73} +{"info/global_step": 74, "train_info/time_within_train_step": 2.673227548599243, "step": 74} +{"train_info/time_between_train_steps": 0.003569364547729492, "step": 74} +{"info/global_step": 75, "train_info/time_within_train_step": 2.673940658569336, "step": 75} +{"train_info/time_between_train_steps": 0.003712892532348633, "step": 75} +{"info/global_step": 76, "train_info/time_within_train_step": 2.673243284225464, "step": 76} +{"train_info/time_between_train_steps": 0.0036695003509521484, "step": 76} +{"info/global_step": 77, "train_info/time_within_train_step": 2.6735689640045166, "step": 77} +{"train_info/time_between_train_steps": 0.0036725997924804688, "step": 77} +{"info/global_step": 78, "train_info/time_within_train_step": 2.6748874187469482, "step": 78} +{"train_info/time_between_train_steps": 0.0037822723388671875, "step": 78} +{"info/global_step": 79, "train_info/time_within_train_step": 2.6747379302978516, "step": 79} +{"train_info/time_between_train_steps": 0.0036001205444335938, "step": 79} +{"info/global_step": 80, "train_info/time_within_train_step": 2.6806342601776123, "step": 80} +{"train_info/time_between_train_steps": 0.0036296844482421875, "step": 80} +{"info/global_step": 81, "train_info/time_within_train_step": 2.674990177154541, "step": 81} +{"train_info/time_between_train_steps": 0.003618001937866211, "step": 81} +{"info/global_step": 82, "train_info/time_within_train_step": 2.6753244400024414, "step": 82} +{"train_info/time_between_train_steps": 0.003656148910522461, "step": 82} +{"info/global_step": 83, "train_info/time_within_train_step": 2.674675941467285, "step": 83} +{"train_info/time_between_train_steps": 0.0036017894744873047, "step": 83} +{"info/global_step": 84, "train_info/time_within_train_step": 2.6749322414398193, "step": 84} +{"train_info/time_between_train_steps": 0.003566265106201172, "step": 84} +{"info/global_step": 85, "train_info/time_within_train_step": 2.674990653991699, "step": 85} +{"train_info/time_between_train_steps": 0.003679037094116211, "step": 85} +{"info/global_step": 86, "train_info/time_within_train_step": 2.6758971214294434, "step": 86} +{"train_info/time_between_train_steps": 0.0039844512939453125, "step": 86} +{"info/global_step": 87, "train_info/time_within_train_step": 2.6757147312164307, "step": 87} +{"train_info/time_between_train_steps": 0.004456996917724609, "step": 87} +{"info/global_step": 88, "train_info/time_within_train_step": 2.674431562423706, "step": 88} +{"train_info/time_between_train_steps": 0.003808736801147461, "step": 88} +{"info/global_step": 89, "train_info/time_within_train_step": 2.674302101135254, "step": 89} +{"train_info/time_between_train_steps": 0.0038416385650634766, "step": 89} +{"info/global_step": 90, "train_info/time_within_train_step": 2.675790786743164, "step": 90} +{"train_info/time_between_train_steps": 0.0038080215454101562, "step": 90} +{"info/global_step": 91, "train_info/time_within_train_step": 2.6772236824035645, "step": 91} +{"train_info/time_between_train_steps": 0.0038042068481445312, "step": 91} +{"info/global_step": 92, "train_info/time_within_train_step": 2.6755762100219727, "step": 92} +{"train_info/time_between_train_steps": 0.0038590431213378906, "step": 92} +{"info/global_step": 93, "train_info/time_within_train_step": 2.6787021160125732, "step": 93} +{"train_info/time_between_train_steps": 0.003821849822998047, "step": 93} +{"info/global_step": 94, "train_info/time_within_train_step": 2.6776344776153564, "step": 94} +{"train_info/time_between_train_steps": 0.004029989242553711, "step": 94} +{"info/global_step": 95, "train_info/time_within_train_step": 2.67838716506958, "step": 95} +{"train_info/time_between_train_steps": 0.00398564338684082, "step": 95} +{"info/global_step": 96, "train_info/time_within_train_step": 2.67771053314209, "step": 96} +{"train_info/time_between_train_steps": 0.003911256790161133, "step": 96} +{"info/global_step": 97, "train_info/time_within_train_step": 2.6768417358398438, "step": 97} +{"train_info/time_between_train_steps": 0.0039751529693603516, "step": 97} +{"info/global_step": 98, "train_info/time_within_train_step": 2.6778805255889893, "step": 98} +{"train_info/time_between_train_steps": 0.003877401351928711, "step": 98} +{"info/global_step": 99, "train_info/time_within_train_step": 2.676440477371216, "step": 99} +{"train_info/time_between_train_steps": 0.004006624221801758, "step": 99} +{"info/global_step": 100, "train_info/time_within_train_step": 2.6755387783050537, "step": 100} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746203521, "_runtime": 293}, "step": 100} +{"logs": {"train/loss": 6.6218, "train/learning_rate": 0.00019999999999999998, "train/epoch": 0.03, "_timestamp": 1746203521, "_runtime": 293}, "step": 100} +{"train_info/time_between_train_steps": 13.745463132858276, "step": 100} +{"info/global_step": 101, "train_info/time_within_train_step": 2.4679293632507324, "step": 101} +{"train_info/time_between_train_steps": 0.0038788318634033203, "step": 101} +{"info/global_step": 102, "train_info/time_within_train_step": 2.457540512084961, "step": 102} +{"train_info/time_between_train_steps": 0.0038628578186035156, "step": 102} +{"info/global_step": 103, "train_info/time_within_train_step": 2.5134189128875732, "step": 103} +{"train_info/time_between_train_steps": 0.0037603378295898438, "step": 103} +{"info/global_step": 104, "train_info/time_within_train_step": 3.10634708404541, "step": 104} +{"train_info/time_between_train_steps": 0.0034704208374023438, "step": 104} +{"info/global_step": 105, "train_info/time_within_train_step": 2.67266583442688, "step": 105} +{"train_info/time_between_train_steps": 0.0035660266876220703, "step": 105} +{"info/global_step": 106, "train_info/time_within_train_step": 2.674832582473755, "step": 106} +{"train_info/time_between_train_steps": 0.0034942626953125, "step": 106} +{"info/global_step": 107, "train_info/time_within_train_step": 2.675748348236084, "step": 107} +{"train_info/time_between_train_steps": 0.004167795181274414, "step": 107} +{"info/global_step": 108, "train_info/time_within_train_step": 2.6822164058685303, "step": 108} +{"train_info/time_between_train_steps": 0.0046274662017822266, "step": 108} +{"info/global_step": 109, "train_info/time_within_train_step": 2.6748549938201904, "step": 109} +{"train_info/time_between_train_steps": 0.003692150115966797, "step": 109} +{"info/global_step": 110, "train_info/time_within_train_step": 2.677856683731079, "step": 110} +{"train_info/time_between_train_steps": 0.004945516586303711, "step": 110} +{"info/global_step": 111, "train_info/time_within_train_step": 2.6793782711029053, "step": 111} +{"train_info/time_between_train_steps": 0.0046155452728271484, "step": 111} +{"info/global_step": 112, "train_info/time_within_train_step": 2.677870273590088, "step": 112} +{"train_info/time_between_train_steps": 0.004459857940673828, "step": 112} +{"info/global_step": 113, "train_info/time_within_train_step": 2.6768391132354736, "step": 113} +{"train_info/time_between_train_steps": 0.004300355911254883, "step": 113} +{"info/global_step": 114, "train_info/time_within_train_step": 2.676726818084717, "step": 114} +{"train_info/time_between_train_steps": 0.004446983337402344, "step": 114} +{"info/global_step": 115, "train_info/time_within_train_step": 2.678340435028076, "step": 115} +{"train_info/time_between_train_steps": 0.0044171810150146484, "step": 115} +{"info/global_step": 116, "train_info/time_within_train_step": 2.6767265796661377, "step": 116} +{"train_info/time_between_train_steps": 0.0045163631439208984, "step": 116} +{"info/global_step": 117, "train_info/time_within_train_step": 2.6797425746917725, "step": 117} +{"train_info/time_between_train_steps": 0.00443577766418457, "step": 117} +{"info/global_step": 118, "train_info/time_within_train_step": 2.678990602493286, "step": 118} +{"train_info/time_between_train_steps": 0.005054473876953125, "step": 118} +{"info/global_step": 119, "train_info/time_within_train_step": 2.6781065464019775, "step": 119} +{"train_info/time_between_train_steps": 0.0042459964752197266, "step": 119} +{"info/global_step": 120, "train_info/time_within_train_step": 2.679413080215454, "step": 120} +{"train_info/time_between_train_steps": 0.004616260528564453, "step": 120} +{"info/global_step": 121, "train_info/time_within_train_step": 2.6792478561401367, "step": 121} +{"train_info/time_between_train_steps": 0.004419803619384766, "step": 121} +{"info/global_step": 122, "train_info/time_within_train_step": 2.6765389442443848, "step": 122} +{"train_info/time_between_train_steps": 0.004458189010620117, "step": 122} +{"info/global_step": 123, "train_info/time_within_train_step": 2.6774110794067383, "step": 123} +{"train_info/time_between_train_steps": 0.004609107971191406, "step": 123} +{"info/global_step": 124, "train_info/time_within_train_step": 2.6780028343200684, "step": 124} +{"train_info/time_between_train_steps": 0.004599571228027344, "step": 124} +{"info/global_step": 125, "train_info/time_within_train_step": 2.6771013736724854, "step": 125} +{"train_info/time_between_train_steps": 0.2480788230895996, "step": 125} +{"info/global_step": 126, "train_info/time_within_train_step": 2.674790859222412, "step": 126} +{"train_info/time_between_train_steps": 0.003892183303833008, "step": 126} +{"info/global_step": 127, "train_info/time_within_train_step": 2.674844741821289, "step": 127} +{"train_info/time_between_train_steps": 0.003818511962890625, "step": 127} +{"info/global_step": 128, "train_info/time_within_train_step": 2.674772262573242, "step": 128} +{"train_info/time_between_train_steps": 0.003930568695068359, "step": 128} +{"info/global_step": 129, "train_info/time_within_train_step": 2.675541877746582, "step": 129} +{"train_info/time_between_train_steps": 0.0038909912109375, "step": 129} +{"info/global_step": 130, "train_info/time_within_train_step": 2.673668146133423, "step": 130} +{"train_info/time_between_train_steps": 0.003654956817626953, "step": 130} +{"info/global_step": 131, "train_info/time_within_train_step": 2.679614543914795, "step": 131} +{"train_info/time_between_train_steps": 0.003979206085205078, "step": 131} +{"info/global_step": 132, "train_info/time_within_train_step": 2.6764919757843018, "step": 132} +{"train_info/time_between_train_steps": 0.003944873809814453, "step": 132} +{"info/global_step": 133, "train_info/time_within_train_step": 2.6743552684783936, "step": 133} +{"train_info/time_between_train_steps": 0.0038368701934814453, "step": 133} +{"info/global_step": 134, "train_info/time_within_train_step": 2.676011562347412, "step": 134} +{"train_info/time_between_train_steps": 0.003853321075439453, "step": 134} +{"info/global_step": 135, "train_info/time_within_train_step": 2.6752867698669434, "step": 135} +{"train_info/time_between_train_steps": 0.0038368701934814453, "step": 135} +{"info/global_step": 136, "train_info/time_within_train_step": 2.6770670413970947, "step": 136} +{"train_info/time_between_train_steps": 0.0038442611694335938, "step": 136} +{"info/global_step": 137, "train_info/time_within_train_step": 2.679912567138672, "step": 137} +{"train_info/time_between_train_steps": 0.0037877559661865234, "step": 137} +{"info/global_step": 138, "train_info/time_within_train_step": 2.674931049346924, "step": 138} +{"train_info/time_between_train_steps": 0.003920793533325195, "step": 138} +{"info/global_step": 139, "train_info/time_within_train_step": 2.6746010780334473, "step": 139} +{"train_info/time_between_train_steps": 0.003863811492919922, "step": 139} +{"info/global_step": 140, "train_info/time_within_train_step": 2.6753592491149902, "step": 140} +{"train_info/time_between_train_steps": 0.0038132667541503906, "step": 140} +{"info/global_step": 141, "train_info/time_within_train_step": 2.674400806427002, "step": 141} +{"train_info/time_between_train_steps": 0.004003286361694336, "step": 141} +{"info/global_step": 142, "train_info/time_within_train_step": 2.6786718368530273, "step": 142} +{"train_info/time_between_train_steps": 0.0038101673126220703, "step": 142} +{"info/global_step": 143, "train_info/time_within_train_step": 2.675382137298584, "step": 143} +{"train_info/time_between_train_steps": 0.003958225250244141, "step": 143} +{"info/global_step": 144, "train_info/time_within_train_step": 2.674081563949585, "step": 144} +{"train_info/time_between_train_steps": 0.0038788318634033203, "step": 144} +{"info/global_step": 145, "train_info/time_within_train_step": 2.6750423908233643, "step": 145} +{"train_info/time_between_train_steps": 0.004198789596557617, "step": 145} +{"info/global_step": 146, "train_info/time_within_train_step": 2.676042079925537, "step": 146} +{"train_info/time_between_train_steps": 0.00434422492980957, "step": 146} +{"info/global_step": 147, "train_info/time_within_train_step": 2.7026703357696533, "step": 147} +{"train_info/time_between_train_steps": 0.004365682601928711, "step": 147} +{"info/global_step": 148, "train_info/time_within_train_step": 2.6778180599212646, "step": 148} +{"train_info/time_between_train_steps": 0.0043408870697021484, "step": 148} +{"info/global_step": 149, "train_info/time_within_train_step": 2.6774978637695312, "step": 149} +{"train_info/time_between_train_steps": 0.004342079162597656, "step": 149} +{"info/global_step": 150, "train_info/time_within_train_step": 2.677701711654663, "step": 150} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746203670, "_runtime": 442}, "step": 150} +{"logs": {"train/loss": 6.1255, "train/learning_rate": 0.0003, "train/epoch": 0.05, "_timestamp": 1746203670, "_runtime": 442}, "step": 150} +{"train_info/time_between_train_steps": 0.025470495223999023, "step": 150} +{"info/global_step": 151, "train_info/time_within_train_step": 2.6765995025634766, "step": 151} +{"train_info/time_between_train_steps": 0.0043375492095947266, "step": 151} +{"info/global_step": 152, "train_info/time_within_train_step": 2.67539381980896, "step": 152} +{"train_info/time_between_train_steps": 0.004201412200927734, "step": 152} +{"info/global_step": 153, "train_info/time_within_train_step": 2.6754229068756104, "step": 153} +{"train_info/time_between_train_steps": 0.0043315887451171875, "step": 153} +{"info/global_step": 154, "train_info/time_within_train_step": 2.6733322143554688, "step": 154} +{"train_info/time_between_train_steps": 0.004152536392211914, "step": 154} +{"info/global_step": 155, "train_info/time_within_train_step": 3.279858112335205, "step": 155} +{"train_info/time_between_train_steps": 0.0035653114318847656, "step": 155} +{"info/global_step": 156, "train_info/time_within_train_step": 2.673189640045166, "step": 156} +{"train_info/time_between_train_steps": 0.0034971237182617188, "step": 156} +{"info/global_step": 157, "train_info/time_within_train_step": 2.6717331409454346, "step": 157} +{"train_info/time_between_train_steps": 0.003511190414428711, "step": 157} +{"info/global_step": 158, "train_info/time_within_train_step": 2.6746485233306885, "step": 158} +{"train_info/time_between_train_steps": 0.0035483837127685547, "step": 158} +{"info/global_step": 159, "train_info/time_within_train_step": 2.678255081176758, "step": 159} +{"train_info/time_between_train_steps": 0.003428936004638672, "step": 159} +{"info/global_step": 160, "train_info/time_within_train_step": 2.6751317977905273, "step": 160} +{"train_info/time_between_train_steps": 0.003531217575073242, "step": 160} +{"info/global_step": 161, "train_info/time_within_train_step": 2.6727468967437744, "step": 161} +{"train_info/time_between_train_steps": 0.0034711360931396484, "step": 161} +{"info/global_step": 162, "train_info/time_within_train_step": 2.674410104751587, "step": 162} +{"train_info/time_between_train_steps": 0.003482341766357422, "step": 162} +{"info/global_step": 163, "train_info/time_within_train_step": 2.6740710735321045, "step": 163} +{"train_info/time_between_train_steps": 0.0036156177520751953, "step": 163} +{"info/global_step": 164, "train_info/time_within_train_step": 2.6768078804016113, "step": 164} +{"train_info/time_between_train_steps": 0.003592967987060547, "step": 164} +{"info/global_step": 165, "train_info/time_within_train_step": 2.6712472438812256, "step": 165} +{"train_info/time_between_train_steps": 0.003542661666870117, "step": 165} +{"info/global_step": 166, "train_info/time_within_train_step": 2.673222064971924, "step": 166} +{"train_info/time_between_train_steps": 0.0034995079040527344, "step": 166} +{"info/global_step": 167, "train_info/time_within_train_step": 2.670372486114502, "step": 167} +{"train_info/time_between_train_steps": 0.003546476364135742, "step": 167} +{"info/global_step": 168, "train_info/time_within_train_step": 2.6715519428253174, "step": 168} +{"train_info/time_between_train_steps": 0.003561258316040039, "step": 168} +{"info/global_step": 169, "train_info/time_within_train_step": 2.7037627696990967, "step": 169} +{"train_info/time_between_train_steps": 0.0035734176635742188, "step": 169} +{"info/global_step": 170, "train_info/time_within_train_step": 2.673729419708252, "step": 170} +{"train_info/time_between_train_steps": 0.0036089420318603516, "step": 170} +{"info/global_step": 171, "train_info/time_within_train_step": 2.672940731048584, "step": 171} +{"train_info/time_between_train_steps": 0.003705263137817383, "step": 171} +{"info/global_step": 172, "train_info/time_within_train_step": 2.673166036605835, "step": 172} +{"train_info/time_between_train_steps": 0.0036649703979492188, "step": 172} +{"info/global_step": 173, "train_info/time_within_train_step": 2.672569990158081, "step": 173} +{"train_info/time_between_train_steps": 0.003725290298461914, "step": 173} +{"info/global_step": 174, "train_info/time_within_train_step": 2.6740026473999023, "step": 174} +{"train_info/time_between_train_steps": 0.0037441253662109375, "step": 174} +{"info/global_step": 175, "train_info/time_within_train_step": 2.6725664138793945, "step": 175} +{"train_info/time_between_train_steps": 0.0037004947662353516, "step": 175} +{"info/global_step": 176, "train_info/time_within_train_step": 2.6724941730499268, "step": 176} +{"train_info/time_between_train_steps": 0.003718137741088867, "step": 176} +{"info/global_step": 177, "train_info/time_within_train_step": 2.6734459400177, "step": 177} +{"train_info/time_between_train_steps": 0.0036394596099853516, "step": 177} +{"info/global_step": 178, "train_info/time_within_train_step": 2.6730945110321045, "step": 178} +{"train_info/time_between_train_steps": 0.0036699771881103516, "step": 178} +{"info/global_step": 179, "train_info/time_within_train_step": 2.672452688217163, "step": 179} +{"train_info/time_between_train_steps": 0.0037202835083007812, "step": 179} +{"info/global_step": 180, "train_info/time_within_train_step": 2.6729648113250732, "step": 180} +{"train_info/time_between_train_steps": 0.003712892532348633, "step": 180} +{"info/global_step": 181, "train_info/time_within_train_step": 2.673978567123413, "step": 181} +{"train_info/time_between_train_steps": 0.003557443618774414, "step": 181} +{"info/global_step": 182, "train_info/time_within_train_step": 2.672996759414673, "step": 182} +{"train_info/time_between_train_steps": 0.0036804676055908203, "step": 182} +{"info/global_step": 183, "train_info/time_within_train_step": 2.674086332321167, "step": 183} +{"train_info/time_between_train_steps": 0.0036957263946533203, "step": 183} +{"info/global_step": 184, "train_info/time_within_train_step": 2.674816608428955, "step": 184} +{"train_info/time_between_train_steps": 0.0037424564361572266, "step": 184} +{"info/global_step": 185, "train_info/time_within_train_step": 2.673668146133423, "step": 185} +{"train_info/time_between_train_steps": 0.003704547882080078, "step": 185} +{"info/global_step": 186, "train_info/time_within_train_step": 2.6748220920562744, "step": 186} +{"train_info/time_between_train_steps": 0.0038328170776367188, "step": 186} +{"info/global_step": 187, "train_info/time_within_train_step": 2.6744484901428223, "step": 187} +{"train_info/time_between_train_steps": 0.0036134719848632812, "step": 187} +{"info/global_step": 188, "train_info/time_within_train_step": 2.841005325317383, "step": 188} +{"train_info/time_between_train_steps": 0.003464221954345703, "step": 188} +{"info/global_step": 189, "train_info/time_within_train_step": 2.6734182834625244, "step": 189} +{"train_info/time_between_train_steps": 0.0035429000854492188, "step": 189} +{"info/global_step": 190, "train_info/time_within_train_step": 2.673306941986084, "step": 190} +{"train_info/time_between_train_steps": 0.003513813018798828, "step": 190} +{"info/global_step": 191, "train_info/time_within_train_step": 2.673593521118164, "step": 191} +{"train_info/time_between_train_steps": 0.0036034584045410156, "step": 191} +{"info/global_step": 192, "train_info/time_within_train_step": 3.017935037612915, "step": 192} +{"train_info/time_between_train_steps": 0.003366231918334961, "step": 192} +{"info/global_step": 193, "train_info/time_within_train_step": 2.670536994934082, "step": 193} +{"train_info/time_between_train_steps": 0.0033953189849853516, "step": 193} +{"info/global_step": 194, "train_info/time_within_train_step": 2.6698007583618164, "step": 194} +{"train_info/time_between_train_steps": 0.0033736228942871094, "step": 194} +{"info/global_step": 195, "train_info/time_within_train_step": 2.6712348461151123, "step": 195} +{"train_info/time_between_train_steps": 0.0033664703369140625, "step": 195} +{"info/global_step": 196, "train_info/time_within_train_step": 2.672844409942627, "step": 196} +{"train_info/time_between_train_steps": 0.003409862518310547, "step": 196} +{"info/global_step": 197, "train_info/time_within_train_step": 2.673795461654663, "step": 197} +{"train_info/time_between_train_steps": 0.0034143924713134766, "step": 197} +{"info/global_step": 198, "train_info/time_within_train_step": 2.6721715927124023, "step": 198} +{"train_info/time_between_train_steps": 0.0034513473510742188, "step": 198} +{"info/global_step": 199, "train_info/time_within_train_step": 2.6734561920166016, "step": 199} +{"train_info/time_between_train_steps": 0.0035142898559570312, "step": 199} +{"info/global_step": 200, "train_info/time_within_train_step": 2.6734931468963623, "step": 200} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746203806, "_runtime": 578}, "step": 200} +{"logs": {"train/loss": 5.8614, "train/learning_rate": 0.00039999999999999996, "train/epoch": 0.07, "_timestamp": 1746203806, "_runtime": 578}, "step": 200} +{"train_info/time_between_train_steps": 15.570960521697998, "step": 200} +{"info/global_step": 201, "train_info/time_within_train_step": 2.4740476608276367, "step": 201} +{"train_info/time_between_train_steps": 0.0035860538482666016, "step": 201} +{"info/global_step": 202, "train_info/time_within_train_step": 2.4570181369781494, "step": 202} +{"train_info/time_between_train_steps": 0.0033898353576660156, "step": 202} +{"info/global_step": 203, "train_info/time_within_train_step": 2.467954397201538, "step": 203} +{"train_info/time_between_train_steps": 0.0033826828002929688, "step": 203} +{"info/global_step": 204, "train_info/time_within_train_step": 2.642672061920166, "step": 204} +{"train_info/time_between_train_steps": 0.0033702850341796875, "step": 204} +{"info/global_step": 205, "train_info/time_within_train_step": 2.674328088760376, "step": 205} +{"train_info/time_between_train_steps": 0.0033936500549316406, "step": 205} +{"info/global_step": 206, "train_info/time_within_train_step": 2.672698974609375, "step": 206} +{"train_info/time_between_train_steps": 0.0033445358276367188, "step": 206} +{"info/global_step": 207, "train_info/time_within_train_step": 2.6735994815826416, "step": 207} +{"train_info/time_between_train_steps": 0.0033485889434814453, "step": 207} +{"info/global_step": 208, "train_info/time_within_train_step": 2.694563388824463, "step": 208} +{"train_info/time_between_train_steps": 0.003364086151123047, "step": 208} +{"info/global_step": 209, "train_info/time_within_train_step": 2.673905849456787, "step": 209} +{"train_info/time_between_train_steps": 0.003332376480102539, "step": 209} +{"info/global_step": 210, "train_info/time_within_train_step": 2.6731557846069336, "step": 210} +{"train_info/time_between_train_steps": 0.0033240318298339844, "step": 210} +{"info/global_step": 211, "train_info/time_within_train_step": 2.6727631092071533, "step": 211} +{"train_info/time_between_train_steps": 0.0033125877380371094, "step": 211} +{"info/global_step": 212, "train_info/time_within_train_step": 2.6737380027770996, "step": 212} +{"train_info/time_between_train_steps": 0.0033409595489501953, "step": 212} +{"info/global_step": 213, "train_info/time_within_train_step": 2.6726856231689453, "step": 213} +{"train_info/time_between_train_steps": 0.0032739639282226562, "step": 213} +{"info/global_step": 214, "train_info/time_within_train_step": 2.6739559173583984, "step": 214} +{"train_info/time_between_train_steps": 0.0033652782440185547, "step": 214} +{"info/global_step": 215, "train_info/time_within_train_step": 2.671849012374878, "step": 215} +{"train_info/time_between_train_steps": 0.0033483505249023438, "step": 215} +{"info/global_step": 216, "train_info/time_within_train_step": 2.68243145942688, "step": 216} +{"train_info/time_between_train_steps": 0.003317117691040039, "step": 216} +{"info/global_step": 217, "train_info/time_within_train_step": 2.673107147216797, "step": 217} +{"train_info/time_between_train_steps": 0.0033359527587890625, "step": 217} +{"info/global_step": 218, "train_info/time_within_train_step": 2.6741058826446533, "step": 218} +{"train_info/time_between_train_steps": 0.0033502578735351562, "step": 218} +{"info/global_step": 219, "train_info/time_within_train_step": 2.67265248298645, "step": 219} +{"train_info/time_between_train_steps": 0.003346681594848633, "step": 219} +{"info/global_step": 220, "train_info/time_within_train_step": 2.6757495403289795, "step": 220} +{"train_info/time_between_train_steps": 0.003348827362060547, "step": 220} +{"info/global_step": 221, "train_info/time_within_train_step": 2.6737372875213623, "step": 221} +{"train_info/time_between_train_steps": 0.003296375274658203, "step": 221} +{"info/global_step": 222, "train_info/time_within_train_step": 2.6734204292297363, "step": 222} +{"train_info/time_between_train_steps": 0.0034193992614746094, "step": 222} +{"info/global_step": 223, "train_info/time_within_train_step": 2.674668312072754, "step": 223} +{"train_info/time_between_train_steps": 0.00335693359375, "step": 223} +{"info/global_step": 224, "train_info/time_within_train_step": 2.673732042312622, "step": 224} +{"train_info/time_between_train_steps": 0.003328084945678711, "step": 224} +{"info/global_step": 225, "train_info/time_within_train_step": 2.6745338439941406, "step": 225} +{"train_info/time_between_train_steps": 0.0033791065216064453, "step": 225} +{"info/global_step": 226, "train_info/time_within_train_step": 2.673332929611206, "step": 226} +{"train_info/time_between_train_steps": 0.0033266544342041016, "step": 226} +{"info/global_step": 227, "train_info/time_within_train_step": 2.672685146331787, "step": 227} +{"train_info/time_between_train_steps": 0.0033638477325439453, "step": 227} +{"info/global_step": 228, "train_info/time_within_train_step": 2.672978401184082, "step": 228} +{"train_info/time_between_train_steps": 0.0033910274505615234, "step": 228} +{"info/global_step": 229, "train_info/time_within_train_step": 2.6711273193359375, "step": 229} +{"train_info/time_between_train_steps": 0.003359556198120117, "step": 229} +{"info/global_step": 230, "train_info/time_within_train_step": 2.672713041305542, "step": 230} +{"train_info/time_between_train_steps": 0.0034401416778564453, "step": 230} +{"info/global_step": 231, "train_info/time_within_train_step": 2.6719090938568115, "step": 231} +{"train_info/time_between_train_steps": 0.0033905506134033203, "step": 231} +{"info/global_step": 232, "train_info/time_within_train_step": 2.673164129257202, "step": 232} +{"train_info/time_between_train_steps": 0.0032622814178466797, "step": 232} +{"info/global_step": 233, "train_info/time_within_train_step": 2.6724374294281006, "step": 233} +{"train_info/time_between_train_steps": 0.0033180713653564453, "step": 233} +{"info/global_step": 234, "train_info/time_within_train_step": 2.674220561981201, "step": 234} +{"train_info/time_between_train_steps": 0.0033121109008789062, "step": 234} +{"info/global_step": 235, "train_info/time_within_train_step": 2.672297239303589, "step": 235} +{"train_info/time_between_train_steps": 0.0032901763916015625, "step": 235} +{"info/global_step": 236, "train_info/time_within_train_step": 2.673548936843872, "step": 236} +{"train_info/time_between_train_steps": 0.0033812522888183594, "step": 236} +{"info/global_step": 237, "train_info/time_within_train_step": 2.675276517868042, "step": 237} +{"train_info/time_between_train_steps": 0.003373861312866211, "step": 237} +{"info/global_step": 238, "train_info/time_within_train_step": 2.6734204292297363, "step": 238} +{"train_info/time_between_train_steps": 0.0032875537872314453, "step": 238} +{"info/global_step": 239, "train_info/time_within_train_step": 2.671637773513794, "step": 239} +{"train_info/time_between_train_steps": 0.0033037662506103516, "step": 239} +{"info/global_step": 240, "train_info/time_within_train_step": 2.672189712524414, "step": 240} +{"train_info/time_between_train_steps": 0.003457307815551758, "step": 240} +{"info/global_step": 241, "train_info/time_within_train_step": 2.672666549682617, "step": 241} +{"train_info/time_between_train_steps": 0.003417491912841797, "step": 241} +{"info/global_step": 242, "train_info/time_within_train_step": 2.673332929611206, "step": 242} +{"train_info/time_between_train_steps": 0.0034151077270507812, "step": 242} +{"info/global_step": 243, "train_info/time_within_train_step": 2.67252779006958, "step": 243} +{"train_info/time_between_train_steps": 0.003476858139038086, "step": 243} +{"info/global_step": 244, "train_info/time_within_train_step": 2.672834634780884, "step": 244} +{"train_info/time_between_train_steps": 0.003412961959838867, "step": 244} +{"info/global_step": 245, "train_info/time_within_train_step": 2.703786849975586, "step": 245} +{"train_info/time_between_train_steps": 0.0034368038177490234, "step": 245} +{"info/global_step": 246, "train_info/time_within_train_step": 2.6728155612945557, "step": 246} +{"train_info/time_between_train_steps": 0.003415822982788086, "step": 246} +{"info/global_step": 247, "train_info/time_within_train_step": 2.673424243927002, "step": 247} +{"train_info/time_between_train_steps": 0.0035295486450195312, "step": 247} +{"info/global_step": 248, "train_info/time_within_train_step": 2.674389123916626, "step": 248} +{"train_info/time_between_train_steps": 0.0035409927368164062, "step": 248} +{"info/global_step": 249, "train_info/time_within_train_step": 2.675299882888794, "step": 249} +{"train_info/time_between_train_steps": 0.0037546157836914062, "step": 249} +{"info/global_step": 250, "train_info/time_within_train_step": 3.478531837463379, "step": 250} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746203957, "_runtime": 729}, "step": 250} +{"logs": {"train/loss": 5.7039, "train/learning_rate": 0.0005, "train/epoch": 0.08, "_timestamp": 1746203957, "_runtime": 729}, "step": 250} +{"train_info/time_between_train_steps": 0.2118537425994873, "step": 250} +{"info/global_step": 251, "train_info/time_within_train_step": 2.6678593158721924, "step": 251} +{"train_info/time_between_train_steps": 0.0035915374755859375, "step": 251} +{"info/global_step": 252, "train_info/time_within_train_step": 2.6750247478485107, "step": 252} +{"train_info/time_between_train_steps": 0.003539562225341797, "step": 252} +{"info/global_step": 253, "train_info/time_within_train_step": 2.673814296722412, "step": 253} +{"train_info/time_between_train_steps": 0.0035610198974609375, "step": 253} +{"info/global_step": 254, "train_info/time_within_train_step": 2.6731700897216797, "step": 254} +{"train_info/time_between_train_steps": 0.003614664077758789, "step": 254} +{"info/global_step": 255, "train_info/time_within_train_step": 2.672347068786621, "step": 255} +{"train_info/time_between_train_steps": 0.0035533905029296875, "step": 255} +{"info/global_step": 256, "train_info/time_within_train_step": 2.6708295345306396, "step": 256} +{"train_info/time_between_train_steps": 0.0034258365631103516, "step": 256} +{"info/global_step": 257, "train_info/time_within_train_step": 2.6711463928222656, "step": 257} +{"train_info/time_between_train_steps": 0.0034918785095214844, "step": 257} +{"info/global_step": 258, "train_info/time_within_train_step": 2.672351360321045, "step": 258} +{"train_info/time_between_train_steps": 0.0036406517028808594, "step": 258} +{"info/global_step": 259, "train_info/time_within_train_step": 2.672375202178955, "step": 259} +{"train_info/time_between_train_steps": 0.0034279823303222656, "step": 259} +{"info/global_step": 260, "train_info/time_within_train_step": 2.6721103191375732, "step": 260} +{"train_info/time_between_train_steps": 0.0034248828887939453, "step": 260} +{"info/global_step": 261, "train_info/time_within_train_step": 2.672578811645508, "step": 261} +{"train_info/time_between_train_steps": 0.0034761428833007812, "step": 261} +{"info/global_step": 262, "train_info/time_within_train_step": 2.673434019088745, "step": 262} +{"train_info/time_between_train_steps": 0.00348663330078125, "step": 262} +{"info/global_step": 263, "train_info/time_within_train_step": 2.6712520122528076, "step": 263} +{"train_info/time_between_train_steps": 0.0034799575805664062, "step": 263} +{"info/global_step": 264, "train_info/time_within_train_step": 2.672443151473999, "step": 264} +{"train_info/time_between_train_steps": 0.0036275386810302734, "step": 264} +{"info/global_step": 265, "train_info/time_within_train_step": 3.032341480255127, "step": 265} +{"train_info/time_between_train_steps": 0.0034704208374023438, "step": 265} +{"info/global_step": 266, "train_info/time_within_train_step": 2.6714541912078857, "step": 266} +{"train_info/time_between_train_steps": 0.0033614635467529297, "step": 266} +{"info/global_step": 267, "train_info/time_within_train_step": 2.676044464111328, "step": 267} +{"train_info/time_between_train_steps": 0.003378629684448242, "step": 267} +{"info/global_step": 268, "train_info/time_within_train_step": 2.672032594680786, "step": 268} +{"train_info/time_between_train_steps": 0.0033910274505615234, "step": 268} +{"info/global_step": 269, "train_info/time_within_train_step": 2.6694047451019287, "step": 269} +{"train_info/time_between_train_steps": 0.0033609867095947266, "step": 269} +{"info/global_step": 270, "train_info/time_within_train_step": 2.6705667972564697, "step": 270} +{"train_info/time_between_train_steps": 0.003427267074584961, "step": 270} +{"info/global_step": 271, "train_info/time_within_train_step": 2.670759916305542, "step": 271} +{"train_info/time_between_train_steps": 0.0033426284790039062, "step": 271} +{"info/global_step": 272, "train_info/time_within_train_step": 2.671191453933716, "step": 272} +{"train_info/time_between_train_steps": 0.0033338069915771484, "step": 272} +{"info/global_step": 273, "train_info/time_within_train_step": 2.6769988536834717, "step": 273} +{"train_info/time_between_train_steps": 0.0033752918243408203, "step": 273} +{"info/global_step": 274, "train_info/time_within_train_step": 2.6717307567596436, "step": 274} +{"train_info/time_between_train_steps": 0.0033817291259765625, "step": 274} +{"info/global_step": 275, "train_info/time_within_train_step": 2.673508405685425, "step": 275} +{"train_info/time_between_train_steps": 0.003355741500854492, "step": 275} +{"info/global_step": 276, "train_info/time_within_train_step": 2.6722731590270996, "step": 276} +{"train_info/time_between_train_steps": 0.003364086151123047, "step": 276} +{"info/global_step": 277, "train_info/time_within_train_step": 2.6709136962890625, "step": 277} +{"train_info/time_between_train_steps": 0.003319978713989258, "step": 277} +{"info/global_step": 278, "train_info/time_within_train_step": 2.6708266735076904, "step": 278} +{"train_info/time_between_train_steps": 0.003330230712890625, "step": 278} +{"info/global_step": 279, "train_info/time_within_train_step": 2.6715571880340576, "step": 279} +{"train_info/time_between_train_steps": 0.0032548904418945312, "step": 279} +{"info/global_step": 280, "train_info/time_within_train_step": 2.6701247692108154, "step": 280} +{"train_info/time_between_train_steps": 0.00336456298828125, "step": 280} +{"info/global_step": 281, "train_info/time_within_train_step": 2.6750078201293945, "step": 281} +{"train_info/time_between_train_steps": 0.0033278465270996094, "step": 281} +{"info/global_step": 282, "train_info/time_within_train_step": 2.669235944747925, "step": 282} +{"train_info/time_between_train_steps": 0.0033240318298339844, "step": 282} +{"info/global_step": 283, "train_info/time_within_train_step": 2.669334888458252, "step": 283} +{"train_info/time_between_train_steps": 0.0034089088439941406, "step": 283} +{"info/global_step": 284, "train_info/time_within_train_step": 2.6688990592956543, "step": 284} +{"train_info/time_between_train_steps": 0.0032868385314941406, "step": 284} +{"info/global_step": 285, "train_info/time_within_train_step": 2.671140193939209, "step": 285} +{"train_info/time_between_train_steps": 0.0032961368560791016, "step": 285} +{"info/global_step": 286, "train_info/time_within_train_step": 2.6698434352874756, "step": 286} +{"train_info/time_between_train_steps": 0.0033092498779296875, "step": 286} +{"info/global_step": 287, "train_info/time_within_train_step": 2.6698157787323, "step": 287} +{"train_info/time_between_train_steps": 0.003287076950073242, "step": 287} +{"info/global_step": 288, "train_info/time_within_train_step": 2.671264171600342, "step": 288} +{"train_info/time_between_train_steps": 0.0032935142517089844, "step": 288} +{"info/global_step": 289, "train_info/time_within_train_step": 2.6697278022766113, "step": 289} +{"train_info/time_between_train_steps": 0.003337383270263672, "step": 289} +{"info/global_step": 290, "train_info/time_within_train_step": 2.668949842453003, "step": 290} +{"train_info/time_between_train_steps": 0.0032858848571777344, "step": 290} +{"info/global_step": 291, "train_info/time_within_train_step": 2.6689860820770264, "step": 291} +{"train_info/time_between_train_steps": 0.003331899642944336, "step": 291} +{"info/global_step": 292, "train_info/time_within_train_step": 2.6697120666503906, "step": 292} +{"train_info/time_between_train_steps": 0.003357410430908203, "step": 292} +{"info/global_step": 293, "train_info/time_within_train_step": 2.670353651046753, "step": 293} +{"train_info/time_between_train_steps": 0.0033617019653320312, "step": 293} +{"info/global_step": 294, "train_info/time_within_train_step": 2.6697707176208496, "step": 294} +{"train_info/time_between_train_steps": 0.0039446353912353516, "step": 294} +{"info/global_step": 295, "train_info/time_within_train_step": 2.6697838306427, "step": 295} +{"train_info/time_between_train_steps": 0.0033211708068847656, "step": 295} +{"info/global_step": 296, "train_info/time_within_train_step": 2.6706676483154297, "step": 296} +{"train_info/time_between_train_steps": 0.0033309459686279297, "step": 296} +{"info/global_step": 297, "train_info/time_within_train_step": 2.693833112716675, "step": 297} +{"train_info/time_between_train_steps": 0.003274679183959961, "step": 297} +{"info/global_step": 298, "train_info/time_within_train_step": 2.670638084411621, "step": 298} +{"train_info/time_between_train_steps": 0.003321409225463867, "step": 298} +{"info/global_step": 299, "train_info/time_within_train_step": 2.672093152999878, "step": 299} +{"train_info/time_between_train_steps": 0.003356456756591797, "step": 299} +{"info/global_step": 300, "train_info/time_within_train_step": 2.6727395057678223, "step": 300} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746204092, "_runtime": 864}, "step": 300} +{"logs": {"train/loss": 5.5978, "train/learning_rate": 0.0006, "train/epoch": 0.1, "_timestamp": 1746204092, "_runtime": 864}, "step": 300} +{"train_info/time_between_train_steps": 13.812514781951904, "step": 300} +{"info/global_step": 301, "train_info/time_within_train_step": 2.4638476371765137, "step": 301} +{"train_info/time_between_train_steps": 0.003627777099609375, "step": 301} +{"info/global_step": 302, "train_info/time_within_train_step": 2.4547438621520996, "step": 302} +{"train_info/time_between_train_steps": 0.003676891326904297, "step": 302} +{"info/global_step": 303, "train_info/time_within_train_step": 2.4645090103149414, "step": 303} +{"train_info/time_between_train_steps": 0.003645181655883789, "step": 303} +{"info/global_step": 304, "train_info/time_within_train_step": 2.6407933235168457, "step": 304} +{"train_info/time_between_train_steps": 0.0035533905029296875, "step": 304} +{"info/global_step": 305, "train_info/time_within_train_step": 2.6703078746795654, "step": 305} +{"train_info/time_between_train_steps": 0.0035991668701171875, "step": 305} +{"info/global_step": 306, "train_info/time_within_train_step": 2.6693835258483887, "step": 306} +{"train_info/time_between_train_steps": 0.0036394596099853516, "step": 306} +{"info/global_step": 307, "train_info/time_within_train_step": 2.6708638668060303, "step": 307} +{"train_info/time_between_train_steps": 0.003527402877807617, "step": 307} +{"info/global_step": 308, "train_info/time_within_train_step": 2.6715781688690186, "step": 308} +{"train_info/time_between_train_steps": 0.0035843849182128906, "step": 308} +{"info/global_step": 309, "train_info/time_within_train_step": 2.6721420288085938, "step": 309} +{"train_info/time_between_train_steps": 0.0036249160766601562, "step": 309} +{"info/global_step": 310, "train_info/time_within_train_step": 2.672952890396118, "step": 310} +{"train_info/time_between_train_steps": 0.003582477569580078, "step": 310} +{"info/global_step": 311, "train_info/time_within_train_step": 2.6728734970092773, "step": 311} +{"train_info/time_between_train_steps": 0.0035881996154785156, "step": 311} +{"info/global_step": 312, "train_info/time_within_train_step": 2.6960670948028564, "step": 312} +{"train_info/time_between_train_steps": 0.0035011768341064453, "step": 312} +{"info/global_step": 313, "train_info/time_within_train_step": 2.8724517822265625, "step": 313} +{"train_info/time_between_train_steps": 0.0034852027893066406, "step": 313} +{"info/global_step": 314, "train_info/time_within_train_step": 2.6732802391052246, "step": 314} +{"train_info/time_between_train_steps": 0.0034055709838867188, "step": 314} +{"info/global_step": 315, "train_info/time_within_train_step": 2.6722679138183594, "step": 315} +{"train_info/time_between_train_steps": 0.0034008026123046875, "step": 315} +{"info/global_step": 316, "train_info/time_within_train_step": 2.6717138290405273, "step": 316} +{"train_info/time_between_train_steps": 0.0033452510833740234, "step": 316} +{"info/global_step": 317, "train_info/time_within_train_step": 2.6728334426879883, "step": 317} +{"train_info/time_between_train_steps": 0.0034096240997314453, "step": 317} +{"info/global_step": 318, "train_info/time_within_train_step": 2.670365333557129, "step": 318} +{"train_info/time_between_train_steps": 0.003421306610107422, "step": 318} +{"info/global_step": 319, "train_info/time_within_train_step": 2.6705102920532227, "step": 319} +{"train_info/time_between_train_steps": 0.003404378890991211, "step": 319} +{"info/global_step": 320, "train_info/time_within_train_step": 2.6706933975219727, "step": 320} +{"train_info/time_between_train_steps": 0.0035746097564697266, "step": 320} +{"info/global_step": 321, "train_info/time_within_train_step": 2.9962260723114014, "step": 321} +{"train_info/time_between_train_steps": 0.0034263134002685547, "step": 321} +{"info/global_step": 322, "train_info/time_within_train_step": 2.6714584827423096, "step": 322} +{"train_info/time_between_train_steps": 0.003331899642944336, "step": 322} +{"info/global_step": 323, "train_info/time_within_train_step": 2.6722121238708496, "step": 323} +{"train_info/time_between_train_steps": 0.0033795833587646484, "step": 323} +{"info/global_step": 324, "train_info/time_within_train_step": 2.671409845352173, "step": 324} +{"train_info/time_between_train_steps": 0.0032939910888671875, "step": 324} +{"info/global_step": 325, "train_info/time_within_train_step": 2.6720292568206787, "step": 325} +{"train_info/time_between_train_steps": 0.0033173561096191406, "step": 325} +{"info/global_step": 326, "train_info/time_within_train_step": 2.670295476913452, "step": 326} +{"train_info/time_between_train_steps": 0.003419637680053711, "step": 326} +{"info/global_step": 327, "train_info/time_within_train_step": 2.6699893474578857, "step": 327} +{"train_info/time_between_train_steps": 0.0033235549926757812, "step": 327} +{"info/global_step": 328, "train_info/time_within_train_step": 2.66976261138916, "step": 328} +{"train_info/time_between_train_steps": 0.003284454345703125, "step": 328} +{"info/global_step": 329, "train_info/time_within_train_step": 2.671265125274658, "step": 329} +{"train_info/time_between_train_steps": 0.0033986568450927734, "step": 329} +{"info/global_step": 330, "train_info/time_within_train_step": 2.6700241565704346, "step": 330} +{"train_info/time_between_train_steps": 0.0035343170166015625, "step": 330} +{"info/global_step": 331, "train_info/time_within_train_step": 2.6758127212524414, "step": 331} +{"train_info/time_between_train_steps": 0.0034482479095458984, "step": 331} +{"info/global_step": 332, "train_info/time_within_train_step": 2.675473690032959, "step": 332} +{"train_info/time_between_train_steps": 0.003732442855834961, "step": 332} +{"info/global_step": 333, "train_info/time_within_train_step": 2.672105073928833, "step": 333} +{"train_info/time_between_train_steps": 0.003720998764038086, "step": 333} +{"info/global_step": 334, "train_info/time_within_train_step": 2.6704416275024414, "step": 334} +{"train_info/time_between_train_steps": 0.0036356449127197266, "step": 334} +{"info/global_step": 335, "train_info/time_within_train_step": 2.6753711700439453, "step": 335} +{"train_info/time_between_train_steps": 0.003658771514892578, "step": 335} +{"info/global_step": 336, "train_info/time_within_train_step": 2.671926736831665, "step": 336} +{"train_info/time_between_train_steps": 0.0036542415618896484, "step": 336} +{"info/global_step": 337, "train_info/time_within_train_step": 2.6719844341278076, "step": 337} +{"train_info/time_between_train_steps": 0.0036039352416992188, "step": 337} +{"info/global_step": 338, "train_info/time_within_train_step": 2.6719956398010254, "step": 338} +{"train_info/time_between_train_steps": 0.0036077499389648438, "step": 338} +{"info/global_step": 339, "train_info/time_within_train_step": 2.672581672668457, "step": 339} +{"train_info/time_between_train_steps": 0.003535032272338867, "step": 339} +{"info/global_step": 340, "train_info/time_within_train_step": 2.6726152896881104, "step": 340} +{"train_info/time_between_train_steps": 0.0036094188690185547, "step": 340} +{"info/global_step": 341, "train_info/time_within_train_step": 2.67106032371521, "step": 341} +{"train_info/time_between_train_steps": 0.0036611557006835938, "step": 341} +{"info/global_step": 342, "train_info/time_within_train_step": 2.671043872833252, "step": 342} +{"train_info/time_between_train_steps": 0.003551483154296875, "step": 342} +{"info/global_step": 343, "train_info/time_within_train_step": 2.671152353286743, "step": 343} +{"train_info/time_between_train_steps": 0.0037050247192382812, "step": 343} +{"info/global_step": 344, "train_info/time_within_train_step": 2.6706151962280273, "step": 344} +{"train_info/time_between_train_steps": 0.003567218780517578, "step": 344} +{"info/global_step": 345, "train_info/time_within_train_step": 2.6706225872039795, "step": 345} +{"train_info/time_between_train_steps": 0.0035505294799804688, "step": 345} +{"info/global_step": 346, "train_info/time_within_train_step": 2.670076608657837, "step": 346} +{"train_info/time_between_train_steps": 0.0036554336547851562, "step": 346} +{"info/global_step": 347, "train_info/time_within_train_step": 2.670319080352783, "step": 347} +{"train_info/time_between_train_steps": 0.003571748733520508, "step": 347} +{"info/global_step": 348, "train_info/time_within_train_step": 2.669877767562866, "step": 348} +{"train_info/time_between_train_steps": 0.00353240966796875, "step": 348} +{"info/global_step": 349, "train_info/time_within_train_step": 2.670729398727417, "step": 349} +{"train_info/time_between_train_steps": 0.0035986900329589844, "step": 349} +{"info/global_step": 350, "train_info/time_within_train_step": 2.671603202819824, "step": 350} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746204241, "_runtime": 1013}, "step": 350} +{"logs": {"train/loss": 5.5178, "train/learning_rate": 0.0005888888888888889, "train/epoch": 0.12, "_timestamp": 1746204241, "_runtime": 1013}, "step": 350} +{"train_info/time_between_train_steps": 0.024843215942382812, "step": 350} +{"info/global_step": 351, "train_info/time_within_train_step": 2.6710774898529053, "step": 351} +{"train_info/time_between_train_steps": 0.0035772323608398438, "step": 351} +{"info/global_step": 352, "train_info/time_within_train_step": 2.6707050800323486, "step": 352} +{"train_info/time_between_train_steps": 0.0035920143127441406, "step": 352} +{"info/global_step": 353, "train_info/time_within_train_step": 2.6711249351501465, "step": 353} +{"train_info/time_between_train_steps": 0.0036270618438720703, "step": 353} +{"info/global_step": 354, "train_info/time_within_train_step": 2.6705429553985596, "step": 354} +{"train_info/time_between_train_steps": 0.0035805702209472656, "step": 354} +{"info/global_step": 355, "train_info/time_within_train_step": 2.6693830490112305, "step": 355} +{"train_info/time_between_train_steps": 0.003545045852661133, "step": 355} +{"info/global_step": 356, "train_info/time_within_train_step": 2.6697590351104736, "step": 356} +{"train_info/time_between_train_steps": 0.003829479217529297, "step": 356} +{"info/global_step": 357, "train_info/time_within_train_step": 2.6707441806793213, "step": 357} +{"train_info/time_between_train_steps": 0.0035905838012695312, "step": 357} +{"info/global_step": 358, "train_info/time_within_train_step": 2.67039155960083, "step": 358} +{"train_info/time_between_train_steps": 0.003652811050415039, "step": 358} +{"info/global_step": 359, "train_info/time_within_train_step": 2.692997694015503, "step": 359} +{"train_info/time_between_train_steps": 0.0035839080810546875, "step": 359} +{"info/global_step": 360, "train_info/time_within_train_step": 2.6704773902893066, "step": 360} +{"train_info/time_between_train_steps": 0.003624439239501953, "step": 360} +{"info/global_step": 361, "train_info/time_within_train_step": 2.669480562210083, "step": 361} +{"train_info/time_between_train_steps": 0.003538370132446289, "step": 361} +{"info/global_step": 362, "train_info/time_within_train_step": 2.6706840991973877, "step": 362} +{"train_info/time_between_train_steps": 0.0036590099334716797, "step": 362} +{"info/global_step": 363, "train_info/time_within_train_step": 2.6707820892333984, "step": 363} +{"train_info/time_between_train_steps": 0.0035927295684814453, "step": 363} +{"info/global_step": 364, "train_info/time_within_train_step": 2.6725919246673584, "step": 364} +{"train_info/time_between_train_steps": 0.0035440921783447266, "step": 364} +{"info/global_step": 365, "train_info/time_within_train_step": 2.6711926460266113, "step": 365} +{"train_info/time_between_train_steps": 0.0035126209259033203, "step": 365} +{"info/global_step": 366, "train_info/time_within_train_step": 2.671330690383911, "step": 366} +{"train_info/time_between_train_steps": 0.0035316944122314453, "step": 366} +{"info/global_step": 367, "train_info/time_within_train_step": 2.671454429626465, "step": 367} +{"train_info/time_between_train_steps": 0.0035429000854492188, "step": 367} +{"info/global_step": 368, "train_info/time_within_train_step": 2.670044183731079, "step": 368} +{"train_info/time_between_train_steps": 0.003532886505126953, "step": 368} +{"info/global_step": 369, "train_info/time_within_train_step": 2.6706182956695557, "step": 369} +{"train_info/time_between_train_steps": 0.003802776336669922, "step": 369} +{"info/global_step": 370, "train_info/time_within_train_step": 2.670461416244507, "step": 370} +{"train_info/time_between_train_steps": 0.0035517215728759766, "step": 370} +{"info/global_step": 371, "train_info/time_within_train_step": 2.669644832611084, "step": 371} +{"train_info/time_between_train_steps": 0.0035142898559570312, "step": 371} +{"info/global_step": 372, "train_info/time_within_train_step": 2.6720192432403564, "step": 372} +{"train_info/time_between_train_steps": 0.0035817623138427734, "step": 372} +{"info/global_step": 373, "train_info/time_within_train_step": 2.6708123683929443, "step": 373} +{"train_info/time_between_train_steps": 0.003564119338989258, "step": 373} +{"info/global_step": 374, "train_info/time_within_train_step": 2.669966459274292, "step": 374} +{"train_info/time_between_train_steps": 0.003582477569580078, "step": 374} +{"info/global_step": 375, "train_info/time_within_train_step": 2.670438766479492, "step": 375} +{"train_info/time_between_train_steps": 0.15409636497497559, "step": 375} +{"info/global_step": 376, "train_info/time_within_train_step": 2.6698849201202393, "step": 376} +{"train_info/time_between_train_steps": 0.0034317970275878906, "step": 376} +{"info/global_step": 377, "train_info/time_within_train_step": 2.670729398727417, "step": 377} +{"train_info/time_between_train_steps": 0.003374814987182617, "step": 377} +{"info/global_step": 378, "train_info/time_within_train_step": 2.6707916259765625, "step": 378} +{"train_info/time_between_train_steps": 0.003413677215576172, "step": 378} +{"info/global_step": 379, "train_info/time_within_train_step": 2.6706974506378174, "step": 379} +{"train_info/time_between_train_steps": 0.003392934799194336, "step": 379} +{"info/global_step": 380, "train_info/time_within_train_step": 2.6706414222717285, "step": 380} +{"train_info/time_between_train_steps": 0.0034618377685546875, "step": 380} +{"info/global_step": 381, "train_info/time_within_train_step": 2.6708590984344482, "step": 381} +{"train_info/time_between_train_steps": 0.0033826828002929688, "step": 381} +{"info/global_step": 382, "train_info/time_within_train_step": 2.672121286392212, "step": 382} +{"train_info/time_between_train_steps": 0.0034949779510498047, "step": 382} +{"info/global_step": 383, "train_info/time_within_train_step": 2.6723616123199463, "step": 383} +{"train_info/time_between_train_steps": 0.003423452377319336, "step": 383} +{"info/global_step": 384, "train_info/time_within_train_step": 2.669729471206665, "step": 384} +{"train_info/time_between_train_steps": 0.003316164016723633, "step": 384} +{"info/global_step": 385, "train_info/time_within_train_step": 2.6732754707336426, "step": 385} +{"train_info/time_between_train_steps": 0.003370046615600586, "step": 385} +{"info/global_step": 386, "train_info/time_within_train_step": 2.672959327697754, "step": 386} +{"train_info/time_between_train_steps": 0.003676891326904297, "step": 386} +{"info/global_step": 387, "train_info/time_within_train_step": 2.672390937805176, "step": 387} +{"train_info/time_between_train_steps": 0.0034439563751220703, "step": 387} +{"info/global_step": 388, "train_info/time_within_train_step": 2.672974109649658, "step": 388} +{"train_info/time_between_train_steps": 0.0034279823303222656, "step": 388} +{"info/global_step": 389, "train_info/time_within_train_step": 2.6722252368927, "step": 389} +{"train_info/time_between_train_steps": 0.003439664840698242, "step": 389} +{"info/global_step": 390, "train_info/time_within_train_step": 2.672436475753784, "step": 390} +{"train_info/time_between_train_steps": 0.0034508705139160156, "step": 390} +{"info/global_step": 391, "train_info/time_within_train_step": 2.6714706420898438, "step": 391} +{"train_info/time_between_train_steps": 0.003439664840698242, "step": 391} +{"info/global_step": 392, "train_info/time_within_train_step": 2.672456741333008, "step": 392} +{"train_info/time_between_train_steps": 0.0034415721893310547, "step": 392} +{"info/global_step": 393, "train_info/time_within_train_step": 2.671206474304199, "step": 393} +{"train_info/time_between_train_steps": 0.0034148693084716797, "step": 393} +{"info/global_step": 394, "train_info/time_within_train_step": 2.672351598739624, "step": 394} +{"train_info/time_between_train_steps": 0.0033919811248779297, "step": 394} +{"info/global_step": 395, "train_info/time_within_train_step": 2.6717135906219482, "step": 395} +{"train_info/time_between_train_steps": 0.003439664840698242, "step": 395} +{"info/global_step": 396, "train_info/time_within_train_step": 2.670243978500366, "step": 396} +{"train_info/time_between_train_steps": 0.0033960342407226562, "step": 396} +{"info/global_step": 397, "train_info/time_within_train_step": 2.6716248989105225, "step": 397} +{"train_info/time_between_train_steps": 0.003429889678955078, "step": 397} +{"info/global_step": 398, "train_info/time_within_train_step": 2.676309108734131, "step": 398} +{"train_info/time_between_train_steps": 0.0034236907958984375, "step": 398} +{"info/global_step": 399, "train_info/time_within_train_step": 2.677645444869995, "step": 399} +{"train_info/time_between_train_steps": 0.0034744739532470703, "step": 399} +{"info/global_step": 400, "train_info/time_within_train_step": 2.670508861541748, "step": 400} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746204376, "_runtime": 1148}, "step": 400} +{"logs": {"train/loss": 5.4384, "train/learning_rate": 0.0005777777777777776, "train/epoch": 0.13, "_timestamp": 1746204376, "_runtime": 1148}, "step": 400} +{"train_info/time_between_train_steps": 46.280723571777344, "step": 400} +{"info/global_step": 401, "train_info/time_within_train_step": 2.4803361892700195, "step": 401} +{"train_info/time_between_train_steps": 0.003464937210083008, "step": 401} +{"info/global_step": 402, "train_info/time_within_train_step": 2.7947778701782227, "step": 402} +{"train_info/time_between_train_steps": 0.0033712387084960938, "step": 402} +{"info/global_step": 403, "train_info/time_within_train_step": 2.4614548683166504, "step": 403} +{"train_info/time_between_train_steps": 0.00345611572265625, "step": 403} +{"info/global_step": 404, "train_info/time_within_train_step": 2.488615036010742, "step": 404} +{"train_info/time_between_train_steps": 0.0033905506134033203, "step": 404} +{"info/global_step": 405, "train_info/time_within_train_step": 2.6626458168029785, "step": 405} +{"train_info/time_between_train_steps": 0.003396749496459961, "step": 405} +{"info/global_step": 406, "train_info/time_within_train_step": 2.6659531593322754, "step": 406} +{"train_info/time_between_train_steps": 0.0034432411193847656, "step": 406} +{"info/global_step": 407, "train_info/time_within_train_step": 2.6731648445129395, "step": 407} +{"train_info/time_between_train_steps": 0.003409147262573242, "step": 407} +{"info/global_step": 408, "train_info/time_within_train_step": 2.6759698390960693, "step": 408} +{"train_info/time_between_train_steps": 0.003446817398071289, "step": 408} +{"info/global_step": 409, "train_info/time_within_train_step": 2.6774535179138184, "step": 409} +{"train_info/time_between_train_steps": 0.003438711166381836, "step": 409} +{"info/global_step": 410, "train_info/time_within_train_step": 2.6786463260650635, "step": 410} +{"train_info/time_between_train_steps": 0.003811359405517578, "step": 410} +{"info/global_step": 411, "train_info/time_within_train_step": 2.677783966064453, "step": 411} +{"train_info/time_between_train_steps": 0.003856658935546875, "step": 411} +{"info/global_step": 412, "train_info/time_within_train_step": 2.678684949874878, "step": 412} +{"train_info/time_between_train_steps": 0.003695249557495117, "step": 412} +{"info/global_step": 413, "train_info/time_within_train_step": 2.6770174503326416, "step": 413} +{"train_info/time_between_train_steps": 0.003719806671142578, "step": 413} +{"info/global_step": 414, "train_info/time_within_train_step": 2.677213191986084, "step": 414} +{"train_info/time_between_train_steps": 0.0037987232208251953, "step": 414} +{"info/global_step": 415, "train_info/time_within_train_step": 2.6764349937438965, "step": 415} +{"train_info/time_between_train_steps": 0.003728151321411133, "step": 415} +{"info/global_step": 416, "train_info/time_within_train_step": 2.680449962615967, "step": 416} +{"train_info/time_between_train_steps": 0.0038094520568847656, "step": 416} +{"info/global_step": 417, "train_info/time_within_train_step": 2.6750988960266113, "step": 417} +{"train_info/time_between_train_steps": 0.0037131309509277344, "step": 417} +{"info/global_step": 418, "train_info/time_within_train_step": 2.676668405532837, "step": 418} +{"train_info/time_between_train_steps": 0.0038051605224609375, "step": 418} +{"info/global_step": 419, "train_info/time_within_train_step": 2.6773555278778076, "step": 419} +{"train_info/time_between_train_steps": 0.0037736892700195312, "step": 419} +{"info/global_step": 420, "train_info/time_within_train_step": 2.6778206825256348, "step": 420} +{"train_info/time_between_train_steps": 0.003751993179321289, "step": 420} +{"info/global_step": 421, "train_info/time_within_train_step": 2.676764488220215, "step": 421} +{"train_info/time_between_train_steps": 0.003724336624145508, "step": 421} +{"info/global_step": 422, "train_info/time_within_train_step": 2.6753034591674805, "step": 422} +{"train_info/time_between_train_steps": 0.003809690475463867, "step": 422} +{"info/global_step": 423, "train_info/time_within_train_step": 2.6761462688446045, "step": 423} +{"train_info/time_between_train_steps": 0.003814697265625, "step": 423} +{"info/global_step": 424, "train_info/time_within_train_step": 2.6761550903320312, "step": 424} +{"train_info/time_between_train_steps": 0.003725767135620117, "step": 424} +{"info/global_step": 425, "train_info/time_within_train_step": 2.6756722927093506, "step": 425} +{"train_info/time_between_train_steps": 0.003716707229614258, "step": 425} +{"info/global_step": 426, "train_info/time_within_train_step": 2.6769611835479736, "step": 426} +{"train_info/time_between_train_steps": 0.003690481185913086, "step": 426} +{"info/global_step": 427, "train_info/time_within_train_step": 2.6784398555755615, "step": 427} +{"train_info/time_between_train_steps": 0.003776073455810547, "step": 427} +{"info/global_step": 428, "train_info/time_within_train_step": 2.676312208175659, "step": 428} +{"train_info/time_between_train_steps": 0.007226705551147461, "step": 428} +{"info/global_step": 429, "train_info/time_within_train_step": 2.675996780395508, "step": 429} +{"train_info/time_between_train_steps": 0.0037267208099365234, "step": 429} +{"info/global_step": 430, "train_info/time_within_train_step": 2.677185535430908, "step": 430} +{"train_info/time_between_train_steps": 0.0037539005279541016, "step": 430} +{"info/global_step": 431, "train_info/time_within_train_step": 2.6782567501068115, "step": 431} +{"train_info/time_between_train_steps": 0.0037648677825927734, "step": 431} +{"info/global_step": 432, "train_info/time_within_train_step": 2.6765458583831787, "step": 432} +{"train_info/time_between_train_steps": 0.0036890506744384766, "step": 432} +{"info/global_step": 433, "train_info/time_within_train_step": 2.6781346797943115, "step": 433} +{"train_info/time_between_train_steps": 0.0037353038787841797, "step": 433} +{"info/global_step": 434, "train_info/time_within_train_step": 2.677184820175171, "step": 434} +{"train_info/time_between_train_steps": 0.0037555694580078125, "step": 434} +{"info/global_step": 435, "train_info/time_within_train_step": 2.6770694255828857, "step": 435} +{"train_info/time_between_train_steps": 0.0037102699279785156, "step": 435} +{"info/global_step": 436, "train_info/time_within_train_step": 2.6771111488342285, "step": 436} +{"train_info/time_between_train_steps": 0.003756999969482422, "step": 436} +{"info/global_step": 437, "train_info/time_within_train_step": 2.6765286922454834, "step": 437} +{"train_info/time_between_train_steps": 0.0036971569061279297, "step": 437} +{"info/global_step": 438, "train_info/time_within_train_step": 2.874352216720581, "step": 438} +{"train_info/time_between_train_steps": 0.003530740737915039, "step": 438} +{"info/global_step": 439, "train_info/time_within_train_step": 2.675447702407837, "step": 439} +{"train_info/time_between_train_steps": 0.003503561019897461, "step": 439} +{"info/global_step": 440, "train_info/time_within_train_step": 2.675344228744507, "step": 440} +{"train_info/time_between_train_steps": 0.0035686492919921875, "step": 440} +{"info/global_step": 441, "train_info/time_within_train_step": 2.6749019622802734, "step": 441} +{"train_info/time_between_train_steps": 0.0036895275115966797, "step": 441} +{"info/global_step": 442, "train_info/time_within_train_step": 2.677124261856079, "step": 442} +{"train_info/time_between_train_steps": 0.0035250186920166016, "step": 442} +{"info/global_step": 443, "train_info/time_within_train_step": 2.679821491241455, "step": 443} +{"train_info/time_between_train_steps": 0.0036797523498535156, "step": 443} +{"info/global_step": 444, "train_info/time_within_train_step": 2.675724983215332, "step": 444} +{"train_info/time_between_train_steps": 0.003751039505004883, "step": 444} +{"info/global_step": 445, "train_info/time_within_train_step": 2.6763381958007812, "step": 445} +{"train_info/time_between_train_steps": 0.0037393569946289062, "step": 445} +{"info/global_step": 446, "train_info/time_within_train_step": 2.6774230003356934, "step": 446} +{"train_info/time_between_train_steps": 0.003807544708251953, "step": 446} +{"info/global_step": 447, "train_info/time_within_train_step": 2.6759755611419678, "step": 447} +{"train_info/time_between_train_steps": 0.003734111785888672, "step": 447} +{"info/global_step": 448, "train_info/time_within_train_step": 2.6825759410858154, "step": 448} +{"train_info/time_between_train_steps": 0.003758668899536133, "step": 448} +{"info/global_step": 449, "train_info/time_within_train_step": 2.677807092666626, "step": 449} +{"train_info/time_between_train_steps": 0.0037660598754882812, "step": 449} +{"info/global_step": 450, "train_info/time_within_train_step": 2.676722526550293, "step": 450} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746204557, "_runtime": 1329}, "step": 450} +{"logs": {"train/loss": 5.3367, "train/learning_rate": 0.0005666666666666666, "train/epoch": 0.15, "_timestamp": 1746204557, "_runtime": 1329}, "step": 450} +{"train_info/time_between_train_steps": 0.024589061737060547, "step": 450} +{"info/global_step": 451, "train_info/time_within_train_step": 2.6752891540527344, "step": 451} +{"train_info/time_between_train_steps": 0.0037491321563720703, "step": 451} +{"info/global_step": 452, "train_info/time_within_train_step": 2.6761972904205322, "step": 452} +{"train_info/time_between_train_steps": 0.0037391185760498047, "step": 452} +{"info/global_step": 453, "train_info/time_within_train_step": 2.6765220165252686, "step": 453} +{"train_info/time_between_train_steps": 0.0037021636962890625, "step": 453} +{"info/global_step": 454, "train_info/time_within_train_step": 2.6753666400909424, "step": 454} +{"train_info/time_between_train_steps": 0.003697633743286133, "step": 454} +{"info/global_step": 455, "train_info/time_within_train_step": 2.676417827606201, "step": 455} +{"train_info/time_between_train_steps": 0.0036721229553222656, "step": 455} +{"info/global_step": 456, "train_info/time_within_train_step": 2.675852060317993, "step": 456} +{"train_info/time_between_train_steps": 0.0037102699279785156, "step": 456} +{"info/global_step": 457, "train_info/time_within_train_step": 2.6761560440063477, "step": 457} +{"train_info/time_between_train_steps": 0.003704071044921875, "step": 457} +{"info/global_step": 458, "train_info/time_within_train_step": 2.6756274700164795, "step": 458} +{"train_info/time_between_train_steps": 0.007248878479003906, "step": 458} +{"info/global_step": 459, "train_info/time_within_train_step": 2.674530267715454, "step": 459} +{"train_info/time_between_train_steps": 0.0037076473236083984, "step": 459} +{"info/global_step": 460, "train_info/time_within_train_step": 2.676335096359253, "step": 460} +{"train_info/time_between_train_steps": 0.0036475658416748047, "step": 460} +{"info/global_step": 461, "train_info/time_within_train_step": 2.67490291595459, "step": 461} +{"train_info/time_between_train_steps": 0.0036699771881103516, "step": 461} +{"info/global_step": 462, "train_info/time_within_train_step": 2.674426317214966, "step": 462} +{"train_info/time_between_train_steps": 0.003699064254760742, "step": 462} +{"info/global_step": 463, "train_info/time_within_train_step": 2.6752655506134033, "step": 463} +{"train_info/time_between_train_steps": 0.003708362579345703, "step": 463} +{"info/global_step": 464, "train_info/time_within_train_step": 2.67500376701355, "step": 464} +{"train_info/time_between_train_steps": 0.0036776065826416016, "step": 464} +{"info/global_step": 465, "train_info/time_within_train_step": 2.6754415035247803, "step": 465} +{"train_info/time_between_train_steps": 0.0036787986755371094, "step": 465} +{"info/global_step": 466, "train_info/time_within_train_step": 2.6754541397094727, "step": 466} +{"train_info/time_between_train_steps": 0.003735065460205078, "step": 466} +{"info/global_step": 467, "train_info/time_within_train_step": 2.675997734069824, "step": 467} +{"train_info/time_between_train_steps": 0.0037038326263427734, "step": 467} +{"info/global_step": 468, "train_info/time_within_train_step": 2.675206184387207, "step": 468} +{"train_info/time_between_train_steps": 0.007246971130371094, "step": 468} +{"info/global_step": 469, "train_info/time_within_train_step": 2.6740221977233887, "step": 469} +{"train_info/time_between_train_steps": 0.007172822952270508, "step": 469} +{"info/global_step": 470, "train_info/time_within_train_step": 2.6761181354522705, "step": 470} +{"train_info/time_between_train_steps": 0.0072345733642578125, "step": 470} +{"info/global_step": 471, "train_info/time_within_train_step": 2.677356243133545, "step": 471} +{"train_info/time_between_train_steps": 0.0072019100189208984, "step": 471} +{"info/global_step": 472, "train_info/time_within_train_step": 2.6764700412750244, "step": 472} +{"train_info/time_between_train_steps": 0.007198333740234375, "step": 472} +{"info/global_step": 473, "train_info/time_within_train_step": 2.6760847568511963, "step": 473} +{"train_info/time_between_train_steps": 0.007310628890991211, "step": 473} +{"info/global_step": 474, "train_info/time_within_train_step": 2.6761369705200195, "step": 474} +{"train_info/time_between_train_steps": 0.007227182388305664, "step": 474} +{"info/global_step": 475, "train_info/time_within_train_step": 2.6756865978240967, "step": 475} +{"train_info/time_between_train_steps": 0.0036165714263916016, "step": 475} +{"info/global_step": 476, "train_info/time_within_train_step": 2.6764376163482666, "step": 476} +{"train_info/time_between_train_steps": 0.003682851791381836, "step": 476} +{"info/global_step": 477, "train_info/time_within_train_step": 2.676013708114624, "step": 477} +{"train_info/time_between_train_steps": 0.0036063194274902344, "step": 477} +{"info/global_step": 478, "train_info/time_within_train_step": 2.676358938217163, "step": 478} +{"train_info/time_between_train_steps": 0.0037453174591064453, "step": 478} +{"info/global_step": 479, "train_info/time_within_train_step": 2.675750494003296, "step": 479} +{"train_info/time_between_train_steps": 0.003664255142211914, "step": 479} +{"info/global_step": 480, "train_info/time_within_train_step": 2.6766674518585205, "step": 480} +{"train_info/time_between_train_steps": 0.0037474632263183594, "step": 480} +{"info/global_step": 481, "train_info/time_within_train_step": 2.675518035888672, "step": 481} +{"train_info/time_between_train_steps": 0.0036385059356689453, "step": 481} +{"info/global_step": 482, "train_info/time_within_train_step": 2.676628351211548, "step": 482} +{"train_info/time_between_train_steps": 0.003624439239501953, "step": 482} +{"info/global_step": 483, "train_info/time_within_train_step": 2.676603317260742, "step": 483} +{"train_info/time_between_train_steps": 0.0037355422973632812, "step": 483} +{"info/global_step": 484, "train_info/time_within_train_step": 2.6769001483917236, "step": 484} +{"train_info/time_between_train_steps": 0.0037055015563964844, "step": 484} +{"info/global_step": 485, "train_info/time_within_train_step": 3.0401411056518555, "step": 485} +{"train_info/time_between_train_steps": 0.0033948421478271484, "step": 485} +{"info/global_step": 486, "train_info/time_within_train_step": 2.6751744747161865, "step": 486} +{"train_info/time_between_train_steps": 0.003366231918334961, "step": 486} +{"info/global_step": 487, "train_info/time_within_train_step": 2.6747348308563232, "step": 487} +{"train_info/time_between_train_steps": 0.003392934799194336, "step": 487} +{"info/global_step": 488, "train_info/time_within_train_step": 2.6750452518463135, "step": 488} +{"train_info/time_between_train_steps": 0.0034232139587402344, "step": 488} +{"info/global_step": 489, "train_info/time_within_train_step": 2.67486834526062, "step": 489} +{"train_info/time_between_train_steps": 0.0034661293029785156, "step": 489} +{"info/global_step": 490, "train_info/time_within_train_step": 2.6744585037231445, "step": 490} +{"train_info/time_between_train_steps": 0.003399372100830078, "step": 490} +{"info/global_step": 491, "train_info/time_within_train_step": 2.6746041774749756, "step": 491} +{"train_info/time_between_train_steps": 0.0037550926208496094, "step": 491} +{"info/global_step": 492, "train_info/time_within_train_step": 2.6739883422851562, "step": 492} +{"train_info/time_between_train_steps": 0.003420591354370117, "step": 492} +{"info/global_step": 493, "train_info/time_within_train_step": 2.6747655868530273, "step": 493} +{"train_info/time_between_train_steps": 0.0033826828002929688, "step": 493} +{"info/global_step": 494, "train_info/time_within_train_step": 2.6758227348327637, "step": 494} +{"train_info/time_between_train_steps": 0.0035238265991210938, "step": 494} +{"info/global_step": 495, "train_info/time_within_train_step": 2.6737611293792725, "step": 495} +{"train_info/time_between_train_steps": 0.003448009490966797, "step": 495} +{"info/global_step": 496, "train_info/time_within_train_step": 2.674922227859497, "step": 496} +{"train_info/time_between_train_steps": 0.0034265518188476562, "step": 496} +{"info/global_step": 497, "train_info/time_within_train_step": 2.6740541458129883, "step": 497} +{"train_info/time_between_train_steps": 0.0033974647521972656, "step": 497} +{"info/global_step": 498, "train_info/time_within_train_step": 2.6755592823028564, "step": 498} +{"train_info/time_between_train_steps": 0.003365755081176758, "step": 498} +{"info/global_step": 499, "train_info/time_within_train_step": 2.675001382827759, "step": 499} +{"train_info/time_between_train_steps": 0.003412485122680664, "step": 499} +{"info/global_step": 500, "train_info/time_within_train_step": 3.1909847259521484, "step": 500} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746204693, "_runtime": 1465}, "step": 500} +{"logs": {"train/loss": 5.2267, "train/learning_rate": 0.0005555555555555556, "train/epoch": 0.17, "_timestamp": 1746204693, "_runtime": 1465}, "step": 500} +{"train_info/time_between_train_steps": 13.318114995956421, "step": 500} +{"info/global_step": 501, "train_info/time_within_train_step": 2.4699671268463135, "step": 501} +{"train_info/time_between_train_steps": 0.003452777862548828, "step": 501} +{"info/global_step": 502, "train_info/time_within_train_step": 2.45778751373291, "step": 502} +{"train_info/time_between_train_steps": 0.0034356117248535156, "step": 502} +{"info/global_step": 503, "train_info/time_within_train_step": 2.4925310611724854, "step": 503} +{"train_info/time_between_train_steps": 0.0034003257751464844, "step": 503} +{"info/global_step": 504, "train_info/time_within_train_step": 2.659635066986084, "step": 504} +{"train_info/time_between_train_steps": 0.0033941268920898438, "step": 504} +{"info/global_step": 505, "train_info/time_within_train_step": 2.6722819805145264, "step": 505} +{"train_info/time_between_train_steps": 0.0034601688385009766, "step": 505} +{"info/global_step": 506, "train_info/time_within_train_step": 2.672679901123047, "step": 506} +{"train_info/time_between_train_steps": 0.003419637680053711, "step": 506} +{"info/global_step": 507, "train_info/time_within_train_step": 2.6737492084503174, "step": 507} +{"train_info/time_between_train_steps": 0.0034563541412353516, "step": 507} +{"info/global_step": 508, "train_info/time_within_train_step": 2.6745548248291016, "step": 508} +{"train_info/time_between_train_steps": 0.0034596920013427734, "step": 508} +{"info/global_step": 509, "train_info/time_within_train_step": 2.6758484840393066, "step": 509} +{"train_info/time_between_train_steps": 0.003411531448364258, "step": 509} +{"info/global_step": 510, "train_info/time_within_train_step": 2.675152063369751, "step": 510} +{"train_info/time_between_train_steps": 0.003397226333618164, "step": 510} +{"info/global_step": 511, "train_info/time_within_train_step": 2.6756505966186523, "step": 511} +{"train_info/time_between_train_steps": 0.0034313201904296875, "step": 511} +{"info/global_step": 512, "train_info/time_within_train_step": 2.67876935005188, "step": 512} +{"train_info/time_between_train_steps": 0.0034008026123046875, "step": 512} +{"info/global_step": 513, "train_info/time_within_train_step": 2.675258159637451, "step": 513} +{"train_info/time_between_train_steps": 0.0034322738647460938, "step": 513} +{"info/global_step": 514, "train_info/time_within_train_step": 2.6764349937438965, "step": 514} +{"train_info/time_between_train_steps": 0.003419160842895508, "step": 514} +{"info/global_step": 515, "train_info/time_within_train_step": 2.675384998321533, "step": 515} +{"train_info/time_between_train_steps": 0.003368854522705078, "step": 515} +{"info/global_step": 516, "train_info/time_within_train_step": 2.675962209701538, "step": 516} +{"train_info/time_between_train_steps": 0.003596782684326172, "step": 516} +{"info/global_step": 517, "train_info/time_within_train_step": 2.6752705574035645, "step": 517} +{"train_info/time_between_train_steps": 0.0033648014068603516, "step": 517} +{"info/global_step": 518, "train_info/time_within_train_step": 2.6757149696350098, "step": 518} +{"train_info/time_between_train_steps": 0.0034637451171875, "step": 518} +{"info/global_step": 519, "train_info/time_within_train_step": 2.673881769180298, "step": 519} +{"train_info/time_between_train_steps": 0.003371000289916992, "step": 519} +{"info/global_step": 520, "train_info/time_within_train_step": 2.6734795570373535, "step": 520} +{"train_info/time_between_train_steps": 0.0034422874450683594, "step": 520} +{"info/global_step": 521, "train_info/time_within_train_step": 2.6756443977355957, "step": 521} +{"train_info/time_between_train_steps": 0.003506898880004883, "step": 521} +{"info/global_step": 522, "train_info/time_within_train_step": 2.6778769493103027, "step": 522} +{"train_info/time_between_train_steps": 0.0037300586700439453, "step": 522} +{"info/global_step": 523, "train_info/time_within_train_step": 2.6765096187591553, "step": 523} +{"train_info/time_between_train_steps": 0.0036280155181884766, "step": 523} +{"info/global_step": 524, "train_info/time_within_train_step": 2.6767783164978027, "step": 524} +{"train_info/time_between_train_steps": 0.003634214401245117, "step": 524} +{"info/global_step": 525, "train_info/time_within_train_step": 2.675469398498535, "step": 525} +{"train_info/time_between_train_steps": 0.003598928451538086, "step": 525} +{"info/global_step": 526, "train_info/time_within_train_step": 2.6758573055267334, "step": 526} +{"train_info/time_between_train_steps": 0.0036127567291259766, "step": 526} +{"info/global_step": 527, "train_info/time_within_train_step": 3.024137258529663, "step": 527} +{"train_info/time_between_train_steps": 0.0033750534057617188, "step": 527} +{"info/global_step": 528, "train_info/time_within_train_step": 2.6739044189453125, "step": 528} +{"train_info/time_between_train_steps": 0.003442525863647461, "step": 528} +{"info/global_step": 529, "train_info/time_within_train_step": 2.6856725215911865, "step": 529} +{"train_info/time_between_train_steps": 0.003384828567504883, "step": 529} +{"info/global_step": 530, "train_info/time_within_train_step": 2.7077338695526123, "step": 530} +{"train_info/time_between_train_steps": 0.003374814987182617, "step": 530} +{"info/global_step": 531, "train_info/time_within_train_step": 2.674852132797241, "step": 531} +{"train_info/time_between_train_steps": 0.003368854522705078, "step": 531} +{"info/global_step": 532, "train_info/time_within_train_step": 2.678905963897705, "step": 532} +{"train_info/time_between_train_steps": 0.003993511199951172, "step": 532} +{"info/global_step": 533, "train_info/time_within_train_step": 2.674774169921875, "step": 533} +{"train_info/time_between_train_steps": 0.003386259078979492, "step": 533} +{"info/global_step": 534, "train_info/time_within_train_step": 2.674539566040039, "step": 534} +{"train_info/time_between_train_steps": 0.003379344940185547, "step": 534} +{"info/global_step": 535, "train_info/time_within_train_step": 2.6730525493621826, "step": 535} +{"train_info/time_between_train_steps": 0.0034224987030029297, "step": 535} +{"info/global_step": 536, "train_info/time_within_train_step": 2.6739611625671387, "step": 536} +{"train_info/time_between_train_steps": 0.0033898353576660156, "step": 536} +{"info/global_step": 537, "train_info/time_within_train_step": 2.674569845199585, "step": 537} +{"train_info/time_between_train_steps": 0.0035512447357177734, "step": 537} +{"info/global_step": 538, "train_info/time_within_train_step": 2.6749773025512695, "step": 538} +{"train_info/time_between_train_steps": 0.0033638477325439453, "step": 538} +{"info/global_step": 539, "train_info/time_within_train_step": 2.674048662185669, "step": 539} +{"train_info/time_between_train_steps": 0.003432750701904297, "step": 539} +{"info/global_step": 540, "train_info/time_within_train_step": 2.674685001373291, "step": 540} +{"train_info/time_between_train_steps": 0.0034487247467041016, "step": 540} +{"info/global_step": 541, "train_info/time_within_train_step": 2.6747350692749023, "step": 541} +{"train_info/time_between_train_steps": 0.0034139156341552734, "step": 541} +{"info/global_step": 542, "train_info/time_within_train_step": 2.6744277477264404, "step": 542} +{"train_info/time_between_train_steps": 0.0034017562866210938, "step": 542} +{"info/global_step": 543, "train_info/time_within_train_step": 2.674375057220459, "step": 543} +{"train_info/time_between_train_steps": 0.0034453868865966797, "step": 543} +{"info/global_step": 544, "train_info/time_within_train_step": 2.6753575801849365, "step": 544} +{"train_info/time_between_train_steps": 0.003401517868041992, "step": 544} +{"info/global_step": 545, "train_info/time_within_train_step": 2.6753878593444824, "step": 545} +{"train_info/time_between_train_steps": 0.0033838748931884766, "step": 545} +{"info/global_step": 546, "train_info/time_within_train_step": 2.679170846939087, "step": 546} +{"train_info/time_between_train_steps": 0.003393888473510742, "step": 546} +{"info/global_step": 547, "train_info/time_within_train_step": 2.6744441986083984, "step": 547} +{"train_info/time_between_train_steps": 0.0033669471740722656, "step": 547} +{"info/global_step": 548, "train_info/time_within_train_step": 2.6745057106018066, "step": 548} +{"train_info/time_between_train_steps": 0.0033965110778808594, "step": 548} +{"info/global_step": 549, "train_info/time_within_train_step": 2.6745071411132812, "step": 549} +{"train_info/time_between_train_steps": 0.0033915042877197266, "step": 549} +{"info/global_step": 550, "train_info/time_within_train_step": 2.675119400024414, "step": 550} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746204841, "_runtime": 1613}, "step": 550} +{"logs": {"train/loss": 5.1226, "train/learning_rate": 0.0005444444444444444, "train/epoch": 0.18, "_timestamp": 1746204841, "_runtime": 1613}, "step": 550} +{"train_info/time_between_train_steps": 0.02530813217163086, "step": 550} +{"info/global_step": 551, "train_info/time_within_train_step": 2.6779346466064453, "step": 551} +{"train_info/time_between_train_steps": 0.0034084320068359375, "step": 551} +{"info/global_step": 552, "train_info/time_within_train_step": 2.696552276611328, "step": 552} +{"train_info/time_between_train_steps": 0.003365755081176758, "step": 552} +{"info/global_step": 553, "train_info/time_within_train_step": 2.6745262145996094, "step": 553} +{"train_info/time_between_train_steps": 0.0030791759490966797, "step": 553} +{"info/global_step": 554, "train_info/time_within_train_step": 2.6735644340515137, "step": 554} +{"train_info/time_between_train_steps": 0.003102540969848633, "step": 554} +{"info/global_step": 555, "train_info/time_within_train_step": 2.6734678745269775, "step": 555} +{"train_info/time_between_train_steps": 0.003042936325073242, "step": 555} +{"info/global_step": 556, "train_info/time_within_train_step": 2.6729612350463867, "step": 556} +{"train_info/time_between_train_steps": 0.003026723861694336, "step": 556} +{"info/global_step": 557, "train_info/time_within_train_step": 2.673973321914673, "step": 557} +{"train_info/time_between_train_steps": 0.0030307769775390625, "step": 557} +{"info/global_step": 558, "train_info/time_within_train_step": 2.6721951961517334, "step": 558} +{"train_info/time_between_train_steps": 0.0030243396759033203, "step": 558} +{"info/global_step": 559, "train_info/time_within_train_step": 2.6717121601104736, "step": 559} +{"train_info/time_between_train_steps": 0.003083944320678711, "step": 559} +{"info/global_step": 560, "train_info/time_within_train_step": 2.6719918251037598, "step": 560} +{"train_info/time_between_train_steps": 0.0030689239501953125, "step": 560} +{"info/global_step": 561, "train_info/time_within_train_step": 2.672799587249756, "step": 561} +{"train_info/time_between_train_steps": 0.0030498504638671875, "step": 561} +{"info/global_step": 562, "train_info/time_within_train_step": 2.673004388809204, "step": 562} +{"train_info/time_between_train_steps": 0.0030660629272460938, "step": 562} +{"info/global_step": 563, "train_info/time_within_train_step": 2.6719002723693848, "step": 563} +{"train_info/time_between_train_steps": 0.003182649612426758, "step": 563} +{"info/global_step": 564, "train_info/time_within_train_step": 2.6725833415985107, "step": 564} +{"train_info/time_between_train_steps": 0.0030498504638671875, "step": 564} +{"info/global_step": 565, "train_info/time_within_train_step": 2.6726903915405273, "step": 565} +{"train_info/time_between_train_steps": 0.0030167102813720703, "step": 565} +{"info/global_step": 566, "train_info/time_within_train_step": 2.6736998558044434, "step": 566} +{"train_info/time_between_train_steps": 0.003066539764404297, "step": 566} +{"info/global_step": 567, "train_info/time_within_train_step": 2.6728322505950928, "step": 567} +{"train_info/time_between_train_steps": 0.003155231475830078, "step": 567} +{"info/global_step": 568, "train_info/time_within_train_step": 2.673844814300537, "step": 568} +{"train_info/time_between_train_steps": 0.0030241012573242188, "step": 568} +{"info/global_step": 569, "train_info/time_within_train_step": 2.6720426082611084, "step": 569} +{"train_info/time_between_train_steps": 0.003051280975341797, "step": 569} +{"info/global_step": 570, "train_info/time_within_train_step": 2.672677993774414, "step": 570} +{"train_info/time_between_train_steps": 0.0030364990234375, "step": 570} +{"info/global_step": 571, "train_info/time_within_train_step": 2.6723597049713135, "step": 571} +{"train_info/time_between_train_steps": 0.002995014190673828, "step": 571} +{"info/global_step": 572, "train_info/time_within_train_step": 2.6718928813934326, "step": 572} +{"train_info/time_between_train_steps": 0.003034830093383789, "step": 572} +{"info/global_step": 573, "train_info/time_within_train_step": 2.6736106872558594, "step": 573} +{"train_info/time_between_train_steps": 0.003101825714111328, "step": 573} +{"info/global_step": 574, "train_info/time_within_train_step": 2.670929193496704, "step": 574} +{"train_info/time_between_train_steps": 0.0030660629272460938, "step": 574} +{"info/global_step": 575, "train_info/time_within_train_step": 2.672290325164795, "step": 575} +{"train_info/time_between_train_steps": 0.0030584335327148438, "step": 575} +{"info/global_step": 576, "train_info/time_within_train_step": 2.6726620197296143, "step": 576} +{"train_info/time_between_train_steps": 0.003045320510864258, "step": 576} +{"info/global_step": 577, "train_info/time_within_train_step": 2.671926259994507, "step": 577} +{"train_info/time_between_train_steps": 0.003052949905395508, "step": 577} +{"info/global_step": 578, "train_info/time_within_train_step": 2.6726224422454834, "step": 578} +{"train_info/time_between_train_steps": 0.003008604049682617, "step": 578} +{"info/global_step": 579, "train_info/time_within_train_step": 2.673344612121582, "step": 579} +{"train_info/time_between_train_steps": 0.0029888153076171875, "step": 579} +{"info/global_step": 580, "train_info/time_within_train_step": 2.6736412048339844, "step": 580} +{"train_info/time_between_train_steps": 0.003052234649658203, "step": 580} +{"info/global_step": 581, "train_info/time_within_train_step": 2.6748290061950684, "step": 581} +{"train_info/time_between_train_steps": 0.0030257701873779297, "step": 581} +{"info/global_step": 582, "train_info/time_within_train_step": 2.673496723175049, "step": 582} +{"train_info/time_between_train_steps": 0.0029883384704589844, "step": 582} +{"info/global_step": 583, "train_info/time_within_train_step": 2.6731395721435547, "step": 583} +{"train_info/time_between_train_steps": 0.0030395984649658203, "step": 583} +{"info/global_step": 584, "train_info/time_within_train_step": 2.673832654953003, "step": 584} +{"train_info/time_between_train_steps": 0.0030214786529541016, "step": 584} +{"info/global_step": 585, "train_info/time_within_train_step": 2.6749491691589355, "step": 585} +{"train_info/time_between_train_steps": 0.0030167102813720703, "step": 585} +{"info/global_step": 586, "train_info/time_within_train_step": 2.6726911067962646, "step": 586} +{"train_info/time_between_train_steps": 0.0030655860900878906, "step": 586} +{"info/global_step": 587, "train_info/time_within_train_step": 2.673940420150757, "step": 587} +{"train_info/time_between_train_steps": 0.0030515193939208984, "step": 587} +{"info/global_step": 588, "train_info/time_within_train_step": 2.6708807945251465, "step": 588} +{"train_info/time_between_train_steps": 0.0029637813568115234, "step": 588} +{"info/global_step": 589, "train_info/time_within_train_step": 2.671746253967285, "step": 589} +{"train_info/time_between_train_steps": 0.0030531883239746094, "step": 589} +{"info/global_step": 590, "train_info/time_within_train_step": 2.6728694438934326, "step": 590} +{"train_info/time_between_train_steps": 0.003027677536010742, "step": 590} +{"info/global_step": 591, "train_info/time_within_train_step": 2.6713778972625732, "step": 591} +{"train_info/time_between_train_steps": 0.0030336380004882812, "step": 591} +{"info/global_step": 592, "train_info/time_within_train_step": 2.67179536819458, "step": 592} +{"train_info/time_between_train_steps": 0.003014802932739258, "step": 592} +{"info/global_step": 593, "train_info/time_within_train_step": 2.6712772846221924, "step": 593} +{"train_info/time_between_train_steps": 0.0029883384704589844, "step": 593} +{"info/global_step": 594, "train_info/time_within_train_step": 2.672182083129883, "step": 594} +{"train_info/time_between_train_steps": 0.0029833316802978516, "step": 594} +{"info/global_step": 595, "train_info/time_within_train_step": 2.6716644763946533, "step": 595} +{"train_info/time_between_train_steps": 0.0030145645141601562, "step": 595} +{"info/global_step": 596, "train_info/time_within_train_step": 2.671584367752075, "step": 596} +{"train_info/time_between_train_steps": 0.003023862838745117, "step": 596} +{"info/global_step": 597, "train_info/time_within_train_step": 2.672673463821411, "step": 597} +{"train_info/time_between_train_steps": 0.0029985904693603516, "step": 597} +{"info/global_step": 598, "train_info/time_within_train_step": 2.6725552082061768, "step": 598} +{"train_info/time_between_train_steps": 0.0030088424682617188, "step": 598} +{"info/global_step": 599, "train_info/time_within_train_step": 2.6738545894622803, "step": 599} +{"train_info/time_between_train_steps": 0.003022432327270508, "step": 599} +{"info/global_step": 600, "train_info/time_within_train_step": 2.671457052230835, "step": 600} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746204976, "_runtime": 1748}, "step": 600} +{"logs": {"train/loss": 5.0269, "train/learning_rate": 0.0005333333333333333, "train/epoch": 0.2, "_timestamp": 1746204976, "_runtime": 1748}, "step": 600} +{"train_info/time_between_train_steps": 15.120362520217896, "step": 600} +{"info/global_step": 601, "train_info/time_within_train_step": 2.4747138023376465, "step": 601} +{"train_info/time_between_train_steps": 0.003004312515258789, "step": 601} +{"info/global_step": 602, "train_info/time_within_train_step": 2.4554293155670166, "step": 602} +{"train_info/time_between_train_steps": 0.003038167953491211, "step": 602} +{"info/global_step": 603, "train_info/time_within_train_step": 2.461845636367798, "step": 603} +{"train_info/time_between_train_steps": 0.0030324459075927734, "step": 603} +{"info/global_step": 604, "train_info/time_within_train_step": 2.6414575576782227, "step": 604} +{"train_info/time_between_train_steps": 0.0030074119567871094, "step": 604} +{"info/global_step": 605, "train_info/time_within_train_step": 2.6714258193969727, "step": 605} +{"train_info/time_between_train_steps": 0.002987384796142578, "step": 605} +{"info/global_step": 606, "train_info/time_within_train_step": 2.671403646469116, "step": 606} +{"train_info/time_between_train_steps": 0.0029659271240234375, "step": 606} +{"info/global_step": 607, "train_info/time_within_train_step": 2.6725339889526367, "step": 607} +{"train_info/time_between_train_steps": 0.0030243396759033203, "step": 607} +{"info/global_step": 608, "train_info/time_within_train_step": 2.6723830699920654, "step": 608} +{"train_info/time_between_train_steps": 0.0029685497283935547, "step": 608} +{"info/global_step": 609, "train_info/time_within_train_step": 2.873812437057495, "step": 609} +{"train_info/time_between_train_steps": 0.0030045509338378906, "step": 609} +{"info/global_step": 610, "train_info/time_within_train_step": 2.673309326171875, "step": 610} +{"train_info/time_between_train_steps": 0.0029463768005371094, "step": 610} +{"info/global_step": 611, "train_info/time_within_train_step": 2.6740403175354004, "step": 611} +{"train_info/time_between_train_steps": 0.0029532909393310547, "step": 611} +{"info/global_step": 612, "train_info/time_within_train_step": 2.673757314682007, "step": 612} +{"train_info/time_between_train_steps": 0.002971649169921875, "step": 612} +{"info/global_step": 613, "train_info/time_within_train_step": 2.6824862957000732, "step": 613} +{"train_info/time_between_train_steps": 0.0029456615447998047, "step": 613} +{"info/global_step": 614, "train_info/time_within_train_step": 2.7064716815948486, "step": 614} +{"train_info/time_between_train_steps": 0.0029752254486083984, "step": 614} +{"info/global_step": 615, "train_info/time_within_train_step": 2.6739330291748047, "step": 615} +{"train_info/time_between_train_steps": 0.002962350845336914, "step": 615} +{"info/global_step": 616, "train_info/time_within_train_step": 2.68231463432312, "step": 616} +{"train_info/time_between_train_steps": 0.002979278564453125, "step": 616} +{"info/global_step": 617, "train_info/time_within_train_step": 2.672011613845825, "step": 617} +{"train_info/time_between_train_steps": 0.002942323684692383, "step": 617} +{"info/global_step": 618, "train_info/time_within_train_step": 2.67435622215271, "step": 618} +{"train_info/time_between_train_steps": 0.0030670166015625, "step": 618} +{"info/global_step": 619, "train_info/time_within_train_step": 2.6722118854522705, "step": 619} +{"train_info/time_between_train_steps": 0.002997159957885742, "step": 619} +{"info/global_step": 620, "train_info/time_within_train_step": 2.6738250255584717, "step": 620} +{"train_info/time_between_train_steps": 0.0029909610748291016, "step": 620} +{"info/global_step": 621, "train_info/time_within_train_step": 2.673341751098633, "step": 621} +{"train_info/time_between_train_steps": 0.002977132797241211, "step": 621} +{"info/global_step": 622, "train_info/time_within_train_step": 2.6738269329071045, "step": 622} +{"train_info/time_between_train_steps": 0.0030117034912109375, "step": 622} +{"info/global_step": 623, "train_info/time_within_train_step": 2.673008918762207, "step": 623} +{"train_info/time_between_train_steps": 0.0029664039611816406, "step": 623} +{"info/global_step": 624, "train_info/time_within_train_step": 2.6728169918060303, "step": 624} +{"train_info/time_between_train_steps": 0.0029485225677490234, "step": 624} +{"info/global_step": 625, "train_info/time_within_train_step": 2.6731455326080322, "step": 625} +{"train_info/time_between_train_steps": 0.00302886962890625, "step": 625} +{"info/global_step": 626, "train_info/time_within_train_step": 2.6730363368988037, "step": 626} +{"train_info/time_between_train_steps": 0.0029845237731933594, "step": 626} +{"info/global_step": 627, "train_info/time_within_train_step": 2.6725077629089355, "step": 627} +{"train_info/time_between_train_steps": 0.002945423126220703, "step": 627} +{"info/global_step": 628, "train_info/time_within_train_step": 2.674806594848633, "step": 628} +{"train_info/time_between_train_steps": 0.003117084503173828, "step": 628} +{"info/global_step": 629, "train_info/time_within_train_step": 2.672922134399414, "step": 629} +{"train_info/time_between_train_steps": 0.0029611587524414062, "step": 629} +{"info/global_step": 630, "train_info/time_within_train_step": 2.672999382019043, "step": 630} +{"train_info/time_between_train_steps": 0.003012418746948242, "step": 630} +{"info/global_step": 631, "train_info/time_within_train_step": 2.674287796020508, "step": 631} +{"train_info/time_between_train_steps": 0.002948760986328125, "step": 631} +{"info/global_step": 632, "train_info/time_within_train_step": 2.6723122596740723, "step": 632} +{"train_info/time_between_train_steps": 0.002947568893432617, "step": 632} +{"info/global_step": 633, "train_info/time_within_train_step": 2.673276662826538, "step": 633} +{"train_info/time_between_train_steps": 0.002973794937133789, "step": 633} +{"info/global_step": 634, "train_info/time_within_train_step": 2.6731393337249756, "step": 634} +{"train_info/time_between_train_steps": 0.0029904842376708984, "step": 634} +{"info/global_step": 635, "train_info/time_within_train_step": 2.6723618507385254, "step": 635} +{"train_info/time_between_train_steps": 0.0030295848846435547, "step": 635} +{"info/global_step": 636, "train_info/time_within_train_step": 2.673992156982422, "step": 636} +{"train_info/time_between_train_steps": 0.002950906753540039, "step": 636} +{"info/global_step": 637, "train_info/time_within_train_step": 2.672865152359009, "step": 637} +{"train_info/time_between_train_steps": 0.0030128955841064453, "step": 637} +{"info/global_step": 638, "train_info/time_within_train_step": 2.6709156036376953, "step": 638} +{"train_info/time_between_train_steps": 0.0029892921447753906, "step": 638} +{"info/global_step": 639, "train_info/time_within_train_step": 2.671982765197754, "step": 639} +{"train_info/time_between_train_steps": 0.002994060516357422, "step": 639} +{"info/global_step": 640, "train_info/time_within_train_step": 2.671128273010254, "step": 640} +{"train_info/time_between_train_steps": 0.002929210662841797, "step": 640} +{"info/global_step": 641, "train_info/time_within_train_step": 2.672051429748535, "step": 641} +{"train_info/time_between_train_steps": 0.003006458282470703, "step": 641} +{"info/global_step": 642, "train_info/time_within_train_step": 2.6709702014923096, "step": 642} +{"train_info/time_between_train_steps": 0.0029549598693847656, "step": 642} +{"info/global_step": 643, "train_info/time_within_train_step": 2.670992374420166, "step": 643} +{"train_info/time_between_train_steps": 0.0029599666595458984, "step": 643} +{"info/global_step": 644, "train_info/time_within_train_step": 2.6713242530822754, "step": 644} +{"train_info/time_between_train_steps": 0.0029659271240234375, "step": 644} +{"info/global_step": 645, "train_info/time_within_train_step": 2.671902656555176, "step": 645} +{"train_info/time_between_train_steps": 0.0029397010803222656, "step": 645} +{"info/global_step": 646, "train_info/time_within_train_step": 2.671781539916992, "step": 646} +{"train_info/time_between_train_steps": 0.002927541732788086, "step": 646} +{"info/global_step": 647, "train_info/time_within_train_step": 2.672671318054199, "step": 647} +{"train_info/time_between_train_steps": 0.002933979034423828, "step": 647} +{"info/global_step": 648, "train_info/time_within_train_step": 2.672271251678467, "step": 648} +{"train_info/time_between_train_steps": 0.0029604434967041016, "step": 648} +{"info/global_step": 649, "train_info/time_within_train_step": 2.6725335121154785, "step": 649} +{"train_info/time_between_train_steps": 0.0029616355895996094, "step": 649} +{"info/global_step": 650, "train_info/time_within_train_step": 2.671391725540161, "step": 650} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746205125, "_runtime": 1897}, "step": 650} +{"logs": {"train/loss": 4.9483, "train/learning_rate": 0.0005222222222222222, "train/epoch": 0.22, "_timestamp": 1746205125, "_runtime": 1897}, "step": 650} +{"train_info/time_between_train_steps": 0.024420976638793945, "step": 650} +{"info/global_step": 651, "train_info/time_within_train_step": 2.671700954437256, "step": 651} +{"train_info/time_between_train_steps": 0.0029616355895996094, "step": 651} +{"info/global_step": 652, "train_info/time_within_train_step": 2.6716463565826416, "step": 652} +{"train_info/time_between_train_steps": 0.002997159957885742, "step": 652} +{"info/global_step": 653, "train_info/time_within_train_step": 2.673295259475708, "step": 653} +{"train_info/time_between_train_steps": 0.0029664039611816406, "step": 653} +{"info/global_step": 654, "train_info/time_within_train_step": 2.6723275184631348, "step": 654} +{"train_info/time_between_train_steps": 0.003017425537109375, "step": 654} +{"info/global_step": 655, "train_info/time_within_train_step": 2.672070264816284, "step": 655} +{"train_info/time_between_train_steps": 0.0029604434967041016, "step": 655} +{"info/global_step": 656, "train_info/time_within_train_step": 2.6717464923858643, "step": 656} +{"train_info/time_between_train_steps": 0.0029366016387939453, "step": 656} +{"info/global_step": 657, "train_info/time_within_train_step": 2.67264461517334, "step": 657} +{"train_info/time_between_train_steps": 0.0029954910278320312, "step": 657} +{"info/global_step": 658, "train_info/time_within_train_step": 2.6717684268951416, "step": 658} +{"train_info/time_between_train_steps": 0.0030035972595214844, "step": 658} +{"info/global_step": 659, "train_info/time_within_train_step": 2.6711034774780273, "step": 659} +{"train_info/time_between_train_steps": 0.002963542938232422, "step": 659} +{"info/global_step": 660, "train_info/time_within_train_step": 2.6736719608306885, "step": 660} +{"train_info/time_between_train_steps": 0.0029811859130859375, "step": 660} +{"info/global_step": 661, "train_info/time_within_train_step": 2.6730077266693115, "step": 661} +{"train_info/time_between_train_steps": 0.00296783447265625, "step": 661} +{"info/global_step": 662, "train_info/time_within_train_step": 2.6728827953338623, "step": 662} +{"train_info/time_between_train_steps": 0.0029718875885009766, "step": 662} +{"info/global_step": 663, "train_info/time_within_train_step": 2.6734440326690674, "step": 663} +{"train_info/time_between_train_steps": 0.0029642581939697266, "step": 663} +{"info/global_step": 664, "train_info/time_within_train_step": 2.6717166900634766, "step": 664} +{"train_info/time_between_train_steps": 0.0029838085174560547, "step": 664} +{"info/global_step": 665, "train_info/time_within_train_step": 2.671586751937866, "step": 665} +{"train_info/time_between_train_steps": 0.003022909164428711, "step": 665} +{"info/global_step": 666, "train_info/time_within_train_step": 2.670851945877075, "step": 666} +{"train_info/time_between_train_steps": 0.002987384796142578, "step": 666} +{"info/global_step": 667, "train_info/time_within_train_step": 2.670947313308716, "step": 667} +{"train_info/time_between_train_steps": 0.002982616424560547, "step": 667} +{"info/global_step": 668, "train_info/time_within_train_step": 2.6716837882995605, "step": 668} +{"train_info/time_between_train_steps": 0.003046274185180664, "step": 668} +{"info/global_step": 669, "train_info/time_within_train_step": 2.673715829849243, "step": 669} +{"train_info/time_between_train_steps": 0.0062940120697021484, "step": 669} +{"info/global_step": 670, "train_info/time_within_train_step": 2.6727540493011475, "step": 670} +{"train_info/time_between_train_steps": 0.003055095672607422, "step": 670} +{"info/global_step": 671, "train_info/time_within_train_step": 2.673039674758911, "step": 671} +{"train_info/time_between_train_steps": 0.00307464599609375, "step": 671} +{"info/global_step": 672, "train_info/time_within_train_step": 2.672504425048828, "step": 672} +{"train_info/time_between_train_steps": 0.0030999183654785156, "step": 672} +{"info/global_step": 673, "train_info/time_within_train_step": 2.673152208328247, "step": 673} +{"train_info/time_between_train_steps": 0.0031244754791259766, "step": 673} +{"info/global_step": 674, "train_info/time_within_train_step": 2.6728880405426025, "step": 674} +{"train_info/time_between_train_steps": 0.003008127212524414, "step": 674} +{"info/global_step": 675, "train_info/time_within_train_step": 2.6727890968322754, "step": 675} +{"train_info/time_between_train_steps": 0.0030677318572998047, "step": 675} +{"info/global_step": 676, "train_info/time_within_train_step": 2.672964334487915, "step": 676} +{"train_info/time_between_train_steps": 0.003011941909790039, "step": 676} +{"info/global_step": 677, "train_info/time_within_train_step": 2.673243999481201, "step": 677} +{"train_info/time_between_train_steps": 0.0030879974365234375, "step": 677} +{"info/global_step": 678, "train_info/time_within_train_step": 2.6729371547698975, "step": 678} +{"train_info/time_between_train_steps": 0.003031015396118164, "step": 678} +{"info/global_step": 679, "train_info/time_within_train_step": 2.672201633453369, "step": 679} +{"train_info/time_between_train_steps": 0.003061532974243164, "step": 679} +{"info/global_step": 680, "train_info/time_within_train_step": 2.680260181427002, "step": 680} +{"train_info/time_between_train_steps": 0.003019571304321289, "step": 680} +{"info/global_step": 681, "train_info/time_within_train_step": 2.676025152206421, "step": 681} +{"train_info/time_between_train_steps": 0.0029993057250976562, "step": 681} +{"info/global_step": 682, "train_info/time_within_train_step": 2.6724448204040527, "step": 682} +{"train_info/time_between_train_steps": 0.0030231475830078125, "step": 682} +{"info/global_step": 683, "train_info/time_within_train_step": 2.6753907203674316, "step": 683} +{"train_info/time_between_train_steps": 0.003008127212524414, "step": 683} +{"info/global_step": 684, "train_info/time_within_train_step": 2.6730384826660156, "step": 684} +{"train_info/time_between_train_steps": 0.003083944320678711, "step": 684} +{"info/global_step": 685, "train_info/time_within_train_step": 2.6725432872772217, "step": 685} +{"train_info/time_between_train_steps": 0.003004312515258789, "step": 685} +{"info/global_step": 686, "train_info/time_within_train_step": 2.6727523803710938, "step": 686} +{"train_info/time_between_train_steps": 0.0030298233032226562, "step": 686} +{"info/global_step": 687, "train_info/time_within_train_step": 2.6741526126861572, "step": 687} +{"train_info/time_between_train_steps": 0.0030527114868164062, "step": 687} +{"info/global_step": 688, "train_info/time_within_train_step": 2.6722235679626465, "step": 688} +{"train_info/time_between_train_steps": 0.003084897994995117, "step": 688} +{"info/global_step": 689, "train_info/time_within_train_step": 2.6729891300201416, "step": 689} +{"train_info/time_between_train_steps": 0.0030333995819091797, "step": 689} +{"info/global_step": 690, "train_info/time_within_train_step": 2.6736152172088623, "step": 690} +{"train_info/time_between_train_steps": 0.0030753612518310547, "step": 690} +{"info/global_step": 691, "train_info/time_within_train_step": 2.6735095977783203, "step": 691} +{"train_info/time_between_train_steps": 0.0029985904693603516, "step": 691} +{"info/global_step": 692, "train_info/time_within_train_step": 2.6724040508270264, "step": 692} +{"train_info/time_between_train_steps": 0.0030298233032226562, "step": 692} +{"info/global_step": 693, "train_info/time_within_train_step": 2.6725902557373047, "step": 693} +{"train_info/time_between_train_steps": 0.0031058788299560547, "step": 693} +{"info/global_step": 694, "train_info/time_within_train_step": 2.6726162433624268, "step": 694} +{"train_info/time_between_train_steps": 0.003058910369873047, "step": 694} +{"info/global_step": 695, "train_info/time_within_train_step": 2.6713271141052246, "step": 695} +{"train_info/time_between_train_steps": 0.003025054931640625, "step": 695} +{"info/global_step": 696, "train_info/time_within_train_step": 2.6725738048553467, "step": 696} +{"train_info/time_between_train_steps": 0.003021240234375, "step": 696} +{"info/global_step": 697, "train_info/time_within_train_step": 2.6717209815979004, "step": 697} +{"train_info/time_between_train_steps": 0.0030438899993896484, "step": 697} +{"info/global_step": 698, "train_info/time_within_train_step": 2.6734976768493652, "step": 698} +{"train_info/time_between_train_steps": 0.0031151771545410156, "step": 698} +{"info/global_step": 699, "train_info/time_within_train_step": 2.673764228820801, "step": 699} +{"train_info/time_between_train_steps": 0.0030181407928466797, "step": 699} +{"info/global_step": 700, "train_info/time_within_train_step": 2.6730971336364746, "step": 700} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746205260, "_runtime": 2032}, "step": 700} +{"logs": {"train/loss": 4.8869, "train/learning_rate": 0.0005111111111111111, "train/epoch": 0.23, "_timestamp": 1746205260, "_runtime": 2032}, "step": 700} +{"train_info/time_between_train_steps": 13.305840730667114, "step": 700} +{"info/global_step": 701, "train_info/time_within_train_step": 2.4645512104034424, "step": 701} +{"train_info/time_between_train_steps": 0.0030717849731445312, "step": 701} +{"info/global_step": 702, "train_info/time_within_train_step": 2.608613967895508, "step": 702} +{"train_info/time_between_train_steps": 0.0030508041381835938, "step": 702} +{"info/global_step": 703, "train_info/time_within_train_step": 2.4835124015808105, "step": 703} +{"train_info/time_between_train_steps": 0.0030477046966552734, "step": 703} +{"info/global_step": 704, "train_info/time_within_train_step": 2.6582353115081787, "step": 704} +{"train_info/time_between_train_steps": 0.003086090087890625, "step": 704} +{"info/global_step": 705, "train_info/time_within_train_step": 2.6714670658111572, "step": 705} +{"train_info/time_between_train_steps": 0.0030736923217773438, "step": 705} +{"info/global_step": 706, "train_info/time_within_train_step": 2.673133134841919, "step": 706} +{"train_info/time_between_train_steps": 0.0030677318572998047, "step": 706} +{"info/global_step": 707, "train_info/time_within_train_step": 2.673590660095215, "step": 707} +{"train_info/time_between_train_steps": 0.0030205249786376953, "step": 707} +{"info/global_step": 708, "train_info/time_within_train_step": 2.6733813285827637, "step": 708} +{"train_info/time_between_train_steps": 0.0030100345611572266, "step": 708} +{"info/global_step": 709, "train_info/time_within_train_step": 2.674896001815796, "step": 709} +{"train_info/time_between_train_steps": 0.0030803680419921875, "step": 709} +{"info/global_step": 710, "train_info/time_within_train_step": 2.674363136291504, "step": 710} +{"train_info/time_between_train_steps": 0.003180265426635742, "step": 710} +{"info/global_step": 711, "train_info/time_within_train_step": 2.6755268573760986, "step": 711} +{"train_info/time_between_train_steps": 0.0030341148376464844, "step": 711} +{"info/global_step": 712, "train_info/time_within_train_step": 2.6756691932678223, "step": 712} +{"train_info/time_between_train_steps": 0.0030355453491210938, "step": 712} +{"info/global_step": 713, "train_info/time_within_train_step": 2.6758530139923096, "step": 713} +{"train_info/time_between_train_steps": 0.0030426979064941406, "step": 713} +{"info/global_step": 714, "train_info/time_within_train_step": 2.67671275138855, "step": 714} +{"train_info/time_between_train_steps": 0.0030350685119628906, "step": 714} +{"info/global_step": 715, "train_info/time_within_train_step": 2.675686836242676, "step": 715} +{"train_info/time_between_train_steps": 0.003017902374267578, "step": 715} +{"info/global_step": 716, "train_info/time_within_train_step": 2.676100015640259, "step": 716} +{"train_info/time_between_train_steps": 0.0030298233032226562, "step": 716} +{"info/global_step": 717, "train_info/time_within_train_step": 2.6757657527923584, "step": 717} +{"train_info/time_between_train_steps": 0.0032176971435546875, "step": 717} +{"info/global_step": 718, "train_info/time_within_train_step": 2.675642728805542, "step": 718} +{"train_info/time_between_train_steps": 0.003025531768798828, "step": 718} +{"info/global_step": 719, "train_info/time_within_train_step": 2.675199270248413, "step": 719} +{"train_info/time_between_train_steps": 0.0030672550201416016, "step": 719} +{"info/global_step": 720, "train_info/time_within_train_step": 2.6742193698883057, "step": 720} +{"train_info/time_between_train_steps": 0.0030460357666015625, "step": 720} +{"info/global_step": 721, "train_info/time_within_train_step": 2.674337863922119, "step": 721} +{"train_info/time_between_train_steps": 0.0030934810638427734, "step": 721} +{"info/global_step": 722, "train_info/time_within_train_step": 2.6743221282958984, "step": 722} +{"train_info/time_between_train_steps": 0.00302886962890625, "step": 722} +{"info/global_step": 723, "train_info/time_within_train_step": 2.675863027572632, "step": 723} +{"train_info/time_between_train_steps": 0.0036611557006835938, "step": 723} +{"info/global_step": 724, "train_info/time_within_train_step": 2.6731109619140625, "step": 724} +{"train_info/time_between_train_steps": 0.0030355453491210938, "step": 724} +{"info/global_step": 725, "train_info/time_within_train_step": 2.6743979454040527, "step": 725} +{"train_info/time_between_train_steps": 0.0030395984649658203, "step": 725} +{"info/global_step": 726, "train_info/time_within_train_step": 2.672576904296875, "step": 726} +{"train_info/time_between_train_steps": 0.003021240234375, "step": 726} +{"info/global_step": 727, "train_info/time_within_train_step": 2.674295663833618, "step": 727} +{"train_info/time_between_train_steps": 0.003029346466064453, "step": 727} +{"info/global_step": 728, "train_info/time_within_train_step": 2.6730453968048096, "step": 728} +{"train_info/time_between_train_steps": 0.0030341148376464844, "step": 728} +{"info/global_step": 729, "train_info/time_within_train_step": 2.6739554405212402, "step": 729} +{"train_info/time_between_train_steps": 0.0030655860900878906, "step": 729} +{"info/global_step": 730, "train_info/time_within_train_step": 2.6752328872680664, "step": 730} +{"train_info/time_between_train_steps": 0.003083944320678711, "step": 730} +{"info/global_step": 731, "train_info/time_within_train_step": 2.672410249710083, "step": 731} +{"train_info/time_between_train_steps": 0.003007173538208008, "step": 731} +{"info/global_step": 732, "train_info/time_within_train_step": 2.6736507415771484, "step": 732} +{"train_info/time_between_train_steps": 0.003023386001586914, "step": 732} +{"info/global_step": 733, "train_info/time_within_train_step": 2.6733880043029785, "step": 733} +{"train_info/time_between_train_steps": 0.003040790557861328, "step": 733} +{"info/global_step": 734, "train_info/time_within_train_step": 2.6739988327026367, "step": 734} +{"train_info/time_between_train_steps": 0.0030078887939453125, "step": 734} +{"info/global_step": 735, "train_info/time_within_train_step": 2.6735920906066895, "step": 735} +{"train_info/time_between_train_steps": 0.0030930042266845703, "step": 735} +{"info/global_step": 736, "train_info/time_within_train_step": 2.673760414123535, "step": 736} +{"train_info/time_between_train_steps": 0.0030624866485595703, "step": 736} +{"info/global_step": 737, "train_info/time_within_train_step": 2.6738579273223877, "step": 737} +{"train_info/time_between_train_steps": 0.0030210018157958984, "step": 737} +{"info/global_step": 738, "train_info/time_within_train_step": 2.673701763153076, "step": 738} +{"train_info/time_between_train_steps": 0.0030059814453125, "step": 738} +{"info/global_step": 739, "train_info/time_within_train_step": 2.674009323120117, "step": 739} +{"train_info/time_between_train_steps": 0.003044605255126953, "step": 739} +{"info/global_step": 740, "train_info/time_within_train_step": 2.6743733882904053, "step": 740} +{"train_info/time_between_train_steps": 0.00301361083984375, "step": 740} +{"info/global_step": 741, "train_info/time_within_train_step": 2.6736152172088623, "step": 741} +{"train_info/time_between_train_steps": 0.0030443668365478516, "step": 741} +{"info/global_step": 742, "train_info/time_within_train_step": 2.6736536026000977, "step": 742} +{"train_info/time_between_train_steps": 0.0030183792114257812, "step": 742} +{"info/global_step": 743, "train_info/time_within_train_step": 2.673189163208008, "step": 743} +{"train_info/time_between_train_steps": 0.0029969215393066406, "step": 743} +{"info/global_step": 744, "train_info/time_within_train_step": 2.6743013858795166, "step": 744} +{"train_info/time_between_train_steps": 0.0030357837677001953, "step": 744} +{"info/global_step": 745, "train_info/time_within_train_step": 2.715280532836914, "step": 745} +{"train_info/time_between_train_steps": 0.0031309127807617188, "step": 745} +{"info/global_step": 746, "train_info/time_within_train_step": 2.674394369125366, "step": 746} +{"train_info/time_between_train_steps": 0.0036873817443847656, "step": 746} +{"info/global_step": 747, "train_info/time_within_train_step": 2.673896551132202, "step": 747} +{"train_info/time_between_train_steps": 0.003030538558959961, "step": 747} +{"info/global_step": 748, "train_info/time_within_train_step": 2.6723103523254395, "step": 748} +{"train_info/time_between_train_steps": 0.0032558441162109375, "step": 748} +{"info/global_step": 749, "train_info/time_within_train_step": 2.6734960079193115, "step": 749} +{"train_info/time_between_train_steps": 0.003099679946899414, "step": 749} +{"info/global_step": 750, "train_info/time_within_train_step": 3.2166013717651367, "step": 750} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746205408, "_runtime": 2180}, "step": 750} +{"logs": {"train/loss": 4.8279, "train/learning_rate": 0.0005, "train/epoch": 0.25, "_timestamp": 1746205408, "_runtime": 2180}, "step": 750} +{"train_info/time_between_train_steps": 0.02364373207092285, "step": 750} +{"info/global_step": 751, "train_info/time_within_train_step": 2.672792673110962, "step": 751} +{"train_info/time_between_train_steps": 0.003097057342529297, "step": 751} +{"info/global_step": 752, "train_info/time_within_train_step": 2.673241376876831, "step": 752} +{"train_info/time_between_train_steps": 0.003032684326171875, "step": 752} +{"info/global_step": 753, "train_info/time_within_train_step": 2.674598217010498, "step": 753} +{"train_info/time_between_train_steps": 0.0030858516693115234, "step": 753} +{"info/global_step": 754, "train_info/time_within_train_step": 2.672922372817993, "step": 754} +{"train_info/time_between_train_steps": 0.0030705928802490234, "step": 754} +{"info/global_step": 755, "train_info/time_within_train_step": 2.6737186908721924, "step": 755} +{"train_info/time_between_train_steps": 0.003006458282470703, "step": 755} +{"info/global_step": 756, "train_info/time_within_train_step": 2.672970771789551, "step": 756} +{"train_info/time_between_train_steps": 0.0030667781829833984, "step": 756} +{"info/global_step": 757, "train_info/time_within_train_step": 2.6735339164733887, "step": 757} +{"train_info/time_between_train_steps": 0.0030274391174316406, "step": 757} +{"info/global_step": 758, "train_info/time_within_train_step": 2.6737749576568604, "step": 758} +{"train_info/time_between_train_steps": 0.003072500228881836, "step": 758} +{"info/global_step": 759, "train_info/time_within_train_step": 2.674370527267456, "step": 759} +{"train_info/time_between_train_steps": 0.003072977066040039, "step": 759} +{"info/global_step": 760, "train_info/time_within_train_step": 2.675628900527954, "step": 760} +{"train_info/time_between_train_steps": 0.003094911575317383, "step": 760} +{"info/global_step": 761, "train_info/time_within_train_step": 2.67384934425354, "step": 761} +{"train_info/time_between_train_steps": 0.0032410621643066406, "step": 761} +{"info/global_step": 762, "train_info/time_within_train_step": 2.673414945602417, "step": 762} +{"train_info/time_between_train_steps": 0.003045797348022461, "step": 762} +{"info/global_step": 763, "train_info/time_within_train_step": 2.673140287399292, "step": 763} +{"train_info/time_between_train_steps": 0.003169536590576172, "step": 763} +{"info/global_step": 764, "train_info/time_within_train_step": 2.67301607131958, "step": 764} +{"train_info/time_between_train_steps": 0.0031108856201171875, "step": 764} +{"info/global_step": 765, "train_info/time_within_train_step": 2.6741526126861572, "step": 765} +{"train_info/time_between_train_steps": 0.003030061721801758, "step": 765} +{"info/global_step": 766, "train_info/time_within_train_step": 2.6736721992492676, "step": 766} +{"train_info/time_between_train_steps": 0.0030748844146728516, "step": 766} +{"info/global_step": 767, "train_info/time_within_train_step": 2.673740863800049, "step": 767} +{"train_info/time_between_train_steps": 0.0030617713928222656, "step": 767} +{"info/global_step": 768, "train_info/time_within_train_step": 2.6737124919891357, "step": 768} +{"train_info/time_between_train_steps": 0.0030803680419921875, "step": 768} +{"info/global_step": 769, "train_info/time_within_train_step": 2.6722452640533447, "step": 769} +{"train_info/time_between_train_steps": 0.0030548572540283203, "step": 769} +{"info/global_step": 770, "train_info/time_within_train_step": 2.67514705657959, "step": 770} +{"train_info/time_between_train_steps": 0.003055572509765625, "step": 770} +{"info/global_step": 771, "train_info/time_within_train_step": 2.6736156940460205, "step": 771} +{"train_info/time_between_train_steps": 0.0030527114868164062, "step": 771} +{"info/global_step": 772, "train_info/time_within_train_step": 2.6755309104919434, "step": 772} +{"train_info/time_between_train_steps": 0.003022432327270508, "step": 772} +{"info/global_step": 773, "train_info/time_within_train_step": 2.6724841594696045, "step": 773} +{"train_info/time_between_train_steps": 0.0030241012573242188, "step": 773} +{"info/global_step": 774, "train_info/time_within_train_step": 2.6727492809295654, "step": 774} +{"train_info/time_between_train_steps": 0.0030477046966552734, "step": 774} +{"info/global_step": 775, "train_info/time_within_train_step": 2.67253041267395, "step": 775} +{"train_info/time_between_train_steps": 0.003025054931640625, "step": 775} +{"info/global_step": 776, "train_info/time_within_train_step": 2.679669141769409, "step": 776} +{"train_info/time_between_train_steps": 0.0030591487884521484, "step": 776} +{"info/global_step": 777, "train_info/time_within_train_step": 2.7223145961761475, "step": 777} +{"train_info/time_between_train_steps": 0.0030579566955566406, "step": 777} +{"info/global_step": 778, "train_info/time_within_train_step": 2.6745221614837646, "step": 778} +{"train_info/time_between_train_steps": 0.0030395984649658203, "step": 778} +{"info/global_step": 779, "train_info/time_within_train_step": 2.673445463180542, "step": 779} +{"train_info/time_between_train_steps": 0.0030624866485595703, "step": 779} +{"info/global_step": 780, "train_info/time_within_train_step": 2.6739511489868164, "step": 780} +{"train_info/time_between_train_steps": 0.0030472278594970703, "step": 780} +{"info/global_step": 781, "train_info/time_within_train_step": 2.6728806495666504, "step": 781} +{"train_info/time_between_train_steps": 0.0030622482299804688, "step": 781} +{"info/global_step": 782, "train_info/time_within_train_step": 2.674362897872925, "step": 782} +{"train_info/time_between_train_steps": 0.003051280975341797, "step": 782} +{"info/global_step": 783, "train_info/time_within_train_step": 2.674039125442505, "step": 783} +{"train_info/time_between_train_steps": 0.0030946731567382812, "step": 783} +{"info/global_step": 784, "train_info/time_within_train_step": 2.6727495193481445, "step": 784} +{"train_info/time_between_train_steps": 0.0030527114868164062, "step": 784} +{"info/global_step": 785, "train_info/time_within_train_step": 2.6727945804595947, "step": 785} +{"train_info/time_between_train_steps": 0.0030660629272460938, "step": 785} +{"info/global_step": 786, "train_info/time_within_train_step": 2.6734864711761475, "step": 786} +{"train_info/time_between_train_steps": 0.0030508041381835938, "step": 786} +{"info/global_step": 787, "train_info/time_within_train_step": 2.673241138458252, "step": 787} +{"train_info/time_between_train_steps": 0.003075838088989258, "step": 787} +{"info/global_step": 788, "train_info/time_within_train_step": 2.6733314990997314, "step": 788} +{"train_info/time_between_train_steps": 0.0030472278594970703, "step": 788} +{"info/global_step": 789, "train_info/time_within_train_step": 2.673236608505249, "step": 789} +{"train_info/time_between_train_steps": 0.003061532974243164, "step": 789} +{"info/global_step": 790, "train_info/time_within_train_step": 2.6733486652374268, "step": 790} +{"train_info/time_between_train_steps": 0.0030488967895507812, "step": 790} +{"info/global_step": 791, "train_info/time_within_train_step": 2.673694133758545, "step": 791} +{"train_info/time_between_train_steps": 0.0030670166015625, "step": 791} +{"info/global_step": 792, "train_info/time_within_train_step": 2.672441244125366, "step": 792} +{"train_info/time_between_train_steps": 0.0030782222747802734, "step": 792} +{"info/global_step": 793, "train_info/time_within_train_step": 2.673814535140991, "step": 793} +{"train_info/time_between_train_steps": 0.0030722618103027344, "step": 793} +{"info/global_step": 794, "train_info/time_within_train_step": 2.7706658840179443, "step": 794} +{"train_info/time_between_train_steps": 0.0039403438568115234, "step": 794} +{"info/global_step": 795, "train_info/time_within_train_step": 2.674107313156128, "step": 795} +{"train_info/time_between_train_steps": 0.003064870834350586, "step": 795} +{"info/global_step": 796, "train_info/time_within_train_step": 2.675252914428711, "step": 796} +{"train_info/time_between_train_steps": 0.003148794174194336, "step": 796} +{"info/global_step": 797, "train_info/time_within_train_step": 2.676382541656494, "step": 797} +{"train_info/time_between_train_steps": 0.003033876419067383, "step": 797} +{"info/global_step": 798, "train_info/time_within_train_step": 2.6737852096557617, "step": 798} +{"train_info/time_between_train_steps": 0.00305938720703125, "step": 798} +{"info/global_step": 799, "train_info/time_within_train_step": 2.6735639572143555, "step": 799} +{"train_info/time_between_train_steps": 0.003062725067138672, "step": 799} +{"info/global_step": 800, "train_info/time_within_train_step": 2.674286365509033, "step": 800} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746205543, "_runtime": 2315}, "step": 800} +{"logs": {"train/loss": 4.7687, "train/learning_rate": 0.0004888888888888889, "train/epoch": 0.27, "_timestamp": 1746205543, "_runtime": 2315}, "step": 800} +{"train_info/time_between_train_steps": 15.621060371398926, "step": 800} +{"info/global_step": 801, "train_info/time_within_train_step": 2.4612369537353516, "step": 801} +{"train_info/time_between_train_steps": 0.0030705928802490234, "step": 801} +{"info/global_step": 802, "train_info/time_within_train_step": 2.455592632293701, "step": 802} +{"train_info/time_between_train_steps": 0.003113985061645508, "step": 802} +{"info/global_step": 803, "train_info/time_within_train_step": 2.4616587162017822, "step": 803} +{"train_info/time_between_train_steps": 0.0030469894409179688, "step": 803} +{"info/global_step": 804, "train_info/time_within_train_step": 2.638227701187134, "step": 804} +{"train_info/time_between_train_steps": 0.003026247024536133, "step": 804} +{"info/global_step": 805, "train_info/time_within_train_step": 2.6747186183929443, "step": 805} +{"train_info/time_between_train_steps": 0.003247976303100586, "step": 805} +{"info/global_step": 806, "train_info/time_within_train_step": 2.6742451190948486, "step": 806} +{"train_info/time_between_train_steps": 0.003045320510864258, "step": 806} +{"info/global_step": 807, "train_info/time_within_train_step": 2.675638437271118, "step": 807} +{"train_info/time_between_train_steps": 0.0030968189239501953, "step": 807} +{"info/global_step": 808, "train_info/time_within_train_step": 2.6812376976013184, "step": 808} +{"train_info/time_between_train_steps": 0.0031080245971679688, "step": 808} +{"info/global_step": 809, "train_info/time_within_train_step": 2.6758923530578613, "step": 809} +{"train_info/time_between_train_steps": 0.003088712692260742, "step": 809} +{"info/global_step": 810, "train_info/time_within_train_step": 2.676767110824585, "step": 810} +{"train_info/time_between_train_steps": 0.0030596256256103516, "step": 810} +{"info/global_step": 811, "train_info/time_within_train_step": 2.6761763095855713, "step": 811} +{"train_info/time_between_train_steps": 0.0031003952026367188, "step": 811} +{"info/global_step": 812, "train_info/time_within_train_step": 2.675443172454834, "step": 812} +{"train_info/time_between_train_steps": 0.0030515193939208984, "step": 812} +{"info/global_step": 813, "train_info/time_within_train_step": 2.676990032196045, "step": 813} +{"train_info/time_between_train_steps": 0.0030422210693359375, "step": 813} +{"info/global_step": 814, "train_info/time_within_train_step": 2.6762218475341797, "step": 814} +{"train_info/time_between_train_steps": 0.003043651580810547, "step": 814} +{"info/global_step": 815, "train_info/time_within_train_step": 2.676254987716675, "step": 815} +{"train_info/time_between_train_steps": 0.0030975341796875, "step": 815} +{"info/global_step": 816, "train_info/time_within_train_step": 2.6768789291381836, "step": 816} +{"train_info/time_between_train_steps": 0.0030395984649658203, "step": 816} +{"info/global_step": 817, "train_info/time_within_train_step": 2.676417350769043, "step": 817} +{"train_info/time_between_train_steps": 0.0030672550201416016, "step": 817} +{"info/global_step": 818, "train_info/time_within_train_step": 2.6769115924835205, "step": 818} +{"train_info/time_between_train_steps": 0.0030472278594970703, "step": 818} +{"info/global_step": 819, "train_info/time_within_train_step": 2.6763358116149902, "step": 819} +{"train_info/time_between_train_steps": 0.0030651092529296875, "step": 819} +{"info/global_step": 820, "train_info/time_within_train_step": 2.676568031311035, "step": 820} +{"train_info/time_between_train_steps": 0.003137350082397461, "step": 820} +{"info/global_step": 821, "train_info/time_within_train_step": 2.6765692234039307, "step": 821} +{"train_info/time_between_train_steps": 0.003042936325073242, "step": 821} +{"info/global_step": 822, "train_info/time_within_train_step": 2.674868106842041, "step": 822} +{"train_info/time_between_train_steps": 0.0030968189239501953, "step": 822} +{"info/global_step": 823, "train_info/time_within_train_step": 2.6748108863830566, "step": 823} +{"train_info/time_between_train_steps": 0.003034353256225586, "step": 823} +{"info/global_step": 824, "train_info/time_within_train_step": 2.6763601303100586, "step": 824} +{"train_info/time_between_train_steps": 0.003095388412475586, "step": 824} +{"info/global_step": 825, "train_info/time_within_train_step": 2.676358938217163, "step": 825} +{"train_info/time_between_train_steps": 0.003058910369873047, "step": 825} +{"info/global_step": 826, "train_info/time_within_train_step": 2.6748952865600586, "step": 826} +{"train_info/time_between_train_steps": 0.003043651580810547, "step": 826} +{"info/global_step": 827, "train_info/time_within_train_step": 2.6760029792785645, "step": 827} +{"train_info/time_between_train_steps": 0.003127574920654297, "step": 827} +{"info/global_step": 828, "train_info/time_within_train_step": 2.6760685443878174, "step": 828} +{"train_info/time_between_train_steps": 0.0030651092529296875, "step": 828} +{"info/global_step": 829, "train_info/time_within_train_step": 2.676126003265381, "step": 829} +{"train_info/time_between_train_steps": 0.003029346466064453, "step": 829} +{"info/global_step": 830, "train_info/time_within_train_step": 2.6753382682800293, "step": 830} +{"train_info/time_between_train_steps": 0.0030748844146728516, "step": 830} +{"info/global_step": 831, "train_info/time_within_train_step": 2.676036834716797, "step": 831} +{"train_info/time_between_train_steps": 0.003128528594970703, "step": 831} +{"info/global_step": 832, "train_info/time_within_train_step": 2.6765201091766357, "step": 832} +{"train_info/time_between_train_steps": 0.00311279296875, "step": 832} +{"info/global_step": 833, "train_info/time_within_train_step": 2.6748178005218506, "step": 833} +{"train_info/time_between_train_steps": 0.003122568130493164, "step": 833} +{"info/global_step": 834, "train_info/time_within_train_step": 2.675177812576294, "step": 834} +{"train_info/time_between_train_steps": 0.003177165985107422, "step": 834} +{"info/global_step": 835, "train_info/time_within_train_step": 2.674163579940796, "step": 835} +{"train_info/time_between_train_steps": 0.0030362606048583984, "step": 835} +{"info/global_step": 836, "train_info/time_within_train_step": 2.6749653816223145, "step": 836} +{"train_info/time_between_train_steps": 0.003153562545776367, "step": 836} +{"info/global_step": 837, "train_info/time_within_train_step": 2.6739141941070557, "step": 837} +{"train_info/time_between_train_steps": 0.0031173229217529297, "step": 837} +{"info/global_step": 838, "train_info/time_within_train_step": 2.6747019290924072, "step": 838} +{"train_info/time_between_train_steps": 0.003121614456176758, "step": 838} +{"info/global_step": 839, "train_info/time_within_train_step": 2.6743907928466797, "step": 839} +{"train_info/time_between_train_steps": 0.0031108856201171875, "step": 839} +{"info/global_step": 840, "train_info/time_within_train_step": 2.6750924587249756, "step": 840} +{"train_info/time_between_train_steps": 0.003149271011352539, "step": 840} +{"info/global_step": 841, "train_info/time_within_train_step": 2.6755778789520264, "step": 841} +{"train_info/time_between_train_steps": 0.0031354427337646484, "step": 841} +{"info/global_step": 842, "train_info/time_within_train_step": 2.6750128269195557, "step": 842} +{"train_info/time_between_train_steps": 0.0031554698944091797, "step": 842} +{"info/global_step": 843, "train_info/time_within_train_step": 2.6757290363311768, "step": 843} +{"train_info/time_between_train_steps": 0.0032701492309570312, "step": 843} +{"info/global_step": 844, "train_info/time_within_train_step": 2.6750118732452393, "step": 844} +{"train_info/time_between_train_steps": 0.0032546520233154297, "step": 844} +{"info/global_step": 845, "train_info/time_within_train_step": 2.674468994140625, "step": 845} +{"train_info/time_between_train_steps": 0.0031890869140625, "step": 845} +{"info/global_step": 846, "train_info/time_within_train_step": 2.6752521991729736, "step": 846} +{"train_info/time_between_train_steps": 0.003223896026611328, "step": 846} +{"info/global_step": 847, "train_info/time_within_train_step": 2.675159454345703, "step": 847} +{"train_info/time_between_train_steps": 0.0032112598419189453, "step": 847} +{"info/global_step": 848, "train_info/time_within_train_step": 2.6750364303588867, "step": 848} +{"train_info/time_between_train_steps": 0.0033223628997802734, "step": 848} +{"info/global_step": 849, "train_info/time_within_train_step": 2.673990488052368, "step": 849} +{"train_info/time_between_train_steps": 0.003288745880126953, "step": 849} +{"info/global_step": 850, "train_info/time_within_train_step": 2.6741979122161865, "step": 850} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746205693, "_runtime": 2465}, "step": 850} +{"logs": {"train/loss": 4.7261, "train/learning_rate": 0.0004777777777777777, "train/epoch": 0.28, "_timestamp": 1746205693, "_runtime": 2465}, "step": 850} +{"train_info/time_between_train_steps": 0.02471303939819336, "step": 850} +{"info/global_step": 851, "train_info/time_within_train_step": 2.6744632720947266, "step": 851} +{"train_info/time_between_train_steps": 0.0034139156341552734, "step": 851} +{"info/global_step": 852, "train_info/time_within_train_step": 2.674457311630249, "step": 852} +{"train_info/time_between_train_steps": 0.0033681392669677734, "step": 852} +{"info/global_step": 853, "train_info/time_within_train_step": 2.6758718490600586, "step": 853} +{"train_info/time_between_train_steps": 0.003420114517211914, "step": 853} +{"info/global_step": 854, "train_info/time_within_train_step": 2.6757898330688477, "step": 854} +{"train_info/time_between_train_steps": 0.003396272659301758, "step": 854} +{"info/global_step": 855, "train_info/time_within_train_step": 2.6753315925598145, "step": 855} +{"train_info/time_between_train_steps": 0.0034067630767822266, "step": 855} +{"info/global_step": 856, "train_info/time_within_train_step": 2.676050901412964, "step": 856} +{"train_info/time_between_train_steps": 0.003388643264770508, "step": 856} +{"info/global_step": 857, "train_info/time_within_train_step": 2.676037073135376, "step": 857} +{"train_info/time_between_train_steps": 0.0036101341247558594, "step": 857} +{"info/global_step": 858, "train_info/time_within_train_step": 2.6759986877441406, "step": 858} +{"train_info/time_between_train_steps": 0.003398895263671875, "step": 858} +{"info/global_step": 859, "train_info/time_within_train_step": 2.6768293380737305, "step": 859} +{"train_info/time_between_train_steps": 0.0036809444427490234, "step": 859} +{"info/global_step": 860, "train_info/time_within_train_step": 2.676577568054199, "step": 860} +{"train_info/time_between_train_steps": 0.0034263134002685547, "step": 860} +{"info/global_step": 861, "train_info/time_within_train_step": 2.6758954524993896, "step": 861} +{"train_info/time_between_train_steps": 0.003897428512573242, "step": 861} +{"info/global_step": 862, "train_info/time_within_train_step": 2.67769455909729, "step": 862} +{"train_info/time_between_train_steps": 0.0037813186645507812, "step": 862} +{"info/global_step": 863, "train_info/time_within_train_step": 2.6765685081481934, "step": 863} +{"train_info/time_between_train_steps": 0.003802061080932617, "step": 863} +{"info/global_step": 864, "train_info/time_within_train_step": 2.6769838333129883, "step": 864} +{"train_info/time_between_train_steps": 0.003436565399169922, "step": 864} +{"train_info/time_between_train_steps": 2.5015804767608643, "step": 864} +{"info/global_step": 865, "train_info/time_within_train_step": 2.6326770782470703, "step": 865} +{"train_info/time_between_train_steps": 0.0032837390899658203, "step": 865} +{"info/global_step": 866, "train_info/time_within_train_step": 2.6739907264709473, "step": 866} +{"train_info/time_between_train_steps": 0.003301382064819336, "step": 866} +{"info/global_step": 867, "train_info/time_within_train_step": 2.6743710041046143, "step": 867} +{"train_info/time_between_train_steps": 0.0033681392669677734, "step": 867} +{"info/global_step": 868, "train_info/time_within_train_step": 2.6756365299224854, "step": 868} +{"train_info/time_between_train_steps": 0.0032815933227539062, "step": 868} +{"info/global_step": 869, "train_info/time_within_train_step": 2.6752755641937256, "step": 869} +{"train_info/time_between_train_steps": 0.003312349319458008, "step": 869} +{"info/global_step": 870, "train_info/time_within_train_step": 2.675274610519409, "step": 870} +{"train_info/time_between_train_steps": 0.0033071041107177734, "step": 870} +{"info/global_step": 871, "train_info/time_within_train_step": 2.6753458976745605, "step": 871} +{"train_info/time_between_train_steps": 0.0033445358276367188, "step": 871} +{"info/global_step": 872, "train_info/time_within_train_step": 2.7153220176696777, "step": 872} +{"train_info/time_between_train_steps": 0.003299713134765625, "step": 872} +{"info/global_step": 873, "train_info/time_within_train_step": 2.6760828495025635, "step": 873} +{"train_info/time_between_train_steps": 0.0032727718353271484, "step": 873} +{"info/global_step": 874, "train_info/time_within_train_step": 2.6751761436462402, "step": 874} +{"train_info/time_between_train_steps": 0.0033004283905029297, "step": 874} +{"info/global_step": 875, "train_info/time_within_train_step": 2.674996852874756, "step": 875} +{"train_info/time_between_train_steps": 0.003293752670288086, "step": 875} +{"info/global_step": 876, "train_info/time_within_train_step": 2.674607038497925, "step": 876} +{"train_info/time_between_train_steps": 0.003329038619995117, "step": 876} +{"info/global_step": 877, "train_info/time_within_train_step": 2.6740269660949707, "step": 877} +{"train_info/time_between_train_steps": 0.003292083740234375, "step": 877} +{"info/global_step": 878, "train_info/time_within_train_step": 2.673889398574829, "step": 878} +{"train_info/time_between_train_steps": 0.0032684803009033203, "step": 878} +{"info/global_step": 879, "train_info/time_within_train_step": 2.6748616695404053, "step": 879} +{"train_info/time_between_train_steps": 0.003330707550048828, "step": 879} +{"info/global_step": 880, "train_info/time_within_train_step": 2.6738107204437256, "step": 880} +{"train_info/time_between_train_steps": 0.003314971923828125, "step": 880} +{"info/global_step": 881, "train_info/time_within_train_step": 2.6745669841766357, "step": 881} +{"train_info/time_between_train_steps": 0.0032927989959716797, "step": 881} +{"info/global_step": 882, "train_info/time_within_train_step": 2.88620924949646, "step": 882} +{"train_info/time_between_train_steps": 0.003296375274658203, "step": 882} +{"info/global_step": 883, "train_info/time_within_train_step": 2.6742539405822754, "step": 883} +{"train_info/time_between_train_steps": 0.0033016204833984375, "step": 883} +{"info/global_step": 884, "train_info/time_within_train_step": 2.674384832382202, "step": 884} +{"train_info/time_between_train_steps": 0.0032846927642822266, "step": 884} +{"info/global_step": 885, "train_info/time_within_train_step": 2.673966407775879, "step": 885} +{"train_info/time_between_train_steps": 0.0032830238342285156, "step": 885} +{"info/global_step": 886, "train_info/time_within_train_step": 2.675058603286743, "step": 886} +{"train_info/time_between_train_steps": 0.003330230712890625, "step": 886} +{"info/global_step": 887, "train_info/time_within_train_step": 2.674032211303711, "step": 887} +{"train_info/time_between_train_steps": 0.003271341323852539, "step": 887} +{"info/global_step": 888, "train_info/time_within_train_step": 2.674504518508911, "step": 888} +{"train_info/time_between_train_steps": 0.0033562183380126953, "step": 888} +{"info/global_step": 889, "train_info/time_within_train_step": 2.674862861633301, "step": 889} +{"train_info/time_between_train_steps": 0.0033347606658935547, "step": 889} +{"info/global_step": 890, "train_info/time_within_train_step": 2.6748998165130615, "step": 890} +{"train_info/time_between_train_steps": 0.003305673599243164, "step": 890} +{"info/global_step": 891, "train_info/time_within_train_step": 2.6752688884735107, "step": 891} +{"train_info/time_between_train_steps": 0.003266572952270508, "step": 891} +{"info/global_step": 892, "train_info/time_within_train_step": 2.674859046936035, "step": 892} +{"train_info/time_between_train_steps": 0.0033071041107177734, "step": 892} +{"info/global_step": 893, "train_info/time_within_train_step": 2.6744890213012695, "step": 893} +{"train_info/time_between_train_steps": 0.0032956600189208984, "step": 893} +{"info/global_step": 894, "train_info/time_within_train_step": 2.6744120121002197, "step": 894} +{"train_info/time_between_train_steps": 0.0032966136932373047, "step": 894} +{"info/global_step": 895, "train_info/time_within_train_step": 2.674999952316284, "step": 895} +{"train_info/time_between_train_steps": 0.0033426284790039062, "step": 895} +{"info/global_step": 896, "train_info/time_within_train_step": 2.6744043827056885, "step": 896} +{"train_info/time_between_train_steps": 0.0033588409423828125, "step": 896} +{"info/global_step": 897, "train_info/time_within_train_step": 2.674135446548462, "step": 897} +{"train_info/time_between_train_steps": 0.0033044815063476562, "step": 897} +{"info/global_step": 898, "train_info/time_within_train_step": 2.673797130584717, "step": 898} +{"train_info/time_between_train_steps": 0.003271341323852539, "step": 898} +{"info/global_step": 899, "train_info/time_within_train_step": 2.6749300956726074, "step": 899} +{"train_info/time_between_train_steps": 0.0033397674560546875, "step": 899} +{"info/global_step": 900, "train_info/time_within_train_step": 2.67388916015625, "step": 900} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746205831, "_runtime": 2603}, "step": 900} +{"logs": {"train/loss": 4.7028, "train/learning_rate": 0.0004666666666666666, "train/epoch": 1.01, "_timestamp": 1746205831, "_runtime": 2603}, "step": 900} +{"train_info/time_between_train_steps": 13.072946310043335, "step": 900} +{"info/global_step": 901, "train_info/time_within_train_step": 2.4765169620513916, "step": 901} +{"train_info/time_between_train_steps": 0.0033118724822998047, "step": 901} +{"info/global_step": 902, "train_info/time_within_train_step": 2.46195912361145, "step": 902} +{"train_info/time_between_train_steps": 0.0033555030822753906, "step": 902} +{"info/global_step": 903, "train_info/time_within_train_step": 2.473090171813965, "step": 903} +{"train_info/time_between_train_steps": 0.003515481948852539, "step": 903} +{"info/global_step": 904, "train_info/time_within_train_step": 2.6495916843414307, "step": 904} +{"train_info/time_between_train_steps": 0.003319978713989258, "step": 904} +{"info/global_step": 905, "train_info/time_within_train_step": 2.673989772796631, "step": 905} +{"train_info/time_between_train_steps": 0.0032958984375, "step": 905} +{"info/global_step": 906, "train_info/time_within_train_step": 2.6750240325927734, "step": 906} +{"train_info/time_between_train_steps": 0.0033156871795654297, "step": 906} +{"info/global_step": 907, "train_info/time_within_train_step": 2.674581289291382, "step": 907} +{"train_info/time_between_train_steps": 0.003319263458251953, "step": 907} +{"info/global_step": 908, "train_info/time_within_train_step": 2.674394369125366, "step": 908} +{"train_info/time_between_train_steps": 0.0033011436462402344, "step": 908} +{"info/global_step": 909, "train_info/time_within_train_step": 2.675112247467041, "step": 909} +{"train_info/time_between_train_steps": 0.003294706344604492, "step": 909} +{"info/global_step": 910, "train_info/time_within_train_step": 2.6745102405548096, "step": 910} +{"train_info/time_between_train_steps": 0.003323078155517578, "step": 910} +{"info/global_step": 911, "train_info/time_within_train_step": 2.676384687423706, "step": 911} +{"train_info/time_between_train_steps": 0.003304004669189453, "step": 911} +{"info/global_step": 912, "train_info/time_within_train_step": 2.7132978439331055, "step": 912} +{"train_info/time_between_train_steps": 0.0032906532287597656, "step": 912} +{"info/global_step": 913, "train_info/time_within_train_step": 2.676063299179077, "step": 913} +{"train_info/time_between_train_steps": 0.003630399703979492, "step": 913} +{"info/global_step": 914, "train_info/time_within_train_step": 2.6761066913604736, "step": 914} +{"train_info/time_between_train_steps": 0.0032656192779541016, "step": 914} +{"info/global_step": 915, "train_info/time_within_train_step": 2.6760826110839844, "step": 915} +{"train_info/time_between_train_steps": 0.0033423900604248047, "step": 915} +{"info/global_step": 916, "train_info/time_within_train_step": 2.6760191917419434, "step": 916} +{"train_info/time_between_train_steps": 0.0032854080200195312, "step": 916} +{"info/global_step": 917, "train_info/time_within_train_step": 2.675577402114868, "step": 917} +{"train_info/time_between_train_steps": 0.0033385753631591797, "step": 917} +{"info/global_step": 918, "train_info/time_within_train_step": 2.677330255508423, "step": 918} +{"train_info/time_between_train_steps": 0.003322601318359375, "step": 918} +{"info/global_step": 919, "train_info/time_within_train_step": 2.6774659156799316, "step": 919} +{"train_info/time_between_train_steps": 0.0033299922943115234, "step": 919} +{"info/global_step": 920, "train_info/time_within_train_step": 2.676471471786499, "step": 920} +{"train_info/time_between_train_steps": 0.0032782554626464844, "step": 920} +{"info/global_step": 921, "train_info/time_within_train_step": 2.6767587661743164, "step": 921} +{"train_info/time_between_train_steps": 0.003311634063720703, "step": 921} +{"info/global_step": 922, "train_info/time_within_train_step": 2.676800012588501, "step": 922} +{"train_info/time_between_train_steps": 0.0032875537872314453, "step": 922} +{"info/global_step": 923, "train_info/time_within_train_step": 2.6771230697631836, "step": 923} +{"train_info/time_between_train_steps": 0.0032949447631835938, "step": 923} +{"info/global_step": 924, "train_info/time_within_train_step": 2.6761178970336914, "step": 924} +{"train_info/time_between_train_steps": 0.0032529830932617188, "step": 924} +{"info/global_step": 925, "train_info/time_within_train_step": 2.6762168407440186, "step": 925} +{"train_info/time_between_train_steps": 0.0033507347106933594, "step": 925} +{"info/global_step": 926, "train_info/time_within_train_step": 2.676121950149536, "step": 926} +{"train_info/time_between_train_steps": 0.003284454345703125, "step": 926} +{"info/global_step": 927, "train_info/time_within_train_step": 2.791105031967163, "step": 927} +{"train_info/time_between_train_steps": 0.003345966339111328, "step": 927} +{"info/global_step": 928, "train_info/time_within_train_step": 2.676642417907715, "step": 928} +{"train_info/time_between_train_steps": 0.0033397674560546875, "step": 928} +{"info/global_step": 929, "train_info/time_within_train_step": 2.6776797771453857, "step": 929} +{"train_info/time_between_train_steps": 0.0033538341522216797, "step": 929} +{"info/global_step": 930, "train_info/time_within_train_step": 2.6766088008880615, "step": 930} +{"train_info/time_between_train_steps": 0.0033731460571289062, "step": 930} +{"info/global_step": 931, "train_info/time_within_train_step": 2.6772379875183105, "step": 931} +{"train_info/time_between_train_steps": 0.0033409595489501953, "step": 931} +{"info/global_step": 932, "train_info/time_within_train_step": 2.6768569946289062, "step": 932} +{"train_info/time_between_train_steps": 0.0033311843872070312, "step": 932} +{"info/global_step": 933, "train_info/time_within_train_step": 2.676887273788452, "step": 933} +{"train_info/time_between_train_steps": 0.0033721923828125, "step": 933} +{"info/global_step": 934, "train_info/time_within_train_step": 2.6761057376861572, "step": 934} +{"train_info/time_between_train_steps": 0.003316164016723633, "step": 934} +{"info/global_step": 935, "train_info/time_within_train_step": 2.6770553588867188, "step": 935} +{"train_info/time_between_train_steps": 0.0033164024353027344, "step": 935} +{"info/global_step": 936, "train_info/time_within_train_step": 2.6754047870635986, "step": 936} +{"train_info/time_between_train_steps": 0.0033540725708007812, "step": 936} +{"info/global_step": 937, "train_info/time_within_train_step": 2.673859119415283, "step": 937} +{"train_info/time_between_train_steps": 0.0033457279205322266, "step": 937} +{"info/global_step": 938, "train_info/time_within_train_step": 2.676380157470703, "step": 938} +{"train_info/time_between_train_steps": 0.00339508056640625, "step": 938} +{"info/global_step": 939, "train_info/time_within_train_step": 2.676206350326538, "step": 939} +{"train_info/time_between_train_steps": 0.0033617019653320312, "step": 939} +{"info/global_step": 940, "train_info/time_within_train_step": 2.89808988571167, "step": 940} +{"train_info/time_between_train_steps": 0.0033452510833740234, "step": 940} +{"info/global_step": 941, "train_info/time_within_train_step": 2.674740791320801, "step": 941} +{"train_info/time_between_train_steps": 0.0033631324768066406, "step": 941} +{"info/global_step": 942, "train_info/time_within_train_step": 2.674987554550171, "step": 942} +{"train_info/time_between_train_steps": 0.003289937973022461, "step": 942} +{"info/global_step": 943, "train_info/time_within_train_step": 2.6758570671081543, "step": 943} +{"train_info/time_between_train_steps": 0.0033130645751953125, "step": 943} +{"info/global_step": 944, "train_info/time_within_train_step": 2.6748406887054443, "step": 944} +{"train_info/time_between_train_steps": 0.003332376480102539, "step": 944} +{"info/global_step": 945, "train_info/time_within_train_step": 2.674546957015991, "step": 945} +{"train_info/time_between_train_steps": 0.003317117691040039, "step": 945} +{"info/global_step": 946, "train_info/time_within_train_step": 2.674992084503174, "step": 946} +{"train_info/time_between_train_steps": 0.0033121109008789062, "step": 946} +{"info/global_step": 947, "train_info/time_within_train_step": 2.676093578338623, "step": 947} +{"train_info/time_between_train_steps": 0.0033767223358154297, "step": 947} +{"info/global_step": 948, "train_info/time_within_train_step": 2.675351858139038, "step": 948} +{"train_info/time_between_train_steps": 0.0034224987030029297, "step": 948} +{"info/global_step": 949, "train_info/time_within_train_step": 2.675276279449463, "step": 949} +{"train_info/time_between_train_steps": 0.00336456298828125, "step": 949} +{"info/global_step": 950, "train_info/time_within_train_step": 2.67704701423645, "step": 950} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746205979, "_runtime": 2751}, "step": 950} +{"logs": {"train/loss": 4.6217, "train/learning_rate": 0.00045555555555555556, "train/epoch": 1.03, "_timestamp": 1746205979, "_runtime": 2751}, "step": 950} +{"train_info/time_between_train_steps": 0.0241391658782959, "step": 950} +{"info/global_step": 951, "train_info/time_within_train_step": 2.6765313148498535, "step": 951} +{"train_info/time_between_train_steps": 0.0033206939697265625, "step": 951} +{"info/global_step": 952, "train_info/time_within_train_step": 2.67594051361084, "step": 952} +{"train_info/time_between_train_steps": 0.0034575462341308594, "step": 952} +{"info/global_step": 953, "train_info/time_within_train_step": 2.6752843856811523, "step": 953} +{"train_info/time_between_train_steps": 0.0032935142517089844, "step": 953} +{"info/global_step": 954, "train_info/time_within_train_step": 2.6760005950927734, "step": 954} +{"train_info/time_between_train_steps": 0.003302335739135742, "step": 954} +{"info/global_step": 955, "train_info/time_within_train_step": 2.6760168075561523, "step": 955} +{"train_info/time_between_train_steps": 0.0032896995544433594, "step": 955} +{"info/global_step": 956, "train_info/time_within_train_step": 2.6753101348876953, "step": 956} +{"train_info/time_between_train_steps": 0.0033006668090820312, "step": 956} +{"info/global_step": 957, "train_info/time_within_train_step": 2.6742610931396484, "step": 957} +{"train_info/time_between_train_steps": 0.0033173561096191406, "step": 957} +{"info/global_step": 958, "train_info/time_within_train_step": 2.6745095252990723, "step": 958} +{"train_info/time_between_train_steps": 0.003332376480102539, "step": 958} +{"info/global_step": 959, "train_info/time_within_train_step": 2.675065279006958, "step": 959} +{"train_info/time_between_train_steps": 0.0033762454986572266, "step": 959} +{"info/global_step": 960, "train_info/time_within_train_step": 2.6768441200256348, "step": 960} +{"train_info/time_between_train_steps": 0.003366708755493164, "step": 960} +{"info/global_step": 961, "train_info/time_within_train_step": 2.67629337310791, "step": 961} +{"train_info/time_between_train_steps": 0.0033092498779296875, "step": 961} +{"info/global_step": 962, "train_info/time_within_train_step": 2.676905632019043, "step": 962} +{"train_info/time_between_train_steps": 0.003322601318359375, "step": 962} +{"info/global_step": 963, "train_info/time_within_train_step": 2.6767072677612305, "step": 963} +{"train_info/time_between_train_steps": 0.003322601318359375, "step": 963} +{"info/global_step": 964, "train_info/time_within_train_step": 2.676393508911133, "step": 964} +{"train_info/time_between_train_steps": 0.0033333301544189453, "step": 964} +{"info/global_step": 965, "train_info/time_within_train_step": 2.676403045654297, "step": 965} +{"train_info/time_between_train_steps": 0.0033326148986816406, "step": 965} +{"info/global_step": 966, "train_info/time_within_train_step": 2.676574945449829, "step": 966} +{"train_info/time_between_train_steps": 0.0033416748046875, "step": 966} +{"info/global_step": 967, "train_info/time_within_train_step": 2.6760318279266357, "step": 967} +{"train_info/time_between_train_steps": 0.0032854080200195312, "step": 967} +{"info/global_step": 968, "train_info/time_within_train_step": 2.6749753952026367, "step": 968} +{"train_info/time_between_train_steps": 0.003281116485595703, "step": 968} +{"info/global_step": 969, "train_info/time_within_train_step": 2.674752950668335, "step": 969} +{"train_info/time_between_train_steps": 0.003300189971923828, "step": 969} +{"info/global_step": 970, "train_info/time_within_train_step": 2.675246477127075, "step": 970} +{"train_info/time_between_train_steps": 0.003313302993774414, "step": 970} +{"info/global_step": 971, "train_info/time_within_train_step": 2.674821376800537, "step": 971} +{"train_info/time_between_train_steps": 0.0033042430877685547, "step": 971} +{"info/global_step": 972, "train_info/time_within_train_step": 2.681569814682007, "step": 972} +{"train_info/time_between_train_steps": 0.003326416015625, "step": 972} +{"info/global_step": 973, "train_info/time_within_train_step": 2.674704074859619, "step": 973} +{"train_info/time_between_train_steps": 0.003300189971923828, "step": 973} +{"info/global_step": 974, "train_info/time_within_train_step": 2.6745195388793945, "step": 974} +{"train_info/time_between_train_steps": 0.0033092498779296875, "step": 974} +{"info/global_step": 975, "train_info/time_within_train_step": 2.675685167312622, "step": 975} +{"train_info/time_between_train_steps": 0.00328826904296875, "step": 975} +{"info/global_step": 976, "train_info/time_within_train_step": 2.6746017932891846, "step": 976} +{"train_info/time_between_train_steps": 0.003324270248413086, "step": 976} +{"info/global_step": 977, "train_info/time_within_train_step": 2.6746041774749756, "step": 977} +{"train_info/time_between_train_steps": 0.0032892227172851562, "step": 977} +{"info/global_step": 978, "train_info/time_within_train_step": 2.675060272216797, "step": 978} +{"train_info/time_between_train_steps": 0.0032570362091064453, "step": 978} +{"info/global_step": 979, "train_info/time_within_train_step": 2.8958420753479004, "step": 979} +{"train_info/time_between_train_steps": 0.003304719924926758, "step": 979} +{"info/global_step": 980, "train_info/time_within_train_step": 2.6751255989074707, "step": 980} +{"train_info/time_between_train_steps": 0.0032677650451660156, "step": 980} +{"info/global_step": 981, "train_info/time_within_train_step": 2.67503023147583, "step": 981} +{"train_info/time_between_train_steps": 0.003282308578491211, "step": 981} +{"info/global_step": 982, "train_info/time_within_train_step": 2.6744191646575928, "step": 982} +{"train_info/time_between_train_steps": 0.003309011459350586, "step": 982} +{"info/global_step": 983, "train_info/time_within_train_step": 2.6736602783203125, "step": 983} +{"train_info/time_between_train_steps": 0.003293752670288086, "step": 983} +{"info/global_step": 984, "train_info/time_within_train_step": 2.67452073097229, "step": 984} +{"train_info/time_between_train_steps": 0.003289937973022461, "step": 984} +{"info/global_step": 985, "train_info/time_within_train_step": 2.6745517253875732, "step": 985} +{"train_info/time_between_train_steps": 0.003354310989379883, "step": 985} +{"info/global_step": 986, "train_info/time_within_train_step": 2.674835443496704, "step": 986} +{"train_info/time_between_train_steps": 0.0032927989959716797, "step": 986} +{"info/global_step": 987, "train_info/time_within_train_step": 2.675034284591675, "step": 987} +{"train_info/time_between_train_steps": 0.003271341323852539, "step": 987} +{"info/global_step": 988, "train_info/time_within_train_step": 2.67372465133667, "step": 988} +{"train_info/time_between_train_steps": 0.00328826904296875, "step": 988} +{"info/global_step": 989, "train_info/time_within_train_step": 2.6760473251342773, "step": 989} +{"train_info/time_between_train_steps": 0.12318801879882812, "step": 989} +{"info/global_step": 990, "train_info/time_within_train_step": 2.674332618713379, "step": 990} +{"train_info/time_between_train_steps": 0.003309965133666992, "step": 990} +{"info/global_step": 991, "train_info/time_within_train_step": 2.6761410236358643, "step": 991} +{"train_info/time_between_train_steps": 0.003290891647338867, "step": 991} +{"info/global_step": 992, "train_info/time_within_train_step": 2.6745593547821045, "step": 992} +{"train_info/time_between_train_steps": 0.0033528804779052734, "step": 992} +{"info/global_step": 993, "train_info/time_within_train_step": 2.673295497894287, "step": 993} +{"train_info/time_between_train_steps": 0.003323078155517578, "step": 993} +{"info/global_step": 994, "train_info/time_within_train_step": 2.6741364002227783, "step": 994} +{"train_info/time_between_train_steps": 0.003338336944580078, "step": 994} +{"info/global_step": 995, "train_info/time_within_train_step": 2.674647569656372, "step": 995} +{"train_info/time_between_train_steps": 0.0033020973205566406, "step": 995} +{"info/global_step": 996, "train_info/time_within_train_step": 2.674243450164795, "step": 996} +{"train_info/time_between_train_steps": 0.0033524036407470703, "step": 996} +{"info/global_step": 997, "train_info/time_within_train_step": 2.674600124359131, "step": 997} +{"train_info/time_between_train_steps": 0.0033216476440429688, "step": 997} +{"info/global_step": 998, "train_info/time_within_train_step": 2.674755573272705, "step": 998} +{"train_info/time_between_train_steps": 0.0033257007598876953, "step": 998} +{"info/global_step": 999, "train_info/time_within_train_step": 2.674668312072754, "step": 999} +{"train_info/time_between_train_steps": 0.003335237503051758, "step": 999} +{"info/global_step": 1000, "train_info/time_within_train_step": 3.1993703842163086, "step": 1000} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746206114, "_runtime": 2886}, "step": 1000} +{"logs": {"train/loss": 4.6024, "train/learning_rate": 0.00044444444444444436, "train/epoch": 1.05, "_timestamp": 1746206114, "_runtime": 2886}, "step": 1000} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746206120, "_runtime": 2892}, "step": 1000} +{"logs": {"eval/loss": 4.849012851715088, "eval/runtime": 5.621, "eval/samples_per_second": 35.936, "eval/steps_per_second": 1.245, "train/epoch": 1.05, "_timestamp": 1746206120, "_runtime": 2892}, "step": 1000} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746206120, "_runtime": 2892}, "step": 1000} +{"logs": {"eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_loss": 4.849012851715088, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_ppl": 127.61435335786472, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_runtime": 5.621, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_samples_per_second": 35.936, "train/epoch": 1.05, "_timestamp": 1746206120, "_runtime": 2892}, "step": 1000} +{"train_info/time_between_train_steps": 18.66721534729004, "step": 1000} +{"info/global_step": 1001, "train_info/time_within_train_step": 2.4733023643493652, "step": 1001} +{"train_info/time_between_train_steps": 0.0033130645751953125, "step": 1001} +{"info/global_step": 1002, "train_info/time_within_train_step": 2.459758758544922, "step": 1002} +{"train_info/time_between_train_steps": 0.003283262252807617, "step": 1002} +{"info/global_step": 1003, "train_info/time_within_train_step": 2.4650802612304688, "step": 1003} +{"train_info/time_between_train_steps": 0.003248929977416992, "step": 1003} +{"info/global_step": 1004, "train_info/time_within_train_step": 2.625761032104492, "step": 1004} +{"train_info/time_between_train_steps": 0.0032806396484375, "step": 1004} +{"info/global_step": 1005, "train_info/time_within_train_step": 2.6726021766662598, "step": 1005} +{"train_info/time_between_train_steps": 0.003270864486694336, "step": 1005} +{"info/global_step": 1006, "train_info/time_within_train_step": 2.675086498260498, "step": 1006} +{"train_info/time_between_train_steps": 0.003310680389404297, "step": 1006} +{"info/global_step": 1007, "train_info/time_within_train_step": 2.6758763790130615, "step": 1007} +{"train_info/time_between_train_steps": 0.0033304691314697266, "step": 1007} +{"info/global_step": 1008, "train_info/time_within_train_step": 2.6735246181488037, "step": 1008} +{"train_info/time_between_train_steps": 0.0032792091369628906, "step": 1008} +{"info/global_step": 1009, "train_info/time_within_train_step": 2.6733362674713135, "step": 1009} +{"train_info/time_between_train_steps": 0.003303050994873047, "step": 1009} +{"info/global_step": 1010, "train_info/time_within_train_step": 2.674250841140747, "step": 1010} +{"train_info/time_between_train_steps": 0.0033271312713623047, "step": 1010} +{"info/global_step": 1011, "train_info/time_within_train_step": 2.6734156608581543, "step": 1011} +{"train_info/time_between_train_steps": 0.0032358169555664062, "step": 1011} +{"info/global_step": 1012, "train_info/time_within_train_step": 2.674987316131592, "step": 1012} +{"train_info/time_between_train_steps": 0.0032858848571777344, "step": 1012} +{"info/global_step": 1013, "train_info/time_within_train_step": 2.6735990047454834, "step": 1013} +{"train_info/time_between_train_steps": 0.0032684803009033203, "step": 1013} +{"info/global_step": 1014, "train_info/time_within_train_step": 2.6755170822143555, "step": 1014} +{"train_info/time_between_train_steps": 0.0032706260681152344, "step": 1014} +{"info/global_step": 1015, "train_info/time_within_train_step": 2.675636053085327, "step": 1015} +{"train_info/time_between_train_steps": 0.0032749176025390625, "step": 1015} +{"info/global_step": 1016, "train_info/time_within_train_step": 2.674955368041992, "step": 1016} +{"train_info/time_between_train_steps": 0.003249645233154297, "step": 1016} +{"info/global_step": 1017, "train_info/time_within_train_step": 2.6757025718688965, "step": 1017} +{"train_info/time_between_train_steps": 0.003276824951171875, "step": 1017} +{"info/global_step": 1018, "train_info/time_within_train_step": 2.6749606132507324, "step": 1018} +{"train_info/time_between_train_steps": 0.003281831741333008, "step": 1018} +{"info/global_step": 1019, "train_info/time_within_train_step": 2.6756718158721924, "step": 1019} +{"train_info/time_between_train_steps": 0.0033516883850097656, "step": 1019} +{"info/global_step": 1020, "train_info/time_within_train_step": 2.675387382507324, "step": 1020} +{"train_info/time_between_train_steps": 0.003316164016723633, "step": 1020} +{"info/global_step": 1021, "train_info/time_within_train_step": 2.673975706100464, "step": 1021} +{"train_info/time_between_train_steps": 0.0032851696014404297, "step": 1021} +{"info/global_step": 1022, "train_info/time_within_train_step": 2.6749775409698486, "step": 1022} +{"train_info/time_between_train_steps": 0.003258228302001953, "step": 1022} +{"info/global_step": 1023, "train_info/time_within_train_step": 2.675025701522827, "step": 1023} +{"train_info/time_between_train_steps": 0.0032634735107421875, "step": 1023} +{"info/global_step": 1024, "train_info/time_within_train_step": 2.6744935512542725, "step": 1024} +{"train_info/time_between_train_steps": 0.0032396316528320312, "step": 1024} +{"info/global_step": 1025, "train_info/time_within_train_step": 2.6741883754730225, "step": 1025} +{"train_info/time_between_train_steps": 0.0033059120178222656, "step": 1025} +{"info/global_step": 1026, "train_info/time_within_train_step": 2.6748106479644775, "step": 1026} +{"train_info/time_between_train_steps": 0.003296375274658203, "step": 1026} +{"info/global_step": 1027, "train_info/time_within_train_step": 2.675433397293091, "step": 1027} +{"train_info/time_between_train_steps": 0.0032699108123779297, "step": 1027} +{"info/global_step": 1028, "train_info/time_within_train_step": 2.897376537322998, "step": 1028} +{"train_info/time_between_train_steps": 0.003251314163208008, "step": 1028} +{"info/global_step": 1029, "train_info/time_within_train_step": 2.673865556716919, "step": 1029} +{"train_info/time_between_train_steps": 0.0033025741577148438, "step": 1029} +{"info/global_step": 1030, "train_info/time_within_train_step": 2.675008535385132, "step": 1030} +{"train_info/time_between_train_steps": 0.0032606124877929688, "step": 1030} +{"info/global_step": 1031, "train_info/time_within_train_step": 2.6744465827941895, "step": 1031} +{"train_info/time_between_train_steps": 0.003346681594848633, "step": 1031} +{"info/global_step": 1032, "train_info/time_within_train_step": 2.6743857860565186, "step": 1032} +{"train_info/time_between_train_steps": 0.003262042999267578, "step": 1032} +{"info/global_step": 1033, "train_info/time_within_train_step": 2.674417734146118, "step": 1033} +{"train_info/time_between_train_steps": 0.003248929977416992, "step": 1033} +{"info/global_step": 1034, "train_info/time_within_train_step": 2.6751275062561035, "step": 1034} +{"train_info/time_between_train_steps": 0.003256082534790039, "step": 1034} +{"info/global_step": 1035, "train_info/time_within_train_step": 2.6731154918670654, "step": 1035} +{"train_info/time_between_train_steps": 0.0032112598419189453, "step": 1035} +{"info/global_step": 1036, "train_info/time_within_train_step": 2.673021078109741, "step": 1036} +{"train_info/time_between_train_steps": 0.003225564956665039, "step": 1036} +{"info/global_step": 1037, "train_info/time_within_train_step": 2.672881603240967, "step": 1037} +{"train_info/time_between_train_steps": 0.0032575130462646484, "step": 1037} +{"info/global_step": 1038, "train_info/time_within_train_step": 2.672840118408203, "step": 1038} +{"train_info/time_between_train_steps": 0.003263235092163086, "step": 1038} +{"info/global_step": 1039, "train_info/time_within_train_step": 2.678382158279419, "step": 1039} +{"train_info/time_between_train_steps": 0.003217935562133789, "step": 1039} +{"info/global_step": 1040, "train_info/time_within_train_step": 2.6746997833251953, "step": 1040} +{"train_info/time_between_train_steps": 0.0032737255096435547, "step": 1040} +{"info/global_step": 1041, "train_info/time_within_train_step": 2.673274278640747, "step": 1041} +{"train_info/time_between_train_steps": 0.0032739639282226562, "step": 1041} +{"info/global_step": 1042, "train_info/time_within_train_step": 2.6808948516845703, "step": 1042} +{"train_info/time_between_train_steps": 0.0032706260681152344, "step": 1042} +{"info/global_step": 1043, "train_info/time_within_train_step": 2.673711061477661, "step": 1043} +{"train_info/time_between_train_steps": 0.003249645233154297, "step": 1043} +{"info/global_step": 1044, "train_info/time_within_train_step": 2.6745851039886475, "step": 1044} +{"train_info/time_between_train_steps": 0.0032715797424316406, "step": 1044} +{"info/global_step": 1045, "train_info/time_within_train_step": 2.674002170562744, "step": 1045} +{"train_info/time_between_train_steps": 0.003230571746826172, "step": 1045} +{"info/global_step": 1046, "train_info/time_within_train_step": 2.6725552082061768, "step": 1046} +{"train_info/time_between_train_steps": 0.003228425979614258, "step": 1046} +{"info/global_step": 1047, "train_info/time_within_train_step": 2.6723437309265137, "step": 1047} +{"train_info/time_between_train_steps": 0.0032744407653808594, "step": 1047} +{"info/global_step": 1048, "train_info/time_within_train_step": 2.6733663082122803, "step": 1048} +{"train_info/time_between_train_steps": 0.0033698081970214844, "step": 1048} +{"info/global_step": 1049, "train_info/time_within_train_step": 2.672597885131836, "step": 1049} +{"train_info/time_between_train_steps": 0.0032787322998046875, "step": 1049} +{"info/global_step": 1050, "train_info/time_within_train_step": 2.6738202571868896, "step": 1050} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746206268, "_runtime": 3040}, "step": 1050} +{"logs": {"train/loss": 4.5633, "train/learning_rate": 0.0004333333333333333, "train/epoch": 1.06, "_timestamp": 1746206268, "_runtime": 3040}, "step": 1050} +{"train_info/time_between_train_steps": 0.024630308151245117, "step": 1050} +{"info/global_step": 1051, "train_info/time_within_train_step": 2.673280715942383, "step": 1051} +{"train_info/time_between_train_steps": 0.003255605697631836, "step": 1051} +{"info/global_step": 1052, "train_info/time_within_train_step": 2.792039632797241, "step": 1052} +{"train_info/time_between_train_steps": 0.0032851696014404297, "step": 1052} +{"info/global_step": 1053, "train_info/time_within_train_step": 2.6741819381713867, "step": 1053} +{"train_info/time_between_train_steps": 0.003322601318359375, "step": 1053} +{"info/global_step": 1054, "train_info/time_within_train_step": 2.67521595954895, "step": 1054} +{"train_info/time_between_train_steps": 0.0032815933227539062, "step": 1054} +{"info/global_step": 1055, "train_info/time_within_train_step": 2.672395944595337, "step": 1055} +{"train_info/time_between_train_steps": 0.0033195018768310547, "step": 1055} +{"info/global_step": 1056, "train_info/time_within_train_step": 2.6733455657958984, "step": 1056} +{"train_info/time_between_train_steps": 0.0032587051391601562, "step": 1056} +{"info/global_step": 1057, "train_info/time_within_train_step": 2.6745810508728027, "step": 1057} +{"train_info/time_between_train_steps": 0.003263235092163086, "step": 1057} +{"info/global_step": 1058, "train_info/time_within_train_step": 2.6740474700927734, "step": 1058} +{"train_info/time_between_train_steps": 0.003316640853881836, "step": 1058} +{"info/global_step": 1059, "train_info/time_within_train_step": 2.6747398376464844, "step": 1059} +{"train_info/time_between_train_steps": 0.003250598907470703, "step": 1059} +{"info/global_step": 1060, "train_info/time_within_train_step": 2.6743385791778564, "step": 1060} +{"train_info/time_between_train_steps": 0.0032927989959716797, "step": 1060} +{"info/global_step": 1061, "train_info/time_within_train_step": 2.6731808185577393, "step": 1061} +{"train_info/time_between_train_steps": 0.0032608509063720703, "step": 1061} +{"info/global_step": 1062, "train_info/time_within_train_step": 2.673358201980591, "step": 1062} +{"train_info/time_between_train_steps": 0.003233671188354492, "step": 1062} +{"info/global_step": 1063, "train_info/time_within_train_step": 2.674447536468506, "step": 1063} +{"train_info/time_between_train_steps": 0.0032868385314941406, "step": 1063} +{"info/global_step": 1064, "train_info/time_within_train_step": 2.6732747554779053, "step": 1064} +{"train_info/time_between_train_steps": 0.0032606124877929688, "step": 1064} +{"info/global_step": 1065, "train_info/time_within_train_step": 2.6728577613830566, "step": 1065} +{"train_info/time_between_train_steps": 0.0032753944396972656, "step": 1065} +{"info/global_step": 1066, "train_info/time_within_train_step": 2.6738407611846924, "step": 1066} +{"train_info/time_between_train_steps": 0.0033037662506103516, "step": 1066} +{"info/global_step": 1067, "train_info/time_within_train_step": 2.67569899559021, "step": 1067} +{"train_info/time_between_train_steps": 0.0033164024353027344, "step": 1067} +{"info/global_step": 1068, "train_info/time_within_train_step": 2.6757009029388428, "step": 1068} +{"train_info/time_between_train_steps": 0.0032825469970703125, "step": 1068} +{"info/global_step": 1069, "train_info/time_within_train_step": 2.673916816711426, "step": 1069} +{"train_info/time_between_train_steps": 0.0032966136932373047, "step": 1069} +{"info/global_step": 1070, "train_info/time_within_train_step": 2.674785852432251, "step": 1070} +{"train_info/time_between_train_steps": 0.003285646438598633, "step": 1070} +{"info/global_step": 1071, "train_info/time_within_train_step": 2.6756951808929443, "step": 1071} +{"train_info/time_between_train_steps": 0.003287792205810547, "step": 1071} +{"info/global_step": 1072, "train_info/time_within_train_step": 2.6759791374206543, "step": 1072} +{"train_info/time_between_train_steps": 0.003322124481201172, "step": 1072} +{"info/global_step": 1073, "train_info/time_within_train_step": 2.675004243850708, "step": 1073} +{"train_info/time_between_train_steps": 0.0032885074615478516, "step": 1073} +{"info/global_step": 1074, "train_info/time_within_train_step": 2.675503969192505, "step": 1074} +{"train_info/time_between_train_steps": 0.0034351348876953125, "step": 1074} +{"info/global_step": 1075, "train_info/time_within_train_step": 2.673792600631714, "step": 1075} +{"train_info/time_between_train_steps": 0.00330352783203125, "step": 1075} +{"info/global_step": 1076, "train_info/time_within_train_step": 2.6742630004882812, "step": 1076} +{"train_info/time_between_train_steps": 0.0035772323608398438, "step": 1076} +{"info/global_step": 1077, "train_info/time_within_train_step": 2.673295259475708, "step": 1077} +{"train_info/time_between_train_steps": 0.0036590099334716797, "step": 1077} +{"info/global_step": 1078, "train_info/time_within_train_step": 2.6731114387512207, "step": 1078} +{"train_info/time_between_train_steps": 0.0036368370056152344, "step": 1078} +{"info/global_step": 1079, "train_info/time_within_train_step": 2.672916889190674, "step": 1079} +{"train_info/time_between_train_steps": 0.003468751907348633, "step": 1079} +{"info/global_step": 1080, "train_info/time_within_train_step": 2.6736676692962646, "step": 1080} +{"train_info/time_between_train_steps": 0.0035161972045898438, "step": 1080} +{"info/global_step": 1081, "train_info/time_within_train_step": 2.6740431785583496, "step": 1081} +{"train_info/time_between_train_steps": 0.0035359859466552734, "step": 1081} +{"info/global_step": 1082, "train_info/time_within_train_step": 2.674717903137207, "step": 1082} +{"train_info/time_between_train_steps": 0.0035827159881591797, "step": 1082} +{"info/global_step": 1083, "train_info/time_within_train_step": 2.6735775470733643, "step": 1083} +{"train_info/time_between_train_steps": 0.003559112548828125, "step": 1083} +{"info/global_step": 1084, "train_info/time_within_train_step": 2.6749064922332764, "step": 1084} +{"train_info/time_between_train_steps": 0.003622770309448242, "step": 1084} +{"info/global_step": 1085, "train_info/time_within_train_step": 2.6756038665771484, "step": 1085} +{"train_info/time_between_train_steps": 0.0036323070526123047, "step": 1085} +{"info/global_step": 1086, "train_info/time_within_train_step": 2.6759161949157715, "step": 1086} +{"train_info/time_between_train_steps": 0.0037500858306884766, "step": 1086} +{"info/global_step": 1087, "train_info/time_within_train_step": 2.6755857467651367, "step": 1087} +{"train_info/time_between_train_steps": 0.0036911964416503906, "step": 1087} +{"info/global_step": 1088, "train_info/time_within_train_step": 2.6772689819335938, "step": 1088} +{"train_info/time_between_train_steps": 0.003549337387084961, "step": 1088} +{"info/global_step": 1089, "train_info/time_within_train_step": 2.674107551574707, "step": 1089} +{"train_info/time_between_train_steps": 0.0035958290100097656, "step": 1089} +{"info/global_step": 1090, "train_info/time_within_train_step": 2.6744465827941895, "step": 1090} +{"train_info/time_between_train_steps": 0.003590106964111328, "step": 1090} +{"info/global_step": 1091, "train_info/time_within_train_step": 2.6743204593658447, "step": 1091} +{"train_info/time_between_train_steps": 0.003623485565185547, "step": 1091} +{"info/global_step": 1092, "train_info/time_within_train_step": 2.6760971546173096, "step": 1092} +{"train_info/time_between_train_steps": 0.003673076629638672, "step": 1092} +{"info/global_step": 1093, "train_info/time_within_train_step": 2.676818370819092, "step": 1093} +{"train_info/time_between_train_steps": 0.003867626190185547, "step": 1093} +{"info/global_step": 1094, "train_info/time_within_train_step": 2.6759982109069824, "step": 1094} +{"train_info/time_between_train_steps": 0.0036139488220214844, "step": 1094} +{"info/global_step": 1095, "train_info/time_within_train_step": 2.6765732765197754, "step": 1095} +{"train_info/time_between_train_steps": 0.003670930862426758, "step": 1095} +{"info/global_step": 1096, "train_info/time_within_train_step": 2.674384832382202, "step": 1096} +{"train_info/time_between_train_steps": 0.003630399703979492, "step": 1096} +{"info/global_step": 1097, "train_info/time_within_train_step": 2.673959493637085, "step": 1097} +{"train_info/time_between_train_steps": 0.003542661666870117, "step": 1097} +{"info/global_step": 1098, "train_info/time_within_train_step": 2.6737828254699707, "step": 1098} +{"train_info/time_between_train_steps": 0.003503561019897461, "step": 1098} +{"info/global_step": 1099, "train_info/time_within_train_step": 2.6729788780212402, "step": 1099} +{"train_info/time_between_train_steps": 0.003571748733520508, "step": 1099} +{"info/global_step": 1100, "train_info/time_within_train_step": 2.674391269683838, "step": 1100} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746206403, "_runtime": 3175}, "step": 1100} +{"logs": {"train/loss": 4.5344, "train/learning_rate": 0.0004222222222222222, "train/epoch": 1.08, "_timestamp": 1746206403, "_runtime": 3175}, "step": 1100} +{"train_info/time_between_train_steps": 13.48010540008545, "step": 1100} +{"info/global_step": 1101, "train_info/time_within_train_step": 2.5148661136627197, "step": 1101} +{"train_info/time_between_train_steps": 0.0035772323608398438, "step": 1101} +{"info/global_step": 1102, "train_info/time_within_train_step": 2.4594202041625977, "step": 1102} +{"train_info/time_between_train_steps": 0.0034856796264648438, "step": 1102} +{"info/global_step": 1103, "train_info/time_within_train_step": 2.476736545562744, "step": 1103} +{"train_info/time_between_train_steps": 0.0035638809204101562, "step": 1103} +{"info/global_step": 1104, "train_info/time_within_train_step": 2.6574339866638184, "step": 1104} +{"train_info/time_between_train_steps": 0.003565549850463867, "step": 1104} +{"info/global_step": 1105, "train_info/time_within_train_step": 2.6721370220184326, "step": 1105} +{"train_info/time_between_train_steps": 0.0035665035247802734, "step": 1105} +{"info/global_step": 1106, "train_info/time_within_train_step": 2.6741528511047363, "step": 1106} +{"train_info/time_between_train_steps": 0.0034041404724121094, "step": 1106} +{"info/global_step": 1107, "train_info/time_within_train_step": 3.011936902999878, "step": 1107} +{"train_info/time_between_train_steps": 0.003242969512939453, "step": 1107} +{"info/global_step": 1108, "train_info/time_within_train_step": 2.6727936267852783, "step": 1108} +{"train_info/time_between_train_steps": 0.0032606124877929688, "step": 1108} +{"info/global_step": 1109, "train_info/time_within_train_step": 2.674952745437622, "step": 1109} +{"train_info/time_between_train_steps": 0.0032901763916015625, "step": 1109} +{"info/global_step": 1110, "train_info/time_within_train_step": 2.674121856689453, "step": 1110} +{"train_info/time_between_train_steps": 0.003281831741333008, "step": 1110} +{"info/global_step": 1111, "train_info/time_within_train_step": 2.6743717193603516, "step": 1111} +{"train_info/time_between_train_steps": 0.003297090530395508, "step": 1111} +{"info/global_step": 1112, "train_info/time_within_train_step": 2.6757988929748535, "step": 1112} +{"train_info/time_between_train_steps": 0.0032427310943603516, "step": 1112} +{"info/global_step": 1113, "train_info/time_within_train_step": 2.6745009422302246, "step": 1113} +{"train_info/time_between_train_steps": 0.0032536983489990234, "step": 1113} +{"info/global_step": 1114, "train_info/time_within_train_step": 2.6754422187805176, "step": 1114} +{"train_info/time_between_train_steps": 0.14116740226745605, "step": 1114} +{"info/global_step": 1115, "train_info/time_within_train_step": 2.6750423908233643, "step": 1115} +{"train_info/time_between_train_steps": 0.0032415390014648438, "step": 1115} +{"info/global_step": 1116, "train_info/time_within_train_step": 2.6734468936920166, "step": 1116} +{"train_info/time_between_train_steps": 0.0033164024353027344, "step": 1116} +{"info/global_step": 1117, "train_info/time_within_train_step": 2.674443006515503, "step": 1117} +{"train_info/time_between_train_steps": 0.0033147335052490234, "step": 1117} +{"info/global_step": 1118, "train_info/time_within_train_step": 2.6735427379608154, "step": 1118} +{"train_info/time_between_train_steps": 0.0032944679260253906, "step": 1118} +{"info/global_step": 1119, "train_info/time_within_train_step": 2.674574136734009, "step": 1119} +{"train_info/time_between_train_steps": 0.0032906532287597656, "step": 1119} +{"info/global_step": 1120, "train_info/time_within_train_step": 2.674530029296875, "step": 1120} +{"train_info/time_between_train_steps": 0.003360271453857422, "step": 1120} +{"info/global_step": 1121, "train_info/time_within_train_step": 2.673719882965088, "step": 1121} +{"train_info/time_between_train_steps": 0.0032720565795898438, "step": 1121} +{"info/global_step": 1122, "train_info/time_within_train_step": 2.6741316318511963, "step": 1122} +{"train_info/time_between_train_steps": 0.0032520294189453125, "step": 1122} +{"info/global_step": 1123, "train_info/time_within_train_step": 2.6741528511047363, "step": 1123} +{"train_info/time_between_train_steps": 0.0032842159271240234, "step": 1123} +{"info/global_step": 1124, "train_info/time_within_train_step": 2.6748695373535156, "step": 1124} +{"train_info/time_between_train_steps": 0.0032796859741210938, "step": 1124} +{"info/global_step": 1125, "train_info/time_within_train_step": 2.6736230850219727, "step": 1125} +{"train_info/time_between_train_steps": 0.0032815933227539062, "step": 1125} +{"info/global_step": 1126, "train_info/time_within_train_step": 2.6744651794433594, "step": 1126} +{"train_info/time_between_train_steps": 0.0032520294189453125, "step": 1126} +{"info/global_step": 1127, "train_info/time_within_train_step": 2.673827648162842, "step": 1127} +{"train_info/time_between_train_steps": 0.003282785415649414, "step": 1127} +{"info/global_step": 1128, "train_info/time_within_train_step": 2.6750359535217285, "step": 1128} +{"train_info/time_between_train_steps": 0.0033049583435058594, "step": 1128} +{"info/global_step": 1129, "train_info/time_within_train_step": 2.6728086471557617, "step": 1129} +{"train_info/time_between_train_steps": 0.003233671188354492, "step": 1129} +{"info/global_step": 1130, "train_info/time_within_train_step": 2.6736040115356445, "step": 1130} +{"train_info/time_between_train_steps": 0.003260374069213867, "step": 1130} +{"info/global_step": 1131, "train_info/time_within_train_step": 2.6734042167663574, "step": 1131} +{"train_info/time_between_train_steps": 0.0032901763916015625, "step": 1131} +{"info/global_step": 1132, "train_info/time_within_train_step": 2.6734023094177246, "step": 1132} +{"train_info/time_between_train_steps": 0.0032122135162353516, "step": 1132} +{"info/global_step": 1133, "train_info/time_within_train_step": 2.673551559448242, "step": 1133} +{"train_info/time_between_train_steps": 0.003211498260498047, "step": 1133} +{"info/global_step": 1134, "train_info/time_within_train_step": 2.6732547283172607, "step": 1134} +{"train_info/time_between_train_steps": 0.003331422805786133, "step": 1134} +{"info/global_step": 1135, "train_info/time_within_train_step": 2.6734468936920166, "step": 1135} +{"train_info/time_between_train_steps": 0.003256559371948242, "step": 1135} +{"info/global_step": 1136, "train_info/time_within_train_step": 2.6724681854248047, "step": 1136} +{"train_info/time_between_train_steps": 0.00323486328125, "step": 1136} +{"info/global_step": 1137, "train_info/time_within_train_step": 2.672834634780884, "step": 1137} +{"train_info/time_between_train_steps": 0.003229856491088867, "step": 1137} +{"info/global_step": 1138, "train_info/time_within_train_step": 2.6744933128356934, "step": 1138} +{"train_info/time_between_train_steps": 0.0032172203063964844, "step": 1138} +{"info/global_step": 1139, "train_info/time_within_train_step": 2.6723835468292236, "step": 1139} +{"train_info/time_between_train_steps": 0.0031862258911132812, "step": 1139} +{"info/global_step": 1140, "train_info/time_within_train_step": 2.673335552215576, "step": 1140} +{"train_info/time_between_train_steps": 0.0033159255981445312, "step": 1140} +{"info/global_step": 1141, "train_info/time_within_train_step": 2.673807382583618, "step": 1141} +{"train_info/time_between_train_steps": 0.0032639503479003906, "step": 1141} +{"info/global_step": 1142, "train_info/time_within_train_step": 2.674018383026123, "step": 1142} +{"train_info/time_between_train_steps": 0.003288745880126953, "step": 1142} +{"info/global_step": 1143, "train_info/time_within_train_step": 2.676694631576538, "step": 1143} +{"train_info/time_between_train_steps": 0.0034203529357910156, "step": 1143} +{"info/global_step": 1144, "train_info/time_within_train_step": 2.673837900161743, "step": 1144} +{"train_info/time_between_train_steps": 0.0033562183380126953, "step": 1144} +{"info/global_step": 1145, "train_info/time_within_train_step": 2.6728105545043945, "step": 1145} +{"train_info/time_between_train_steps": 0.0032396316528320312, "step": 1145} +{"info/global_step": 1146, "train_info/time_within_train_step": 2.6713995933532715, "step": 1146} +{"train_info/time_between_train_steps": 0.0032439231872558594, "step": 1146} +{"info/global_step": 1147, "train_info/time_within_train_step": 2.6740012168884277, "step": 1147} +{"train_info/time_between_train_steps": 0.003453969955444336, "step": 1147} +{"info/global_step": 1148, "train_info/time_within_train_step": 2.672837972640991, "step": 1148} +{"train_info/time_between_train_steps": 0.003475666046142578, "step": 1148} +{"info/global_step": 1149, "train_info/time_within_train_step": 2.6751155853271484, "step": 1149} +{"train_info/time_between_train_steps": 0.003687620162963867, "step": 1149} +{"info/global_step": 1150, "train_info/time_within_train_step": 2.677260398864746, "step": 1150} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746206551, "_runtime": 3323}, "step": 1150} +{"logs": {"train/loss": 4.4915, "train/learning_rate": 0.0004111111111111111, "train/epoch": 1.1, "_timestamp": 1746206551, "_runtime": 3323}, "step": 1150} +{"train_info/time_between_train_steps": 0.024641036987304688, "step": 1150} +{"info/global_step": 1151, "train_info/time_within_train_step": 2.6767241954803467, "step": 1151} +{"train_info/time_between_train_steps": 0.0036749839782714844, "step": 1151} +{"info/global_step": 1152, "train_info/time_within_train_step": 2.6758759021759033, "step": 1152} +{"train_info/time_between_train_steps": 0.0036478042602539062, "step": 1152} +{"info/global_step": 1153, "train_info/time_within_train_step": 2.6766035556793213, "step": 1153} +{"train_info/time_between_train_steps": 0.0037255287170410156, "step": 1153} +{"info/global_step": 1154, "train_info/time_within_train_step": 2.6752984523773193, "step": 1154} +{"train_info/time_between_train_steps": 0.003628969192504883, "step": 1154} +{"info/global_step": 1155, "train_info/time_within_train_step": 2.6753573417663574, "step": 1155} +{"train_info/time_between_train_steps": 0.0036530494689941406, "step": 1155} +{"info/global_step": 1156, "train_info/time_within_train_step": 2.674187421798706, "step": 1156} +{"train_info/time_between_train_steps": 0.0036993026733398438, "step": 1156} +{"info/global_step": 1157, "train_info/time_within_train_step": 2.6753311157226562, "step": 1157} +{"train_info/time_between_train_steps": 0.0036160945892333984, "step": 1157} +{"info/global_step": 1158, "train_info/time_within_train_step": 2.67339825630188, "step": 1158} +{"train_info/time_between_train_steps": 0.0036284923553466797, "step": 1158} +{"info/global_step": 1159, "train_info/time_within_train_step": 3.026914119720459, "step": 1159} +{"train_info/time_between_train_steps": 0.0034279823303222656, "step": 1159} +{"info/global_step": 1160, "train_info/time_within_train_step": 2.6731810569763184, "step": 1160} +{"train_info/time_between_train_steps": 0.0045506954193115234, "step": 1160} +{"info/global_step": 1161, "train_info/time_within_train_step": 2.6732535362243652, "step": 1161} +{"train_info/time_between_train_steps": 0.0033502578735351562, "step": 1161} +{"info/global_step": 1162, "train_info/time_within_train_step": 2.673956871032715, "step": 1162} +{"train_info/time_between_train_steps": 0.003331422805786133, "step": 1162} +{"info/global_step": 1163, "train_info/time_within_train_step": 2.6732139587402344, "step": 1163} +{"train_info/time_between_train_steps": 0.00342559814453125, "step": 1163} +{"info/global_step": 1164, "train_info/time_within_train_step": 2.67350435256958, "step": 1164} +{"train_info/time_between_train_steps": 0.0033283233642578125, "step": 1164} +{"info/global_step": 1165, "train_info/time_within_train_step": 2.6734511852264404, "step": 1165} +{"train_info/time_between_train_steps": 0.003415346145629883, "step": 1165} +{"info/global_step": 1166, "train_info/time_within_train_step": 2.6729109287261963, "step": 1166} +{"train_info/time_between_train_steps": 0.003396272659301758, "step": 1166} +{"info/global_step": 1167, "train_info/time_within_train_step": 2.672320604324341, "step": 1167} +{"train_info/time_between_train_steps": 0.0034110546112060547, "step": 1167} +{"info/global_step": 1168, "train_info/time_within_train_step": 2.674532175064087, "step": 1168} +{"train_info/time_between_train_steps": 0.0033299922943115234, "step": 1168} +{"info/global_step": 1169, "train_info/time_within_train_step": 2.673691511154175, "step": 1169} +{"train_info/time_between_train_steps": 0.0033769607543945312, "step": 1169} +{"info/global_step": 1170, "train_info/time_within_train_step": 2.673100233078003, "step": 1170} +{"train_info/time_between_train_steps": 0.003325223922729492, "step": 1170} +{"info/global_step": 1171, "train_info/time_within_train_step": 2.6742303371429443, "step": 1171} +{"train_info/time_between_train_steps": 0.0033674240112304688, "step": 1171} +{"info/global_step": 1172, "train_info/time_within_train_step": 2.6745455265045166, "step": 1172} +{"train_info/time_between_train_steps": 0.003522634506225586, "step": 1172} +{"info/global_step": 1173, "train_info/time_within_train_step": 2.6741690635681152, "step": 1173} +{"train_info/time_between_train_steps": 0.003337860107421875, "step": 1173} +{"info/global_step": 1174, "train_info/time_within_train_step": 2.671682119369507, "step": 1174} +{"train_info/time_between_train_steps": 0.0033566951751708984, "step": 1174} +{"info/global_step": 1175, "train_info/time_within_train_step": 2.6729376316070557, "step": 1175} +{"train_info/time_between_train_steps": 0.00360107421875, "step": 1175} +{"info/global_step": 1176, "train_info/time_within_train_step": 2.673140048980713, "step": 1176} +{"train_info/time_between_train_steps": 0.0034515857696533203, "step": 1176} +{"info/global_step": 1177, "train_info/time_within_train_step": 2.8500263690948486, "step": 1177} +{"train_info/time_between_train_steps": 0.0035529136657714844, "step": 1177} +{"info/global_step": 1178, "train_info/time_within_train_step": 2.724910020828247, "step": 1178} +{"train_info/time_between_train_steps": 0.003532886505126953, "step": 1178} +{"info/global_step": 1179, "train_info/time_within_train_step": 2.674492597579956, "step": 1179} +{"train_info/time_between_train_steps": 0.0035691261291503906, "step": 1179} +{"info/global_step": 1180, "train_info/time_within_train_step": 2.6743507385253906, "step": 1180} +{"train_info/time_between_train_steps": 0.0035254955291748047, "step": 1180} +{"info/global_step": 1181, "train_info/time_within_train_step": 2.674294948577881, "step": 1181} +{"train_info/time_between_train_steps": 0.006994009017944336, "step": 1181} +{"info/global_step": 1182, "train_info/time_within_train_step": 2.6737358570098877, "step": 1182} +{"train_info/time_between_train_steps": 0.007524728775024414, "step": 1182} +{"info/global_step": 1183, "train_info/time_within_train_step": 2.674731969833374, "step": 1183} +{"train_info/time_between_train_steps": 0.006879329681396484, "step": 1183} +{"info/global_step": 1184, "train_info/time_within_train_step": 2.6732518672943115, "step": 1184} +{"train_info/time_between_train_steps": 0.0034515857696533203, "step": 1184} +{"info/global_step": 1185, "train_info/time_within_train_step": 2.6727793216705322, "step": 1185} +{"train_info/time_between_train_steps": 0.003541707992553711, "step": 1185} +{"info/global_step": 1186, "train_info/time_within_train_step": 2.6744682788848877, "step": 1186} +{"train_info/time_between_train_steps": 0.0035440921783447266, "step": 1186} +{"info/global_step": 1187, "train_info/time_within_train_step": 2.675279140472412, "step": 1187} +{"train_info/time_between_train_steps": 0.0035200119018554688, "step": 1187} +{"info/global_step": 1188, "train_info/time_within_train_step": 2.6764752864837646, "step": 1188} +{"train_info/time_between_train_steps": 0.0035605430603027344, "step": 1188} +{"info/global_step": 1189, "train_info/time_within_train_step": 2.674893856048584, "step": 1189} +{"train_info/time_between_train_steps": 0.0036535263061523438, "step": 1189} +{"info/global_step": 1190, "train_info/time_within_train_step": 2.674245595932007, "step": 1190} +{"train_info/time_between_train_steps": 0.003529071807861328, "step": 1190} +{"info/global_step": 1191, "train_info/time_within_train_step": 2.673758029937744, "step": 1191} +{"train_info/time_between_train_steps": 0.0034837722778320312, "step": 1191} +{"info/global_step": 1192, "train_info/time_within_train_step": 2.673396348953247, "step": 1192} +{"train_info/time_between_train_steps": 0.003477334976196289, "step": 1192} +{"info/global_step": 1193, "train_info/time_within_train_step": 2.6755504608154297, "step": 1193} +{"train_info/time_between_train_steps": 0.0035195350646972656, "step": 1193} +{"info/global_step": 1194, "train_info/time_within_train_step": 2.675262689590454, "step": 1194} +{"train_info/time_between_train_steps": 0.0035080909729003906, "step": 1194} +{"info/global_step": 1195, "train_info/time_within_train_step": 2.674168348312378, "step": 1195} +{"train_info/time_between_train_steps": 0.0035271644592285156, "step": 1195} +{"info/global_step": 1196, "train_info/time_within_train_step": 2.674762725830078, "step": 1196} +{"train_info/time_between_train_steps": 0.003594636917114258, "step": 1196} +{"info/global_step": 1197, "train_info/time_within_train_step": 2.9934184551239014, "step": 1197} +{"train_info/time_between_train_steps": 0.003384113311767578, "step": 1197} +{"info/global_step": 1198, "train_info/time_within_train_step": 2.675149917602539, "step": 1198} +{"train_info/time_between_train_steps": 0.003407001495361328, "step": 1198} +{"info/global_step": 1199, "train_info/time_within_train_step": 2.674161434173584, "step": 1199} +{"train_info/time_between_train_steps": 0.0033559799194335938, "step": 1199} +{"info/global_step": 1200, "train_info/time_within_train_step": 2.673011064529419, "step": 1200} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746206687, "_runtime": 3459}, "step": 1200} +{"logs": {"train/loss": 4.4726, "train/learning_rate": 0.00039999999999999996, "train/epoch": 1.11, "_timestamp": 1746206687, "_runtime": 3459}, "step": 1200} +{"train_info/time_between_train_steps": 13.183404207229614, "step": 1200} +{"info/global_step": 1201, "train_info/time_within_train_step": 2.47296404838562, "step": 1201} +{"train_info/time_between_train_steps": 0.0033071041107177734, "step": 1201} +{"info/global_step": 1202, "train_info/time_within_train_step": 2.4601290225982666, "step": 1202} +{"train_info/time_between_train_steps": 0.0032896995544433594, "step": 1202} +{"info/global_step": 1203, "train_info/time_within_train_step": 2.4985849857330322, "step": 1203} +{"train_info/time_between_train_steps": 0.0033397674560546875, "step": 1203} +{"info/global_step": 1204, "train_info/time_within_train_step": 2.666440725326538, "step": 1204} +{"train_info/time_between_train_steps": 0.003358125686645508, "step": 1204} +{"info/global_step": 1205, "train_info/time_within_train_step": 2.6746928691864014, "step": 1205} +{"train_info/time_between_train_steps": 0.0033767223358154297, "step": 1205} +{"info/global_step": 1206, "train_info/time_within_train_step": 2.6738357543945312, "step": 1206} +{"train_info/time_between_train_steps": 0.003352642059326172, "step": 1206} +{"info/global_step": 1207, "train_info/time_within_train_step": 2.6749916076660156, "step": 1207} +{"train_info/time_between_train_steps": 0.006009578704833984, "step": 1207} +{"info/global_step": 1208, "train_info/time_within_train_step": 2.674276351928711, "step": 1208} +{"train_info/time_between_train_steps": 0.0032837390899658203, "step": 1208} +{"info/global_step": 1209, "train_info/time_within_train_step": 2.6736793518066406, "step": 1209} +{"train_info/time_between_train_steps": 0.0032868385314941406, "step": 1209} +{"info/global_step": 1210, "train_info/time_within_train_step": 2.673348903656006, "step": 1210} +{"train_info/time_between_train_steps": 0.0033016204833984375, "step": 1210} +{"info/global_step": 1211, "train_info/time_within_train_step": 2.673445463180542, "step": 1211} +{"train_info/time_between_train_steps": 0.0034856796264648438, "step": 1211} +{"info/global_step": 1212, "train_info/time_within_train_step": 2.6743781566619873, "step": 1212} +{"train_info/time_between_train_steps": 0.0033152103424072266, "step": 1212} +{"info/global_step": 1213, "train_info/time_within_train_step": 2.6750569343566895, "step": 1213} +{"train_info/time_between_train_steps": 0.003323793411254883, "step": 1213} +{"info/global_step": 1214, "train_info/time_within_train_step": 2.674992084503174, "step": 1214} +{"train_info/time_between_train_steps": 0.0033080577850341797, "step": 1214} +{"info/global_step": 1215, "train_info/time_within_train_step": 2.675450563430786, "step": 1215} +{"train_info/time_between_train_steps": 0.0033028125762939453, "step": 1215} +{"info/global_step": 1216, "train_info/time_within_train_step": 2.675489902496338, "step": 1216} +{"train_info/time_between_train_steps": 0.003295421600341797, "step": 1216} +{"info/global_step": 1217, "train_info/time_within_train_step": 2.675855875015259, "step": 1217} +{"train_info/time_between_train_steps": 0.00339508056640625, "step": 1217} +{"info/global_step": 1218, "train_info/time_within_train_step": 2.675323486328125, "step": 1218} +{"train_info/time_between_train_steps": 0.003328084945678711, "step": 1218} +{"info/global_step": 1219, "train_info/time_within_train_step": 2.6754391193389893, "step": 1219} +{"train_info/time_between_train_steps": 0.0032863616943359375, "step": 1219} +{"info/global_step": 1220, "train_info/time_within_train_step": 2.674471616744995, "step": 1220} +{"train_info/time_between_train_steps": 0.003287076950073242, "step": 1220} +{"info/global_step": 1221, "train_info/time_within_train_step": 2.6748104095458984, "step": 1221} +{"train_info/time_between_train_steps": 0.0032978057861328125, "step": 1221} +{"info/global_step": 1222, "train_info/time_within_train_step": 2.673959970474243, "step": 1222} +{"train_info/time_between_train_steps": 0.0032744407653808594, "step": 1222} +{"info/global_step": 1223, "train_info/time_within_train_step": 2.673776865005493, "step": 1223} +{"train_info/time_between_train_steps": 0.0033075809478759766, "step": 1223} +{"info/global_step": 1224, "train_info/time_within_train_step": 2.6734368801116943, "step": 1224} +{"train_info/time_between_train_steps": 0.0032813549041748047, "step": 1224} +{"info/global_step": 1225, "train_info/time_within_train_step": 2.6733717918395996, "step": 1225} +{"train_info/time_between_train_steps": 0.0032584667205810547, "step": 1225} +{"info/global_step": 1226, "train_info/time_within_train_step": 2.6727676391601562, "step": 1226} +{"train_info/time_between_train_steps": 0.003347158432006836, "step": 1226} +{"info/global_step": 1227, "train_info/time_within_train_step": 2.674060583114624, "step": 1227} +{"train_info/time_between_train_steps": 0.0033740997314453125, "step": 1227} +{"info/global_step": 1228, "train_info/time_within_train_step": 2.6730833053588867, "step": 1228} +{"train_info/time_between_train_steps": 0.0033054351806640625, "step": 1228} +{"info/global_step": 1229, "train_info/time_within_train_step": 2.674866199493408, "step": 1229} +{"train_info/time_between_train_steps": 0.003255605697631836, "step": 1229} +{"info/global_step": 1230, "train_info/time_within_train_step": 2.6728689670562744, "step": 1230} +{"train_info/time_between_train_steps": 0.0032777786254882812, "step": 1230} +{"info/global_step": 1231, "train_info/time_within_train_step": 2.673933982849121, "step": 1231} +{"train_info/time_between_train_steps": 0.003294229507446289, "step": 1231} +{"info/global_step": 1232, "train_info/time_within_train_step": 2.6738228797912598, "step": 1232} +{"train_info/time_between_train_steps": 0.003309965133666992, "step": 1232} +{"info/global_step": 1233, "train_info/time_within_train_step": 2.6736583709716797, "step": 1233} +{"train_info/time_between_train_steps": 0.003290891647338867, "step": 1233} +{"info/global_step": 1234, "train_info/time_within_train_step": 2.67427134513855, "step": 1234} +{"train_info/time_between_train_steps": 0.003300189971923828, "step": 1234} +{"info/global_step": 1235, "train_info/time_within_train_step": 2.6746339797973633, "step": 1235} +{"train_info/time_between_train_steps": 0.0032758712768554688, "step": 1235} +{"info/global_step": 1236, "train_info/time_within_train_step": 2.6732747554779053, "step": 1236} +{"train_info/time_between_train_steps": 0.0032906532287597656, "step": 1236} +{"info/global_step": 1237, "train_info/time_within_train_step": 2.673799514770508, "step": 1237} +{"train_info/time_between_train_steps": 0.0032892227172851562, "step": 1237} +{"info/global_step": 1238, "train_info/time_within_train_step": 2.6729795932769775, "step": 1238} +{"train_info/time_between_train_steps": 0.0032913684844970703, "step": 1238} +{"info/global_step": 1239, "train_info/time_within_train_step": 2.6737871170043945, "step": 1239} +{"train_info/time_between_train_steps": 0.12562870979309082, "step": 1239} +{"info/global_step": 1240, "train_info/time_within_train_step": 2.6723744869232178, "step": 1240} +{"train_info/time_between_train_steps": 0.0033054351806640625, "step": 1240} +{"info/global_step": 1241, "train_info/time_within_train_step": 2.673874616622925, "step": 1241} +{"train_info/time_between_train_steps": 0.0032815933227539062, "step": 1241} +{"info/global_step": 1242, "train_info/time_within_train_step": 2.6746985912323, "step": 1242} +{"train_info/time_between_train_steps": 0.0033202171325683594, "step": 1242} +{"info/global_step": 1243, "train_info/time_within_train_step": 2.6742842197418213, "step": 1243} +{"train_info/time_between_train_steps": 0.0033550262451171875, "step": 1243} +{"info/global_step": 1244, "train_info/time_within_train_step": 2.6746826171875, "step": 1244} +{"train_info/time_between_train_steps": 0.0032846927642822266, "step": 1244} +{"info/global_step": 1245, "train_info/time_within_train_step": 2.674499750137329, "step": 1245} +{"train_info/time_between_train_steps": 0.0034003257751464844, "step": 1245} +{"info/global_step": 1246, "train_info/time_within_train_step": 2.6738173961639404, "step": 1246} +{"train_info/time_between_train_steps": 0.003446340560913086, "step": 1246} +{"info/global_step": 1247, "train_info/time_within_train_step": 2.673977851867676, "step": 1247} +{"train_info/time_between_train_steps": 0.003583192825317383, "step": 1247} +{"info/global_step": 1248, "train_info/time_within_train_step": 2.673837900161743, "step": 1248} +{"train_info/time_between_train_steps": 0.0035157203674316406, "step": 1248} +{"info/global_step": 1249, "train_info/time_within_train_step": 2.6745381355285645, "step": 1249} +{"train_info/time_between_train_steps": 0.003551006317138672, "step": 1249} +{"info/global_step": 1250, "train_info/time_within_train_step": 3.6056582927703857, "step": 1250} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746206835, "_runtime": 3607}, "step": 1250} +{"logs": {"train/loss": 4.4378, "train/learning_rate": 0.00038888888888888887, "train/epoch": 1.13, "_timestamp": 1746206835, "_runtime": 3607}, "step": 1250} +{"train_info/time_between_train_steps": 0.02467656135559082, "step": 1250} +{"info/global_step": 1251, "train_info/time_within_train_step": 2.673069953918457, "step": 1251} +{"train_info/time_between_train_steps": 0.0033180713653564453, "step": 1251} +{"info/global_step": 1252, "train_info/time_within_train_step": 2.672498941421509, "step": 1252} +{"train_info/time_between_train_steps": 0.003345012664794922, "step": 1252} +{"info/global_step": 1253, "train_info/time_within_train_step": 2.672210454940796, "step": 1253} +{"train_info/time_between_train_steps": 0.0033087730407714844, "step": 1253} +{"info/global_step": 1254, "train_info/time_within_train_step": 2.673146963119507, "step": 1254} +{"train_info/time_between_train_steps": 0.003401517868041992, "step": 1254} +{"info/global_step": 1255, "train_info/time_within_train_step": 2.6735947132110596, "step": 1255} +{"train_info/time_between_train_steps": 0.0033309459686279297, "step": 1255} +{"info/global_step": 1256, "train_info/time_within_train_step": 2.675311326980591, "step": 1256} +{"train_info/time_between_train_steps": 0.0033283233642578125, "step": 1256} +{"info/global_step": 1257, "train_info/time_within_train_step": 2.6738064289093018, "step": 1257} +{"train_info/time_between_train_steps": 0.0033197402954101562, "step": 1257} +{"info/global_step": 1258, "train_info/time_within_train_step": 2.672886610031128, "step": 1258} +{"train_info/time_between_train_steps": 0.0033292770385742188, "step": 1258} +{"info/global_step": 1259, "train_info/time_within_train_step": 2.672976016998291, "step": 1259} +{"train_info/time_between_train_steps": 0.003273487091064453, "step": 1259} +{"info/global_step": 1260, "train_info/time_within_train_step": 2.673546314239502, "step": 1260} +{"train_info/time_between_train_steps": 0.003319263458251953, "step": 1260} +{"info/global_step": 1261, "train_info/time_within_train_step": 2.6727962493896484, "step": 1261} +{"train_info/time_between_train_steps": 0.003330230712890625, "step": 1261} +{"info/global_step": 1262, "train_info/time_within_train_step": 2.673208713531494, "step": 1262} +{"train_info/time_between_train_steps": 0.0033156871795654297, "step": 1262} +{"info/global_step": 1263, "train_info/time_within_train_step": 2.6739368438720703, "step": 1263} +{"train_info/time_between_train_steps": 0.003302335739135742, "step": 1263} +{"info/global_step": 1264, "train_info/time_within_train_step": 2.6722257137298584, "step": 1264} +{"train_info/time_between_train_steps": 0.00333404541015625, "step": 1264} +{"info/global_step": 1265, "train_info/time_within_train_step": 2.6728203296661377, "step": 1265} +{"train_info/time_between_train_steps": 0.0033147335052490234, "step": 1265} +{"info/global_step": 1266, "train_info/time_within_train_step": 2.6719677448272705, "step": 1266} +{"train_info/time_between_train_steps": 0.0033626556396484375, "step": 1266} +{"info/global_step": 1267, "train_info/time_within_train_step": 2.6728692054748535, "step": 1267} +{"train_info/time_between_train_steps": 0.0033071041107177734, "step": 1267} +{"info/global_step": 1268, "train_info/time_within_train_step": 2.6734228134155273, "step": 1268} +{"train_info/time_between_train_steps": 0.0033245086669921875, "step": 1268} +{"info/global_step": 1269, "train_info/time_within_train_step": 2.6739821434020996, "step": 1269} +{"train_info/time_between_train_steps": 0.0033452510833740234, "step": 1269} +{"info/global_step": 1270, "train_info/time_within_train_step": 2.673424243927002, "step": 1270} +{"train_info/time_between_train_steps": 0.003319978713989258, "step": 1270} +{"info/global_step": 1271, "train_info/time_within_train_step": 2.673849582672119, "step": 1271} +{"train_info/time_between_train_steps": 0.0033349990844726562, "step": 1271} +{"info/global_step": 1272, "train_info/time_within_train_step": 2.673327684402466, "step": 1272} +{"train_info/time_between_train_steps": 0.0033729076385498047, "step": 1272} +{"info/global_step": 1273, "train_info/time_within_train_step": 2.6750409603118896, "step": 1273} +{"train_info/time_between_train_steps": 0.00336456298828125, "step": 1273} +{"info/global_step": 1274, "train_info/time_within_train_step": 2.674647808074951, "step": 1274} +{"train_info/time_between_train_steps": 0.003500223159790039, "step": 1274} +{"info/global_step": 1275, "train_info/time_within_train_step": 2.6747097969055176, "step": 1275} +{"train_info/time_between_train_steps": 0.0034608840942382812, "step": 1275} +{"info/global_step": 1276, "train_info/time_within_train_step": 2.674099922180176, "step": 1276} +{"train_info/time_between_train_steps": 0.003551959991455078, "step": 1276} +{"info/global_step": 1277, "train_info/time_within_train_step": 2.674417734146118, "step": 1277} +{"train_info/time_between_train_steps": 0.0035927295684814453, "step": 1277} +{"info/global_step": 1278, "train_info/time_within_train_step": 2.6732146739959717, "step": 1278} +{"train_info/time_between_train_steps": 0.0035665035247802734, "step": 1278} +{"info/global_step": 1279, "train_info/time_within_train_step": 2.673515796661377, "step": 1279} +{"train_info/time_between_train_steps": 0.003547191619873047, "step": 1279} +{"info/global_step": 1280, "train_info/time_within_train_step": 2.6735622882843018, "step": 1280} +{"train_info/time_between_train_steps": 0.0036072731018066406, "step": 1280} +{"info/global_step": 1281, "train_info/time_within_train_step": 2.673569917678833, "step": 1281} +{"train_info/time_between_train_steps": 0.0035119056701660156, "step": 1281} +{"info/global_step": 1282, "train_info/time_within_train_step": 2.6724414825439453, "step": 1282} +{"train_info/time_between_train_steps": 0.003614187240600586, "step": 1282} +{"info/global_step": 1283, "train_info/time_within_train_step": 2.6734721660614014, "step": 1283} +{"train_info/time_between_train_steps": 0.0035784244537353516, "step": 1283} +{"info/global_step": 1284, "train_info/time_within_train_step": 2.674954414367676, "step": 1284} +{"train_info/time_between_train_steps": 0.0035762786865234375, "step": 1284} +{"info/global_step": 1285, "train_info/time_within_train_step": 2.6751577854156494, "step": 1285} +{"train_info/time_between_train_steps": 0.0035440921783447266, "step": 1285} +{"info/global_step": 1286, "train_info/time_within_train_step": 2.725024700164795, "step": 1286} +{"train_info/time_between_train_steps": 0.0037097930908203125, "step": 1286} +{"info/global_step": 1287, "train_info/time_within_train_step": 2.675539970397949, "step": 1287} +{"train_info/time_between_train_steps": 0.0035898685455322266, "step": 1287} +{"info/global_step": 1288, "train_info/time_within_train_step": 2.6728525161743164, "step": 1288} +{"train_info/time_between_train_steps": 0.003618478775024414, "step": 1288} +{"info/global_step": 1289, "train_info/time_within_train_step": 2.6757683753967285, "step": 1289} +{"train_info/time_between_train_steps": 0.003539562225341797, "step": 1289} +{"info/global_step": 1290, "train_info/time_within_train_step": 2.6746325492858887, "step": 1290} +{"train_info/time_between_train_steps": 0.003571748733520508, "step": 1290} +{"info/global_step": 1291, "train_info/time_within_train_step": 2.6757776737213135, "step": 1291} +{"train_info/time_between_train_steps": 0.0035452842712402344, "step": 1291} +{"info/global_step": 1292, "train_info/time_within_train_step": 2.67521333694458, "step": 1292} +{"train_info/time_between_train_steps": 0.0036003589630126953, "step": 1292} +{"info/global_step": 1293, "train_info/time_within_train_step": 2.673689842224121, "step": 1293} +{"train_info/time_between_train_steps": 0.0035943984985351562, "step": 1293} +{"info/global_step": 1294, "train_info/time_within_train_step": 2.674304246902466, "step": 1294} +{"train_info/time_between_train_steps": 0.0035657882690429688, "step": 1294} +{"info/global_step": 1295, "train_info/time_within_train_step": 2.676306962966919, "step": 1295} +{"train_info/time_between_train_steps": 0.003639698028564453, "step": 1295} +{"info/global_step": 1296, "train_info/time_within_train_step": 2.6756091117858887, "step": 1296} +{"train_info/time_between_train_steps": 0.003541231155395508, "step": 1296} +{"info/global_step": 1297, "train_info/time_within_train_step": 2.6737489700317383, "step": 1297} +{"train_info/time_between_train_steps": 0.0034923553466796875, "step": 1297} +{"info/global_step": 1298, "train_info/time_within_train_step": 2.6738224029541016, "step": 1298} +{"train_info/time_between_train_steps": 0.003451108932495117, "step": 1298} +{"info/global_step": 1299, "train_info/time_within_train_step": 2.673011541366577, "step": 1299} +{"train_info/time_between_train_steps": 0.0035657882690429688, "step": 1299} +{"info/global_step": 1300, "train_info/time_within_train_step": 2.6743698120117188, "step": 1300} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746206970, "_runtime": 3742}, "step": 1300} +{"logs": {"train/loss": 4.4126, "train/learning_rate": 0.00037777777777777777, "train/epoch": 1.15, "_timestamp": 1746206970, "_runtime": 3742}, "step": 1300} +{"train_info/time_between_train_steps": 13.141604900360107, "step": 1300} +{"info/global_step": 1301, "train_info/time_within_train_step": 2.470951795578003, "step": 1301} +{"train_info/time_between_train_steps": 0.003469705581665039, "step": 1301} +{"info/global_step": 1302, "train_info/time_within_train_step": 2.9246296882629395, "step": 1302} +{"train_info/time_between_train_steps": 0.0032911300659179688, "step": 1302} +{"info/global_step": 1303, "train_info/time_within_train_step": 2.4680001735687256, "step": 1303} +{"train_info/time_between_train_steps": 0.0032465457916259766, "step": 1303} +{"info/global_step": 1304, "train_info/time_within_train_step": 2.6522867679595947, "step": 1304} +{"train_info/time_between_train_steps": 0.003329038619995117, "step": 1304} +{"info/global_step": 1305, "train_info/time_within_train_step": 2.6718645095825195, "step": 1305} +{"train_info/time_between_train_steps": 0.003298521041870117, "step": 1305} +{"info/global_step": 1306, "train_info/time_within_train_step": 2.6691696643829346, "step": 1306} +{"train_info/time_between_train_steps": 0.0033016204833984375, "step": 1306} +{"info/global_step": 1307, "train_info/time_within_train_step": 2.6718132495880127, "step": 1307} +{"train_info/time_between_train_steps": 0.0032644271850585938, "step": 1307} +{"info/global_step": 1308, "train_info/time_within_train_step": 2.671417474746704, "step": 1308} +{"train_info/time_between_train_steps": 0.003283262252807617, "step": 1308} +{"info/global_step": 1309, "train_info/time_within_train_step": 2.67228364944458, "step": 1309} +{"train_info/time_between_train_steps": 0.0032808780670166016, "step": 1309} +{"info/global_step": 1310, "train_info/time_within_train_step": 2.6730668544769287, "step": 1310} +{"train_info/time_between_train_steps": 0.0032711029052734375, "step": 1310} +{"info/global_step": 1311, "train_info/time_within_train_step": 2.6743953227996826, "step": 1311} +{"train_info/time_between_train_steps": 0.0032804012298583984, "step": 1311} +{"info/global_step": 1312, "train_info/time_within_train_step": 2.6739895343780518, "step": 1312} +{"train_info/time_between_train_steps": 0.003309965133666992, "step": 1312} +{"info/global_step": 1313, "train_info/time_within_train_step": 2.673994779586792, "step": 1313} +{"train_info/time_between_train_steps": 0.003274679183959961, "step": 1313} +{"info/global_step": 1314, "train_info/time_within_train_step": 2.673889636993408, "step": 1314} +{"train_info/time_between_train_steps": 0.0032355785369873047, "step": 1314} +{"info/global_step": 1315, "train_info/time_within_train_step": 2.6748106479644775, "step": 1315} +{"train_info/time_between_train_steps": 0.0033223628997802734, "step": 1315} +{"info/global_step": 1316, "train_info/time_within_train_step": 2.675493001937866, "step": 1316} +{"train_info/time_between_train_steps": 0.003307342529296875, "step": 1316} +{"info/global_step": 1317, "train_info/time_within_train_step": 2.6735761165618896, "step": 1317} +{"train_info/time_between_train_steps": 0.003298044204711914, "step": 1317} +{"info/global_step": 1318, "train_info/time_within_train_step": 2.6741669178009033, "step": 1318} +{"train_info/time_between_train_steps": 0.0032930374145507812, "step": 1318} +{"info/global_step": 1319, "train_info/time_within_train_step": 2.675004243850708, "step": 1319} +{"train_info/time_between_train_steps": 0.0033473968505859375, "step": 1319} +{"info/global_step": 1320, "train_info/time_within_train_step": 2.6745553016662598, "step": 1320} +{"train_info/time_between_train_steps": 0.0033349990844726562, "step": 1320} +{"info/global_step": 1321, "train_info/time_within_train_step": 2.6732192039489746, "step": 1321} +{"train_info/time_between_train_steps": 0.003288745880126953, "step": 1321} +{"info/global_step": 1322, "train_info/time_within_train_step": 2.6723313331604004, "step": 1322} +{"train_info/time_between_train_steps": 0.0032973289489746094, "step": 1322} +{"info/global_step": 1323, "train_info/time_within_train_step": 2.6737940311431885, "step": 1323} +{"train_info/time_between_train_steps": 0.0032434463500976562, "step": 1323} +{"info/global_step": 1324, "train_info/time_within_train_step": 2.673210859298706, "step": 1324} +{"train_info/time_between_train_steps": 0.0032248497009277344, "step": 1324} +{"info/global_step": 1325, "train_info/time_within_train_step": 2.6737637519836426, "step": 1325} +{"train_info/time_between_train_steps": 0.003291606903076172, "step": 1325} +{"info/global_step": 1326, "train_info/time_within_train_step": 2.723482847213745, "step": 1326} +{"train_info/time_between_train_steps": 0.0032355785369873047, "step": 1326} +{"info/global_step": 1327, "train_info/time_within_train_step": 2.672921657562256, "step": 1327} +{"train_info/time_between_train_steps": 0.0032377243041992188, "step": 1327} +{"info/global_step": 1328, "train_info/time_within_train_step": 2.675173044204712, "step": 1328} +{"train_info/time_between_train_steps": 0.003329038619995117, "step": 1328} +{"info/global_step": 1329, "train_info/time_within_train_step": 2.672116994857788, "step": 1329} +{"train_info/time_between_train_steps": 0.003299713134765625, "step": 1329} +{"info/global_step": 1330, "train_info/time_within_train_step": 2.6736230850219727, "step": 1330} +{"train_info/time_between_train_steps": 0.0036439895629882812, "step": 1330} +{"info/global_step": 1331, "train_info/time_within_train_step": 2.675382375717163, "step": 1331} +{"train_info/time_between_train_steps": 0.003557443618774414, "step": 1331} +{"info/global_step": 1332, "train_info/time_within_train_step": 2.6736462116241455, "step": 1332} +{"train_info/time_between_train_steps": 0.0037674903869628906, "step": 1332} +{"info/global_step": 1333, "train_info/time_within_train_step": 2.675685167312622, "step": 1333} +{"train_info/time_between_train_steps": 0.0036063194274902344, "step": 1333} +{"info/global_step": 1334, "train_info/time_within_train_step": 2.6743884086608887, "step": 1334} +{"train_info/time_between_train_steps": 0.003604412078857422, "step": 1334} +{"info/global_step": 1335, "train_info/time_within_train_step": 2.674868583679199, "step": 1335} +{"train_info/time_between_train_steps": 0.0035347938537597656, "step": 1335} +{"info/global_step": 1336, "train_info/time_within_train_step": 2.674046516418457, "step": 1336} +{"train_info/time_between_train_steps": 0.0035598278045654297, "step": 1336} +{"info/global_step": 1337, "train_info/time_within_train_step": 2.6750071048736572, "step": 1337} +{"train_info/time_between_train_steps": 0.0035789012908935547, "step": 1337} +{"info/global_step": 1338, "train_info/time_within_train_step": 2.674945116043091, "step": 1338} +{"train_info/time_between_train_steps": 0.0036525726318359375, "step": 1338} +{"info/global_step": 1339, "train_info/time_within_train_step": 2.674098253250122, "step": 1339} +{"train_info/time_between_train_steps": 0.0035631656646728516, "step": 1339} +{"info/global_step": 1340, "train_info/time_within_train_step": 2.676543951034546, "step": 1340} +{"train_info/time_between_train_steps": 0.0036208629608154297, "step": 1340} +{"info/global_step": 1341, "train_info/time_within_train_step": 2.6737496852874756, "step": 1341} +{"train_info/time_between_train_steps": 0.0035712718963623047, "step": 1341} +{"info/global_step": 1342, "train_info/time_within_train_step": 2.6733481884002686, "step": 1342} +{"train_info/time_between_train_steps": 0.0035543441772460938, "step": 1342} +{"info/global_step": 1343, "train_info/time_within_train_step": 2.6752922534942627, "step": 1343} +{"train_info/time_between_train_steps": 0.003658771514892578, "step": 1343} +{"info/global_step": 1344, "train_info/time_within_train_step": 2.674685001373291, "step": 1344} +{"train_info/time_between_train_steps": 0.0035200119018554688, "step": 1344} +{"info/global_step": 1345, "train_info/time_within_train_step": 2.674097776412964, "step": 1345} +{"train_info/time_between_train_steps": 0.0036041736602783203, "step": 1345} +{"info/global_step": 1346, "train_info/time_within_train_step": 2.6730964183807373, "step": 1346} +{"train_info/time_between_train_steps": 0.0035381317138671875, "step": 1346} +{"info/global_step": 1347, "train_info/time_within_train_step": 2.6737029552459717, "step": 1347} +{"train_info/time_between_train_steps": 0.0036172866821289062, "step": 1347} +{"info/global_step": 1348, "train_info/time_within_train_step": 2.6750049591064453, "step": 1348} +{"train_info/time_between_train_steps": 0.003718852996826172, "step": 1348} +{"info/global_step": 1349, "train_info/time_within_train_step": 2.67399525642395, "step": 1349} +{"train_info/time_between_train_steps": 0.0036194324493408203, "step": 1349} +{"info/global_step": 1350, "train_info/time_within_train_step": 2.6740801334381104, "step": 1350} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746207118, "_runtime": 3890}, "step": 1350} +{"logs": {"train/loss": 4.3828, "train/learning_rate": 0.00036666666666666667, "train/epoch": 1.16, "_timestamp": 1746207118, "_runtime": 3890}, "step": 1350} +{"train_info/time_between_train_steps": 0.024613618850708008, "step": 1350} +{"info/global_step": 1351, "train_info/time_within_train_step": 2.674875497817993, "step": 1351} +{"train_info/time_between_train_steps": 0.003749847412109375, "step": 1351} +{"info/global_step": 1352, "train_info/time_within_train_step": 2.675974130630493, "step": 1352} +{"train_info/time_between_train_steps": 0.003658294677734375, "step": 1352} +{"info/global_step": 1353, "train_info/time_within_train_step": 2.6752235889434814, "step": 1353} +{"train_info/time_between_train_steps": 0.0036215782165527344, "step": 1353} +{"info/global_step": 1354, "train_info/time_within_train_step": 2.676440715789795, "step": 1354} +{"train_info/time_between_train_steps": 0.003650665283203125, "step": 1354} +{"info/global_step": 1355, "train_info/time_within_train_step": 3.031240463256836, "step": 1355} +{"train_info/time_between_train_steps": 0.0033416748046875, "step": 1355} +{"info/global_step": 1356, "train_info/time_within_train_step": 2.6733663082122803, "step": 1356} +{"train_info/time_between_train_steps": 0.0033702850341796875, "step": 1356} +{"info/global_step": 1357, "train_info/time_within_train_step": 2.6735877990722656, "step": 1357} +{"train_info/time_between_train_steps": 0.0033402442932128906, "step": 1357} +{"info/global_step": 1358, "train_info/time_within_train_step": 2.6717123985290527, "step": 1358} +{"train_info/time_between_train_steps": 0.0033478736877441406, "step": 1358} +{"info/global_step": 1359, "train_info/time_within_train_step": 2.6718759536743164, "step": 1359} +{"train_info/time_between_train_steps": 0.0033202171325683594, "step": 1359} +{"info/global_step": 1360, "train_info/time_within_train_step": 2.6736152172088623, "step": 1360} +{"train_info/time_between_train_steps": 0.003378152847290039, "step": 1360} +{"info/global_step": 1361, "train_info/time_within_train_step": 2.672301769256592, "step": 1361} +{"train_info/time_between_train_steps": 0.0033178329467773438, "step": 1361} +{"info/global_step": 1362, "train_info/time_within_train_step": 2.674318790435791, "step": 1362} +{"train_info/time_between_train_steps": 0.0033783912658691406, "step": 1362} +{"info/global_step": 1363, "train_info/time_within_train_step": 2.674598455429077, "step": 1363} +{"train_info/time_between_train_steps": 0.0034253597259521484, "step": 1363} +{"info/global_step": 1364, "train_info/time_within_train_step": 2.674764394760132, "step": 1364} +{"train_info/time_between_train_steps": 0.12144327163696289, "step": 1364} +{"info/global_step": 1365, "train_info/time_within_train_step": 2.688098430633545, "step": 1365} +{"train_info/time_between_train_steps": 0.003353118896484375, "step": 1365} +{"info/global_step": 1366, "train_info/time_within_train_step": 2.673661231994629, "step": 1366} +{"train_info/time_between_train_steps": 0.0035676956176757812, "step": 1366} +{"info/global_step": 1367, "train_info/time_within_train_step": 2.674105167388916, "step": 1367} +{"train_info/time_between_train_steps": 0.0033140182495117188, "step": 1367} +{"info/global_step": 1368, "train_info/time_within_train_step": 2.6714608669281006, "step": 1368} +{"train_info/time_between_train_steps": 0.00328826904296875, "step": 1368} +{"info/global_step": 1369, "train_info/time_within_train_step": 2.673166275024414, "step": 1369} +{"train_info/time_between_train_steps": 0.0033278465270996094, "step": 1369} +{"info/global_step": 1370, "train_info/time_within_train_step": 2.672508478164673, "step": 1370} +{"train_info/time_between_train_steps": 0.003285646438598633, "step": 1370} +{"info/global_step": 1371, "train_info/time_within_train_step": 2.6720809936523438, "step": 1371} +{"train_info/time_between_train_steps": 0.0032958984375, "step": 1371} +{"info/global_step": 1372, "train_info/time_within_train_step": 2.6719489097595215, "step": 1372} +{"train_info/time_between_train_steps": 0.0033884048461914062, "step": 1372} +{"info/global_step": 1373, "train_info/time_within_train_step": 2.67132306098938, "step": 1373} +{"train_info/time_between_train_steps": 0.003331899642944336, "step": 1373} +{"info/global_step": 1374, "train_info/time_within_train_step": 2.672706127166748, "step": 1374} +{"train_info/time_between_train_steps": 0.003301382064819336, "step": 1374} +{"info/global_step": 1375, "train_info/time_within_train_step": 2.6735918521881104, "step": 1375} +{"train_info/time_between_train_steps": 0.003325939178466797, "step": 1375} +{"info/global_step": 1376, "train_info/time_within_train_step": 2.673548698425293, "step": 1376} +{"train_info/time_between_train_steps": 0.0033228397369384766, "step": 1376} +{"info/global_step": 1377, "train_info/time_within_train_step": 2.6733205318450928, "step": 1377} +{"train_info/time_between_train_steps": 0.003351926803588867, "step": 1377} +{"info/global_step": 1378, "train_info/time_within_train_step": 2.67227840423584, "step": 1378} +{"train_info/time_between_train_steps": 0.003309965133666992, "step": 1378} +{"info/global_step": 1379, "train_info/time_within_train_step": 2.673896551132202, "step": 1379} +{"train_info/time_between_train_steps": 0.003470182418823242, "step": 1379} +{"info/global_step": 1380, "train_info/time_within_train_step": 2.6738438606262207, "step": 1380} +{"train_info/time_between_train_steps": 0.0034093856811523438, "step": 1380} +{"info/global_step": 1381, "train_info/time_within_train_step": 2.6745636463165283, "step": 1381} +{"train_info/time_between_train_steps": 0.0035517215728759766, "step": 1381} +{"info/global_step": 1382, "train_info/time_within_train_step": 2.6740171909332275, "step": 1382} +{"train_info/time_between_train_steps": 0.0036461353302001953, "step": 1382} +{"info/global_step": 1383, "train_info/time_within_train_step": 2.674400806427002, "step": 1383} +{"train_info/time_between_train_steps": 0.003584146499633789, "step": 1383} +{"info/global_step": 1384, "train_info/time_within_train_step": 2.6737306118011475, "step": 1384} +{"train_info/time_between_train_steps": 0.0035555362701416016, "step": 1384} +{"info/global_step": 1385, "train_info/time_within_train_step": 2.6753201484680176, "step": 1385} +{"train_info/time_between_train_steps": 0.0043182373046875, "step": 1385} +{"info/global_step": 1386, "train_info/time_within_train_step": 2.6734778881073, "step": 1386} +{"train_info/time_between_train_steps": 0.003617525100708008, "step": 1386} +{"info/global_step": 1387, "train_info/time_within_train_step": 2.6733052730560303, "step": 1387} +{"train_info/time_between_train_steps": 0.0036208629608154297, "step": 1387} +{"info/global_step": 1388, "train_info/time_within_train_step": 2.6740000247955322, "step": 1388} +{"train_info/time_between_train_steps": 0.0035333633422851562, "step": 1388} +{"info/global_step": 1389, "train_info/time_within_train_step": 2.673640251159668, "step": 1389} +{"train_info/time_between_train_steps": 0.003627777099609375, "step": 1389} +{"info/global_step": 1390, "train_info/time_within_train_step": 2.673959970474243, "step": 1390} +{"train_info/time_between_train_steps": 0.0036270618438720703, "step": 1390} +{"info/global_step": 1391, "train_info/time_within_train_step": 2.6745378971099854, "step": 1391} +{"train_info/time_between_train_steps": 0.0035364627838134766, "step": 1391} +{"info/global_step": 1392, "train_info/time_within_train_step": 2.6743996143341064, "step": 1392} +{"train_info/time_between_train_steps": 0.0035784244537353516, "step": 1392} +{"info/global_step": 1393, "train_info/time_within_train_step": 2.724987030029297, "step": 1393} +{"train_info/time_between_train_steps": 0.0036535263061523438, "step": 1393} +{"info/global_step": 1394, "train_info/time_within_train_step": 3.032318115234375, "step": 1394} +{"train_info/time_between_train_steps": 0.003355741500854492, "step": 1394} +{"info/global_step": 1395, "train_info/time_within_train_step": 2.6731550693511963, "step": 1395} +{"train_info/time_between_train_steps": 0.003490924835205078, "step": 1395} +{"info/global_step": 1396, "train_info/time_within_train_step": 2.674177646636963, "step": 1396} +{"train_info/time_between_train_steps": 0.0035245418548583984, "step": 1396} +{"info/global_step": 1397, "train_info/time_within_train_step": 2.6741485595703125, "step": 1397} +{"train_info/time_between_train_steps": 0.0034673213958740234, "step": 1397} +{"info/global_step": 1398, "train_info/time_within_train_step": 2.6749260425567627, "step": 1398} +{"train_info/time_between_train_steps": 0.0035436153411865234, "step": 1398} +{"info/global_step": 1399, "train_info/time_within_train_step": 2.6737070083618164, "step": 1399} +{"train_info/time_between_train_steps": 0.003537416458129883, "step": 1399} +{"info/global_step": 1400, "train_info/time_within_train_step": 2.673039197921753, "step": 1400} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746207254, "_runtime": 4026}, "step": 1400} +{"logs": {"train/loss": 4.3571, "train/learning_rate": 0.0003555555555555555, "train/epoch": 1.18, "_timestamp": 1746207254, "_runtime": 4026}, "step": 1400} +{"train_info/time_between_train_steps": 13.246649980545044, "step": 1400} +{"info/global_step": 1401, "train_info/time_within_train_step": 2.4770631790161133, "step": 1401} +{"train_info/time_between_train_steps": 0.0035605430603027344, "step": 1401} +{"info/global_step": 1402, "train_info/time_within_train_step": 2.459425210952759, "step": 1402} +{"train_info/time_between_train_steps": 0.0035316944122314453, "step": 1402} +{"info/global_step": 1403, "train_info/time_within_train_step": 2.464656352996826, "step": 1403} +{"train_info/time_between_train_steps": 0.003599405288696289, "step": 1403} +{"info/global_step": 1404, "train_info/time_within_train_step": 2.6344006061553955, "step": 1404} +{"train_info/time_between_train_steps": 0.0035581588745117188, "step": 1404} +{"info/global_step": 1405, "train_info/time_within_train_step": 2.674375534057617, "step": 1405} +{"train_info/time_between_train_steps": 0.003474712371826172, "step": 1405} +{"info/global_step": 1406, "train_info/time_within_train_step": 2.675492525100708, "step": 1406} +{"train_info/time_between_train_steps": 0.007038116455078125, "step": 1406} +{"info/global_step": 1407, "train_info/time_within_train_step": 2.6738297939300537, "step": 1407} +{"train_info/time_between_train_steps": 0.006951808929443359, "step": 1407} +{"info/global_step": 1408, "train_info/time_within_train_step": 2.6744041442871094, "step": 1408} +{"train_info/time_between_train_steps": 0.007004976272583008, "step": 1408} +{"info/global_step": 1409, "train_info/time_within_train_step": 2.674898386001587, "step": 1409} +{"train_info/time_between_train_steps": 0.006895303726196289, "step": 1409} +{"info/global_step": 1410, "train_info/time_within_train_step": 2.674511432647705, "step": 1410} +{"train_info/time_between_train_steps": 0.006982088088989258, "step": 1410} +{"info/global_step": 1411, "train_info/time_within_train_step": 2.6761960983276367, "step": 1411} +{"train_info/time_between_train_steps": 0.006907463073730469, "step": 1411} +{"info/global_step": 1412, "train_info/time_within_train_step": 2.6756327152252197, "step": 1412} +{"train_info/time_between_train_steps": 0.007024526596069336, "step": 1412} +{"info/global_step": 1413, "train_info/time_within_train_step": 2.6755645275115967, "step": 1413} +{"train_info/time_between_train_steps": 0.0069162845611572266, "step": 1413} +{"info/global_step": 1414, "train_info/time_within_train_step": 2.6782643795013428, "step": 1414} +{"train_info/time_between_train_steps": 0.007051944732666016, "step": 1414} +{"info/global_step": 1415, "train_info/time_within_train_step": 2.677687168121338, "step": 1415} +{"train_info/time_between_train_steps": 0.0034902095794677734, "step": 1415} +{"info/global_step": 1416, "train_info/time_within_train_step": 2.708721160888672, "step": 1416} +{"train_info/time_between_train_steps": 0.003345966339111328, "step": 1416} +{"info/global_step": 1417, "train_info/time_within_train_step": 2.677391767501831, "step": 1417} +{"train_info/time_between_train_steps": 0.003040790557861328, "step": 1417} +{"info/global_step": 1418, "train_info/time_within_train_step": 2.6769826412200928, "step": 1418} +{"train_info/time_between_train_steps": 0.0030181407928466797, "step": 1418} +{"info/global_step": 1419, "train_info/time_within_train_step": 2.6760942935943604, "step": 1419} +{"train_info/time_between_train_steps": 0.0030307769775390625, "step": 1419} +{"info/global_step": 1420, "train_info/time_within_train_step": 2.6750502586364746, "step": 1420} +{"train_info/time_between_train_steps": 0.0030395984649658203, "step": 1420} +{"info/global_step": 1421, "train_info/time_within_train_step": 2.674135208129883, "step": 1421} +{"train_info/time_between_train_steps": 0.0030450820922851562, "step": 1421} +{"info/global_step": 1422, "train_info/time_within_train_step": 2.6745660305023193, "step": 1422} +{"train_info/time_between_train_steps": 0.003070354461669922, "step": 1422} +{"info/global_step": 1423, "train_info/time_within_train_step": 2.674314498901367, "step": 1423} +{"train_info/time_between_train_steps": 0.0031092166900634766, "step": 1423} +{"info/global_step": 1424, "train_info/time_within_train_step": 2.675114870071411, "step": 1424} +{"train_info/time_between_train_steps": 0.003147125244140625, "step": 1424} +{"info/global_step": 1425, "train_info/time_within_train_step": 2.673832416534424, "step": 1425} +{"train_info/time_between_train_steps": 0.003293752670288086, "step": 1425} +{"info/global_step": 1426, "train_info/time_within_train_step": 2.673891305923462, "step": 1426} +{"train_info/time_between_train_steps": 0.003002643585205078, "step": 1426} +{"info/global_step": 1427, "train_info/time_within_train_step": 2.673668384552002, "step": 1427} +{"train_info/time_between_train_steps": 0.0030586719512939453, "step": 1427} +{"info/global_step": 1428, "train_info/time_within_train_step": 2.674342155456543, "step": 1428} +{"train_info/time_between_train_steps": 0.003065824508666992, "step": 1428} +{"info/global_step": 1429, "train_info/time_within_train_step": 2.6739933490753174, "step": 1429} +{"train_info/time_between_train_steps": 0.003065824508666992, "step": 1429} +{"info/global_step": 1430, "train_info/time_within_train_step": 2.6739819049835205, "step": 1430} +{"train_info/time_between_train_steps": 0.0031213760375976562, "step": 1430} +{"info/global_step": 1431, "train_info/time_within_train_step": 2.6738216876983643, "step": 1431} +{"train_info/time_between_train_steps": 0.003049135208129883, "step": 1431} +{"info/global_step": 1432, "train_info/time_within_train_step": 2.6757004261016846, "step": 1432} +{"train_info/time_between_train_steps": 0.0030694007873535156, "step": 1432} +{"info/global_step": 1433, "train_info/time_within_train_step": 2.6748218536376953, "step": 1433} +{"train_info/time_between_train_steps": 0.0030562877655029297, "step": 1433} +{"info/global_step": 1434, "train_info/time_within_train_step": 2.67441987991333, "step": 1434} +{"train_info/time_between_train_steps": 0.0030629634857177734, "step": 1434} +{"info/global_step": 1435, "train_info/time_within_train_step": 2.6742563247680664, "step": 1435} +{"train_info/time_between_train_steps": 0.003093242645263672, "step": 1435} +{"info/global_step": 1436, "train_info/time_within_train_step": 2.673354387283325, "step": 1436} +{"train_info/time_between_train_steps": 0.003175020217895508, "step": 1436} +{"info/global_step": 1437, "train_info/time_within_train_step": 2.958991765975952, "step": 1437} +{"train_info/time_between_train_steps": 0.0029900074005126953, "step": 1437} +{"info/global_step": 1438, "train_info/time_within_train_step": 2.6718530654907227, "step": 1438} +{"train_info/time_between_train_steps": 0.003152132034301758, "step": 1438} +{"info/global_step": 1439, "train_info/time_within_train_step": 2.672264814376831, "step": 1439} +{"train_info/time_between_train_steps": 0.0031065940856933594, "step": 1439} +{"info/global_step": 1440, "train_info/time_within_train_step": 2.672152519226074, "step": 1440} +{"train_info/time_between_train_steps": 0.0030782222747802734, "step": 1440} +{"info/global_step": 1441, "train_info/time_within_train_step": 2.6742546558380127, "step": 1441} +{"train_info/time_between_train_steps": 0.0031888484954833984, "step": 1441} +{"info/global_step": 1442, "train_info/time_within_train_step": 2.6749088764190674, "step": 1442} +{"train_info/time_between_train_steps": 0.003182649612426758, "step": 1442} +{"info/global_step": 1443, "train_info/time_within_train_step": 2.6734426021575928, "step": 1443} +{"train_info/time_between_train_steps": 0.0031588077545166016, "step": 1443} +{"info/global_step": 1444, "train_info/time_within_train_step": 2.6721272468566895, "step": 1444} +{"train_info/time_between_train_steps": 0.003141164779663086, "step": 1444} +{"info/global_step": 1445, "train_info/time_within_train_step": 2.6731319427490234, "step": 1445} +{"train_info/time_between_train_steps": 0.003123760223388672, "step": 1445} +{"info/global_step": 1446, "train_info/time_within_train_step": 2.6734673976898193, "step": 1446} +{"train_info/time_between_train_steps": 0.0032203197479248047, "step": 1446} +{"info/global_step": 1447, "train_info/time_within_train_step": 2.673248767852783, "step": 1447} +{"train_info/time_between_train_steps": 0.003224611282348633, "step": 1447} +{"info/global_step": 1448, "train_info/time_within_train_step": 2.6729307174682617, "step": 1448} +{"train_info/time_between_train_steps": 0.0032160282135009766, "step": 1448} +{"info/global_step": 1449, "train_info/time_within_train_step": 2.6733784675598145, "step": 1449} +{"train_info/time_between_train_steps": 0.0032677650451660156, "step": 1449} +{"info/global_step": 1450, "train_info/time_within_train_step": 2.6733853816986084, "step": 1450} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746207402, "_runtime": 4174}, "step": 1450} +{"logs": {"train/loss": 4.3399, "train/learning_rate": 0.0003444444444444444, "train/epoch": 1.2, "_timestamp": 1746207402, "_runtime": 4174}, "step": 1450} +{"train_info/time_between_train_steps": 0.024654150009155273, "step": 1450} +{"info/global_step": 1451, "train_info/time_within_train_step": 2.6721110343933105, "step": 1451} +{"train_info/time_between_train_steps": 0.0031549930572509766, "step": 1451} +{"info/global_step": 1452, "train_info/time_within_train_step": 2.67413330078125, "step": 1452} +{"train_info/time_between_train_steps": 0.0031957626342773438, "step": 1452} +{"info/global_step": 1453, "train_info/time_within_train_step": 2.6735451221466064, "step": 1453} +{"train_info/time_between_train_steps": 0.0032210350036621094, "step": 1453} +{"info/global_step": 1454, "train_info/time_within_train_step": 2.6723482608795166, "step": 1454} +{"train_info/time_between_train_steps": 0.0031189918518066406, "step": 1454} +{"info/global_step": 1455, "train_info/time_within_train_step": 2.7246124744415283, "step": 1455} +{"train_info/time_between_train_steps": 0.0031533241271972656, "step": 1455} +{"info/global_step": 1456, "train_info/time_within_train_step": 2.673603057861328, "step": 1456} +{"train_info/time_between_train_steps": 0.0032265186309814453, "step": 1456} +{"info/global_step": 1457, "train_info/time_within_train_step": 2.6735498905181885, "step": 1457} +{"train_info/time_between_train_steps": 0.003259897232055664, "step": 1457} +{"info/global_step": 1458, "train_info/time_within_train_step": 2.6757700443267822, "step": 1458} +{"train_info/time_between_train_steps": 0.003163576126098633, "step": 1458} +{"info/global_step": 1459, "train_info/time_within_train_step": 2.6725504398345947, "step": 1459} +{"train_info/time_between_train_steps": 0.0031692981719970703, "step": 1459} +{"info/global_step": 1460, "train_info/time_within_train_step": 2.672936201095581, "step": 1460} +{"train_info/time_between_train_steps": 0.003170490264892578, "step": 1460} +{"info/global_step": 1461, "train_info/time_within_train_step": 2.6725385189056396, "step": 1461} +{"train_info/time_between_train_steps": 0.0031888484954833984, "step": 1461} +{"info/global_step": 1462, "train_info/time_within_train_step": 2.6726722717285156, "step": 1462} +{"train_info/time_between_train_steps": 0.003114938735961914, "step": 1462} +{"info/global_step": 1463, "train_info/time_within_train_step": 2.6736574172973633, "step": 1463} +{"train_info/time_between_train_steps": 0.0031638145446777344, "step": 1463} +{"info/global_step": 1464, "train_info/time_within_train_step": 2.6737606525421143, "step": 1464} +{"train_info/time_between_train_steps": 0.0034453868865966797, "step": 1464} +{"info/global_step": 1465, "train_info/time_within_train_step": 2.6744484901428223, "step": 1465} +{"train_info/time_between_train_steps": 0.003215789794921875, "step": 1465} +{"info/global_step": 1466, "train_info/time_within_train_step": 2.6739020347595215, "step": 1466} +{"train_info/time_between_train_steps": 0.003144502639770508, "step": 1466} +{"info/global_step": 1467, "train_info/time_within_train_step": 2.6739120483398438, "step": 1467} +{"train_info/time_between_train_steps": 0.003129720687866211, "step": 1467} +{"info/global_step": 1468, "train_info/time_within_train_step": 2.6741652488708496, "step": 1468} +{"train_info/time_between_train_steps": 0.0033533573150634766, "step": 1468} +{"info/global_step": 1469, "train_info/time_within_train_step": 2.6740427017211914, "step": 1469} +{"train_info/time_between_train_steps": 0.003154277801513672, "step": 1469} +{"info/global_step": 1470, "train_info/time_within_train_step": 2.6731865406036377, "step": 1470} +{"train_info/time_between_train_steps": 0.0031287670135498047, "step": 1470} +{"info/global_step": 1471, "train_info/time_within_train_step": 2.672090768814087, "step": 1471} +{"train_info/time_between_train_steps": 0.0031065940856933594, "step": 1471} +{"info/global_step": 1472, "train_info/time_within_train_step": 2.674579620361328, "step": 1472} +{"train_info/time_between_train_steps": 0.003190755844116211, "step": 1472} +{"info/global_step": 1473, "train_info/time_within_train_step": 2.671518325805664, "step": 1473} +{"train_info/time_between_train_steps": 0.0031037330627441406, "step": 1473} +{"info/global_step": 1474, "train_info/time_within_train_step": 2.6730496883392334, "step": 1474} +{"train_info/time_between_train_steps": 0.0031769275665283203, "step": 1474} +{"info/global_step": 1475, "train_info/time_within_train_step": 2.674243450164795, "step": 1475} +{"train_info/time_between_train_steps": 0.0031714439392089844, "step": 1475} +{"info/global_step": 1476, "train_info/time_within_train_step": 2.6748528480529785, "step": 1476} +{"train_info/time_between_train_steps": 0.0032033920288085938, "step": 1476} +{"info/global_step": 1477, "train_info/time_within_train_step": 2.6740562915802, "step": 1477} +{"train_info/time_between_train_steps": 0.003123044967651367, "step": 1477} +{"info/global_step": 1478, "train_info/time_within_train_step": 2.9455533027648926, "step": 1478} +{"train_info/time_between_train_steps": 0.0030689239501953125, "step": 1478} +{"info/global_step": 1479, "train_info/time_within_train_step": 2.6741220951080322, "step": 1479} +{"train_info/time_between_train_steps": 0.003037691116333008, "step": 1479} +{"info/global_step": 1480, "train_info/time_within_train_step": 2.673034429550171, "step": 1480} +{"train_info/time_between_train_steps": 0.003070354461669922, "step": 1480} +{"info/global_step": 1481, "train_info/time_within_train_step": 2.6717946529388428, "step": 1481} +{"train_info/time_between_train_steps": 0.0030586719512939453, "step": 1481} +{"info/global_step": 1482, "train_info/time_within_train_step": 2.671391725540161, "step": 1482} +{"train_info/time_between_train_steps": 0.002986907958984375, "step": 1482} +{"info/global_step": 1483, "train_info/time_within_train_step": 2.671083450317383, "step": 1483} +{"train_info/time_between_train_steps": 0.003148317337036133, "step": 1483} +{"info/global_step": 1484, "train_info/time_within_train_step": 2.673414707183838, "step": 1484} +{"train_info/time_between_train_steps": 0.0031905174255371094, "step": 1484} +{"info/global_step": 1485, "train_info/time_within_train_step": 2.6727235317230225, "step": 1485} +{"train_info/time_between_train_steps": 0.0031371116638183594, "step": 1485} +{"info/global_step": 1486, "train_info/time_within_train_step": 2.6720821857452393, "step": 1486} +{"train_info/time_between_train_steps": 0.0031566619873046875, "step": 1486} +{"info/global_step": 1487, "train_info/time_within_train_step": 2.672567844390869, "step": 1487} +{"train_info/time_between_train_steps": 0.003104686737060547, "step": 1487} +{"info/global_step": 1488, "train_info/time_within_train_step": 2.673225164413452, "step": 1488} +{"train_info/time_between_train_steps": 0.0032341480255126953, "step": 1488} +{"info/global_step": 1489, "train_info/time_within_train_step": 2.672013759613037, "step": 1489} +{"train_info/time_between_train_steps": 0.003188610076904297, "step": 1489} +{"info/global_step": 1490, "train_info/time_within_train_step": 2.6729109287261963, "step": 1490} +{"train_info/time_between_train_steps": 0.0031964778900146484, "step": 1490} +{"info/global_step": 1491, "train_info/time_within_train_step": 2.6738216876983643, "step": 1491} +{"train_info/time_between_train_steps": 0.003213644027709961, "step": 1491} +{"info/global_step": 1492, "train_info/time_within_train_step": 2.674459218978882, "step": 1492} +{"train_info/time_between_train_steps": 0.003170013427734375, "step": 1492} +{"info/global_step": 1493, "train_info/time_within_train_step": 2.6741223335266113, "step": 1493} +{"train_info/time_between_train_steps": 0.003175973892211914, "step": 1493} +{"info/global_step": 1494, "train_info/time_within_train_step": 2.6728901863098145, "step": 1494} +{"train_info/time_between_train_steps": 0.0032072067260742188, "step": 1494} +{"info/global_step": 1495, "train_info/time_within_train_step": 2.673405885696411, "step": 1495} +{"train_info/time_between_train_steps": 0.0032966136932373047, "step": 1495} +{"info/global_step": 1496, "train_info/time_within_train_step": 2.67232346534729, "step": 1496} +{"train_info/time_between_train_steps": 0.0031690597534179688, "step": 1496} +{"info/global_step": 1497, "train_info/time_within_train_step": 2.671605348587036, "step": 1497} +{"train_info/time_between_train_steps": 0.003161907196044922, "step": 1497} +{"info/global_step": 1498, "train_info/time_within_train_step": 2.6728179454803467, "step": 1498} +{"train_info/time_between_train_steps": 0.003148794174194336, "step": 1498} +{"info/global_step": 1499, "train_info/time_within_train_step": 2.672032356262207, "step": 1499} +{"train_info/time_between_train_steps": 0.0031890869140625, "step": 1499} +{"info/global_step": 1500, "train_info/time_within_train_step": 3.273573398590088, "step": 1500} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746207537, "_runtime": 4309}, "step": 1500} +{"logs": {"train/loss": 4.309, "train/learning_rate": 0.0003333333333333333, "train/epoch": 1.21, "_timestamp": 1746207537, "_runtime": 4309}, "step": 1500} +{"train_info/time_between_train_steps": 14.089911222457886, "step": 1500} +{"info/global_step": 1501, "train_info/time_within_train_step": 2.4810426235198975, "step": 1501} +{"train_info/time_between_train_steps": 0.003290414810180664, "step": 1501} +{"info/global_step": 1502, "train_info/time_within_train_step": 2.459300994873047, "step": 1502} +{"train_info/time_between_train_steps": 0.0031850337982177734, "step": 1502} +{"info/global_step": 1503, "train_info/time_within_train_step": 2.4709982872009277, "step": 1503} +{"train_info/time_between_train_steps": 0.004595279693603516, "step": 1503} +{"info/global_step": 1504, "train_info/time_within_train_step": 2.648719072341919, "step": 1504} +{"train_info/time_between_train_steps": 0.006322383880615234, "step": 1504} +{"info/global_step": 1505, "train_info/time_within_train_step": 2.669948101043701, "step": 1505} +{"train_info/time_between_train_steps": 0.006443023681640625, "step": 1505} +{"info/global_step": 1506, "train_info/time_within_train_step": 2.6710751056671143, "step": 1506} +{"train_info/time_between_train_steps": 0.0063571929931640625, "step": 1506} +{"info/global_step": 1507, "train_info/time_within_train_step": 2.671414375305176, "step": 1507} +{"train_info/time_between_train_steps": 0.006384611129760742, "step": 1507} +{"info/global_step": 1508, "train_info/time_within_train_step": 2.6718149185180664, "step": 1508} +{"train_info/time_between_train_steps": 0.0031654834747314453, "step": 1508} +{"info/global_step": 1509, "train_info/time_within_train_step": 2.6723344326019287, "step": 1509} +{"train_info/time_between_train_steps": 0.006414651870727539, "step": 1509} +{"info/global_step": 1510, "train_info/time_within_train_step": 2.6743316650390625, "step": 1510} +{"train_info/time_between_train_steps": 0.006380796432495117, "step": 1510} +{"info/global_step": 1511, "train_info/time_within_train_step": 2.6762022972106934, "step": 1511} +{"train_info/time_between_train_steps": 0.003164529800415039, "step": 1511} +{"info/global_step": 1512, "train_info/time_within_train_step": 2.67476749420166, "step": 1512} +{"train_info/time_between_train_steps": 0.003216266632080078, "step": 1512} +{"info/global_step": 1513, "train_info/time_within_train_step": 2.67438006401062, "step": 1513} +{"train_info/time_between_train_steps": 0.0032501220703125, "step": 1513} +{"info/global_step": 1514, "train_info/time_within_train_step": 2.6756551265716553, "step": 1514} +{"train_info/time_between_train_steps": 0.00635528564453125, "step": 1514} +{"info/global_step": 1515, "train_info/time_within_train_step": 2.6725480556488037, "step": 1515} +{"train_info/time_between_train_steps": 0.006457090377807617, "step": 1515} +{"info/global_step": 1516, "train_info/time_within_train_step": 2.672502279281616, "step": 1516} +{"train_info/time_between_train_steps": 0.006438016891479492, "step": 1516} +{"info/global_step": 1517, "train_info/time_within_train_step": 2.9632861614227295, "step": 1517} +{"train_info/time_between_train_steps": 0.002994060516357422, "step": 1517} +{"info/global_step": 1518, "train_info/time_within_train_step": 2.6717641353607178, "step": 1518} +{"train_info/time_between_train_steps": 0.0029523372650146484, "step": 1518} +{"info/global_step": 1519, "train_info/time_within_train_step": 2.671665906906128, "step": 1519} +{"train_info/time_between_train_steps": 0.0029556751251220703, "step": 1519} +{"info/global_step": 1520, "train_info/time_within_train_step": 2.672746419906616, "step": 1520} +{"train_info/time_between_train_steps": 0.006143093109130859, "step": 1520} +{"info/global_step": 1521, "train_info/time_within_train_step": 2.673386573791504, "step": 1521} +{"train_info/time_between_train_steps": 0.0061719417572021484, "step": 1521} +{"info/global_step": 1522, "train_info/time_within_train_step": 2.6720187664031982, "step": 1522} +{"train_info/time_between_train_steps": 0.006163597106933594, "step": 1522} +{"info/global_step": 1523, "train_info/time_within_train_step": 2.6725518703460693, "step": 1523} +{"train_info/time_between_train_steps": 0.002938508987426758, "step": 1523} +{"info/global_step": 1524, "train_info/time_within_train_step": 2.6747066974639893, "step": 1524} +{"train_info/time_between_train_steps": 0.006245613098144531, "step": 1524} +{"info/global_step": 1525, "train_info/time_within_train_step": 2.6748640537261963, "step": 1525} +{"train_info/time_between_train_steps": 0.006268024444580078, "step": 1525} +{"info/global_step": 1526, "train_info/time_within_train_step": 2.6744394302368164, "step": 1526} +{"train_info/time_between_train_steps": 0.006200075149536133, "step": 1526} +{"info/global_step": 1527, "train_info/time_within_train_step": 2.6736395359039307, "step": 1527} +{"train_info/time_between_train_steps": 0.003050565719604492, "step": 1527} +{"info/global_step": 1528, "train_info/time_within_train_step": 2.6723928451538086, "step": 1528} +{"train_info/time_between_train_steps": 0.002998828887939453, "step": 1528} +{"info/global_step": 1529, "train_info/time_within_train_step": 2.672267198562622, "step": 1529} +{"train_info/time_between_train_steps": 0.0030670166015625, "step": 1529} +{"info/global_step": 1530, "train_info/time_within_train_step": 2.672842025756836, "step": 1530} +{"train_info/time_between_train_steps": 0.003149747848510742, "step": 1530} +{"info/global_step": 1531, "train_info/time_within_train_step": 2.673403024673462, "step": 1531} +{"train_info/time_between_train_steps": 0.003206968307495117, "step": 1531} +{"info/global_step": 1532, "train_info/time_within_train_step": 2.6746666431427, "step": 1532} +{"train_info/time_between_train_steps": 0.0031936168670654297, "step": 1532} +{"info/global_step": 1533, "train_info/time_within_train_step": 2.673109292984009, "step": 1533} +{"train_info/time_between_train_steps": 0.0032405853271484375, "step": 1533} +{"info/global_step": 1534, "train_info/time_within_train_step": 2.672869920730591, "step": 1534} +{"train_info/time_between_train_steps": 0.0032393932342529297, "step": 1534} +{"info/global_step": 1535, "train_info/time_within_train_step": 2.6728498935699463, "step": 1535} +{"train_info/time_between_train_steps": 0.003197908401489258, "step": 1535} +{"info/global_step": 1536, "train_info/time_within_train_step": 2.675041675567627, "step": 1536} +{"train_info/time_between_train_steps": 0.0032167434692382812, "step": 1536} +{"info/global_step": 1537, "train_info/time_within_train_step": 2.6735544204711914, "step": 1537} +{"train_info/time_between_train_steps": 0.004265546798706055, "step": 1537} +{"info/global_step": 1538, "train_info/time_within_train_step": 2.672961711883545, "step": 1538} +{"train_info/time_between_train_steps": 0.0031898021697998047, "step": 1538} +{"info/global_step": 1539, "train_info/time_within_train_step": 2.673427104949951, "step": 1539} +{"train_info/time_between_train_steps": 0.003262758255004883, "step": 1539} +{"info/global_step": 1540, "train_info/time_within_train_step": 2.672268867492676, "step": 1540} +{"train_info/time_between_train_steps": 0.003193378448486328, "step": 1540} +{"info/global_step": 1541, "train_info/time_within_train_step": 2.6725258827209473, "step": 1541} +{"train_info/time_between_train_steps": 0.0031409263610839844, "step": 1541} +{"info/global_step": 1542, "train_info/time_within_train_step": 2.6712141036987305, "step": 1542} +{"train_info/time_between_train_steps": 0.003236055374145508, "step": 1542} +{"info/global_step": 1543, "train_info/time_within_train_step": 2.6714038848876953, "step": 1543} +{"train_info/time_between_train_steps": 0.0031747817993164062, "step": 1543} +{"info/global_step": 1544, "train_info/time_within_train_step": 2.671422004699707, "step": 1544} +{"train_info/time_between_train_steps": 0.0032210350036621094, "step": 1544} +{"info/global_step": 1545, "train_info/time_within_train_step": 2.6702191829681396, "step": 1545} +{"train_info/time_between_train_steps": 0.003154754638671875, "step": 1545} +{"info/global_step": 1546, "train_info/time_within_train_step": 2.6712586879730225, "step": 1546} +{"train_info/time_between_train_steps": 0.00307464599609375, "step": 1546} +{"info/global_step": 1547, "train_info/time_within_train_step": 2.6708106994628906, "step": 1547} +{"train_info/time_between_train_steps": 0.003168344497680664, "step": 1547} +{"info/global_step": 1548, "train_info/time_within_train_step": 2.670902729034424, "step": 1548} +{"train_info/time_between_train_steps": 0.003313302993774414, "step": 1548} +{"info/global_step": 1549, "train_info/time_within_train_step": 2.670794725418091, "step": 1549} +{"train_info/time_between_train_steps": 0.0031366348266601562, "step": 1549} +{"info/global_step": 1550, "train_info/time_within_train_step": 2.669867992401123, "step": 1550} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746207686, "_runtime": 4458}, "step": 1550} +{"logs": {"train/loss": 4.2883, "train/learning_rate": 0.0003222222222222222, "train/epoch": 1.23, "_timestamp": 1746207686, "_runtime": 4458}, "step": 1550} +{"train_info/time_between_train_steps": 0.024417877197265625, "step": 1550} +{"info/global_step": 1551, "train_info/time_within_train_step": 2.6709556579589844, "step": 1551} +{"train_info/time_between_train_steps": 0.0031189918518066406, "step": 1551} +{"info/global_step": 1552, "train_info/time_within_train_step": 2.6706700325012207, "step": 1552} +{"train_info/time_between_train_steps": 0.003128528594970703, "step": 1552} +{"info/global_step": 1553, "train_info/time_within_train_step": 2.672118663787842, "step": 1553} +{"train_info/time_between_train_steps": 0.0031762123107910156, "step": 1553} +{"info/global_step": 1554, "train_info/time_within_train_step": 2.6714560985565186, "step": 1554} +{"train_info/time_between_train_steps": 0.0032656192779541016, "step": 1554} +{"info/global_step": 1555, "train_info/time_within_train_step": 2.6710927486419678, "step": 1555} +{"train_info/time_between_train_steps": 0.0030901432037353516, "step": 1555} +{"info/global_step": 1556, "train_info/time_within_train_step": 2.67086124420166, "step": 1556} +{"train_info/time_between_train_steps": 0.003160238265991211, "step": 1556} +{"info/global_step": 1557, "train_info/time_within_train_step": 2.6709022521972656, "step": 1557} +{"train_info/time_between_train_steps": 0.0030820369720458984, "step": 1557} +{"info/global_step": 1558, "train_info/time_within_train_step": 2.67087721824646, "step": 1558} +{"train_info/time_between_train_steps": 0.003263235092163086, "step": 1558} +{"info/global_step": 1559, "train_info/time_within_train_step": 2.669511318206787, "step": 1559} +{"train_info/time_between_train_steps": 0.003194093704223633, "step": 1559} +{"info/global_step": 1560, "train_info/time_within_train_step": 2.6703238487243652, "step": 1560} +{"train_info/time_between_train_steps": 0.0031554698944091797, "step": 1560} +{"info/global_step": 1561, "train_info/time_within_train_step": 2.6712708473205566, "step": 1561} +{"train_info/time_between_train_steps": 0.0031762123107910156, "step": 1561} +{"info/global_step": 1562, "train_info/time_within_train_step": 2.6702914237976074, "step": 1562} +{"train_info/time_between_train_steps": 0.0031180381774902344, "step": 1562} +{"info/global_step": 1563, "train_info/time_within_train_step": 2.6712188720703125, "step": 1563} +{"train_info/time_between_train_steps": 0.003265857696533203, "step": 1563} +{"info/global_step": 1564, "train_info/time_within_train_step": 2.6716079711914062, "step": 1564} +{"train_info/time_between_train_steps": 0.0031859874725341797, "step": 1564} +{"info/global_step": 1565, "train_info/time_within_train_step": 2.670755624771118, "step": 1565} +{"train_info/time_between_train_steps": 0.0031554698944091797, "step": 1565} +{"info/global_step": 1566, "train_info/time_within_train_step": 2.670365571975708, "step": 1566} +{"train_info/time_between_train_steps": 0.00316619873046875, "step": 1566} +{"info/global_step": 1567, "train_info/time_within_train_step": 2.672865152359009, "step": 1567} +{"train_info/time_between_train_steps": 0.0031824111938476562, "step": 1567} +{"info/global_step": 1568, "train_info/time_within_train_step": 2.672696828842163, "step": 1568} +{"train_info/time_between_train_steps": 0.003162384033203125, "step": 1568} +{"info/global_step": 1569, "train_info/time_within_train_step": 2.6707661151885986, "step": 1569} +{"train_info/time_between_train_steps": 0.003134489059448242, "step": 1569} +{"info/global_step": 1570, "train_info/time_within_train_step": 2.670060634613037, "step": 1570} +{"train_info/time_between_train_steps": 0.0031375885009765625, "step": 1570} +{"info/global_step": 1571, "train_info/time_within_train_step": 2.6698379516601562, "step": 1571} +{"train_info/time_between_train_steps": 0.0031423568725585938, "step": 1571} +{"info/global_step": 1572, "train_info/time_within_train_step": 2.6730895042419434, "step": 1572} +{"train_info/time_between_train_steps": 0.003171682357788086, "step": 1572} +{"info/global_step": 1573, "train_info/time_within_train_step": 2.670609474182129, "step": 1573} +{"train_info/time_between_train_steps": 0.003191232681274414, "step": 1573} +{"info/global_step": 1574, "train_info/time_within_train_step": 2.670657157897949, "step": 1574} +{"train_info/time_between_train_steps": 0.0030875205993652344, "step": 1574} +{"info/global_step": 1575, "train_info/time_within_train_step": 2.671109437942505, "step": 1575} +{"train_info/time_between_train_steps": 0.003148317337036133, "step": 1575} +{"info/global_step": 1576, "train_info/time_within_train_step": 2.671062707901001, "step": 1576} +{"train_info/time_between_train_steps": 0.0031392574310302734, "step": 1576} +{"info/global_step": 1577, "train_info/time_within_train_step": 2.670706033706665, "step": 1577} +{"train_info/time_between_train_steps": 0.0030984878540039062, "step": 1577} +{"info/global_step": 1578, "train_info/time_within_train_step": 2.6717417240142822, "step": 1578} +{"train_info/time_between_train_steps": 0.003123044967651367, "step": 1578} +{"info/global_step": 1579, "train_info/time_within_train_step": 2.6720221042633057, "step": 1579} +{"train_info/time_between_train_steps": 0.0031266212463378906, "step": 1579} +{"info/global_step": 1580, "train_info/time_within_train_step": 2.671595335006714, "step": 1580} +{"train_info/time_between_train_steps": 0.0031571388244628906, "step": 1580} +{"info/global_step": 1581, "train_info/time_within_train_step": 2.6722331047058105, "step": 1581} +{"train_info/time_between_train_steps": 0.003156423568725586, "step": 1581} +{"info/global_step": 1582, "train_info/time_within_train_step": 2.672056198120117, "step": 1582} +{"train_info/time_between_train_steps": 0.0031163692474365234, "step": 1582} +{"info/global_step": 1583, "train_info/time_within_train_step": 2.6710166931152344, "step": 1583} +{"train_info/time_between_train_steps": 0.0031974315643310547, "step": 1583} +{"info/global_step": 1584, "train_info/time_within_train_step": 2.6711955070495605, "step": 1584} +{"train_info/time_between_train_steps": 0.0031147003173828125, "step": 1584} +{"info/global_step": 1585, "train_info/time_within_train_step": 2.669992685317993, "step": 1585} +{"train_info/time_between_train_steps": 0.0031518936157226562, "step": 1585} +{"info/global_step": 1586, "train_info/time_within_train_step": 2.6716268062591553, "step": 1586} +{"train_info/time_between_train_steps": 0.003162860870361328, "step": 1586} +{"info/global_step": 1587, "train_info/time_within_train_step": 2.671914577484131, "step": 1587} +{"train_info/time_between_train_steps": 0.0032927989959716797, "step": 1587} +{"info/global_step": 1588, "train_info/time_within_train_step": 2.670426607131958, "step": 1588} +{"train_info/time_between_train_steps": 0.003114938735961914, "step": 1588} +{"info/global_step": 1589, "train_info/time_within_train_step": 2.671207904815674, "step": 1589} +{"train_info/time_between_train_steps": 0.0031900405883789062, "step": 1589} +{"info/global_step": 1590, "train_info/time_within_train_step": 2.671656370162964, "step": 1590} +{"train_info/time_between_train_steps": 0.003182649612426758, "step": 1590} +{"info/global_step": 1591, "train_info/time_within_train_step": 2.6712279319763184, "step": 1591} +{"train_info/time_between_train_steps": 0.0031571388244628906, "step": 1591} +{"info/global_step": 1592, "train_info/time_within_train_step": 2.672384262084961, "step": 1592} +{"train_info/time_between_train_steps": 0.0031731128692626953, "step": 1592} +{"info/global_step": 1593, "train_info/time_within_train_step": 2.673614501953125, "step": 1593} +{"train_info/time_between_train_steps": 0.003225088119506836, "step": 1593} +{"info/global_step": 1594, "train_info/time_within_train_step": 2.67596697807312, "step": 1594} +{"train_info/time_between_train_steps": 0.0032296180725097656, "step": 1594} +{"info/global_step": 1595, "train_info/time_within_train_step": 2.6722474098205566, "step": 1595} +{"train_info/time_between_train_steps": 0.003200531005859375, "step": 1595} +{"info/global_step": 1596, "train_info/time_within_train_step": 2.7130000591278076, "step": 1596} +{"train_info/time_between_train_steps": 0.0031511783599853516, "step": 1596} +{"info/global_step": 1597, "train_info/time_within_train_step": 2.6723551750183105, "step": 1597} +{"train_info/time_between_train_steps": 0.0031223297119140625, "step": 1597} +{"info/global_step": 1598, "train_info/time_within_train_step": 2.671689748764038, "step": 1598} +{"train_info/time_between_train_steps": 0.0032181739807128906, "step": 1598} +{"info/global_step": 1599, "train_info/time_within_train_step": 2.673288583755493, "step": 1599} +{"train_info/time_between_train_steps": 0.003179311752319336, "step": 1599} +{"info/global_step": 1600, "train_info/time_within_train_step": 2.6711559295654297, "step": 1600} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746207821, "_runtime": 4593}, "step": 1600} +{"logs": {"train/loss": 4.2786, "train/learning_rate": 0.00031111111111111107, "train/epoch": 1.25, "_timestamp": 1746207821, "_runtime": 4593}, "step": 1600} +{"train_info/time_between_train_steps": 13.27854609489441, "step": 1600} +{"info/global_step": 1601, "train_info/time_within_train_step": 2.4748027324676514, "step": 1601} +{"train_info/time_between_train_steps": 0.00321197509765625, "step": 1601} +{"info/global_step": 1602, "train_info/time_within_train_step": 2.4555113315582275, "step": 1602} +{"train_info/time_between_train_steps": 0.0031728744506835938, "step": 1602} +{"info/global_step": 1603, "train_info/time_within_train_step": 2.493997097015381, "step": 1603} +{"train_info/time_between_train_steps": 0.003159761428833008, "step": 1603} +{"info/global_step": 1604, "train_info/time_within_train_step": 2.6662888526916504, "step": 1604} +{"train_info/time_between_train_steps": 0.0031824111938476562, "step": 1604} +{"info/global_step": 1605, "train_info/time_within_train_step": 2.6710479259490967, "step": 1605} +{"train_info/time_between_train_steps": 0.0031855106353759766, "step": 1605} +{"info/global_step": 1606, "train_info/time_within_train_step": 2.6736221313476562, "step": 1606} +{"train_info/time_between_train_steps": 0.003175020217895508, "step": 1606} +{"info/global_step": 1607, "train_info/time_within_train_step": 2.67181134223938, "step": 1607} +{"train_info/time_between_train_steps": 0.003133535385131836, "step": 1607} +{"info/global_step": 1608, "train_info/time_within_train_step": 2.6765940189361572, "step": 1608} +{"train_info/time_between_train_steps": 0.0031299591064453125, "step": 1608} +{"info/global_step": 1609, "train_info/time_within_train_step": 2.6718876361846924, "step": 1609} +{"train_info/time_between_train_steps": 0.0031037330627441406, "step": 1609} +{"info/global_step": 1610, "train_info/time_within_train_step": 2.672067403793335, "step": 1610} +{"train_info/time_between_train_steps": 0.0031404495239257812, "step": 1610} +{"info/global_step": 1611, "train_info/time_within_train_step": 2.6730237007141113, "step": 1611} +{"train_info/time_between_train_steps": 0.003208160400390625, "step": 1611} +{"info/global_step": 1612, "train_info/time_within_train_step": 2.6722123622894287, "step": 1612} +{"train_info/time_between_train_steps": 0.003163576126098633, "step": 1612} +{"info/global_step": 1613, "train_info/time_within_train_step": 2.8269288539886475, "step": 1613} +{"train_info/time_between_train_steps": 0.0029745101928710938, "step": 1613} +{"info/global_step": 1614, "train_info/time_within_train_step": 2.6715593338012695, "step": 1614} +{"train_info/time_between_train_steps": 0.0029768943786621094, "step": 1614} +{"info/global_step": 1615, "train_info/time_within_train_step": 2.671584367752075, "step": 1615} +{"train_info/time_between_train_steps": 0.002969503402709961, "step": 1615} +{"info/global_step": 1616, "train_info/time_within_train_step": 2.6717166900634766, "step": 1616} +{"train_info/time_between_train_steps": 0.002950906753540039, "step": 1616} +{"info/global_step": 1617, "train_info/time_within_train_step": 2.672564744949341, "step": 1617} +{"train_info/time_between_train_steps": 0.002965211868286133, "step": 1617} +{"info/global_step": 1618, "train_info/time_within_train_step": 2.6731510162353516, "step": 1618} +{"train_info/time_between_train_steps": 0.0029807090759277344, "step": 1618} +{"info/global_step": 1619, "train_info/time_within_train_step": 2.6722183227539062, "step": 1619} +{"train_info/time_between_train_steps": 0.0029296875, "step": 1619} +{"info/global_step": 1620, "train_info/time_within_train_step": 2.6722443103790283, "step": 1620} +{"train_info/time_between_train_steps": 0.002936840057373047, "step": 1620} +{"info/global_step": 1621, "train_info/time_within_train_step": 2.6712636947631836, "step": 1621} +{"train_info/time_between_train_steps": 0.0029718875885009766, "step": 1621} +{"info/global_step": 1622, "train_info/time_within_train_step": 2.6712100505828857, "step": 1622} +{"train_info/time_between_train_steps": 0.003195524215698242, "step": 1622} +{"info/global_step": 1623, "train_info/time_within_train_step": 2.6714601516723633, "step": 1623} +{"train_info/time_between_train_steps": 0.002931833267211914, "step": 1623} +{"info/global_step": 1624, "train_info/time_within_train_step": 2.721905469894409, "step": 1624} +{"train_info/time_between_train_steps": 0.0030074119567871094, "step": 1624} +{"info/global_step": 1625, "train_info/time_within_train_step": 2.6709001064300537, "step": 1625} +{"train_info/time_between_train_steps": 0.0029571056365966797, "step": 1625} +{"info/global_step": 1626, "train_info/time_within_train_step": 2.671428680419922, "step": 1626} +{"train_info/time_between_train_steps": 0.0029697418212890625, "step": 1626} +{"info/global_step": 1627, "train_info/time_within_train_step": 2.6728270053863525, "step": 1627} +{"train_info/time_between_train_steps": 0.002956390380859375, "step": 1627} +{"info/global_step": 1628, "train_info/time_within_train_step": 2.672631025314331, "step": 1628} +{"train_info/time_between_train_steps": 0.002939462661743164, "step": 1628} +{"info/global_step": 1629, "train_info/time_within_train_step": 2.6720402240753174, "step": 1629} +{"train_info/time_between_train_steps": 0.002933979034423828, "step": 1629} +{"info/global_step": 1630, "train_info/time_within_train_step": 2.672513723373413, "step": 1630} +{"train_info/time_between_train_steps": 0.0030317306518554688, "step": 1630} +{"info/global_step": 1631, "train_info/time_within_train_step": 2.6715283393859863, "step": 1631} +{"train_info/time_between_train_steps": 0.002971649169921875, "step": 1631} +{"info/global_step": 1632, "train_info/time_within_train_step": 2.6732568740844727, "step": 1632} +{"train_info/time_between_train_steps": 0.002949237823486328, "step": 1632} +{"info/global_step": 1633, "train_info/time_within_train_step": 2.67341685295105, "step": 1633} +{"train_info/time_between_train_steps": 0.002913236618041992, "step": 1633} +{"info/global_step": 1634, "train_info/time_within_train_step": 2.671677827835083, "step": 1634} +{"train_info/time_between_train_steps": 0.002969503402709961, "step": 1634} +{"info/global_step": 1635, "train_info/time_within_train_step": 2.6715221405029297, "step": 1635} +{"train_info/time_between_train_steps": 0.0029630661010742188, "step": 1635} +{"info/global_step": 1636, "train_info/time_within_train_step": 2.671607494354248, "step": 1636} +{"train_info/time_between_train_steps": 0.002951383590698242, "step": 1636} +{"info/global_step": 1637, "train_info/time_within_train_step": 2.6706011295318604, "step": 1637} +{"train_info/time_between_train_steps": 0.003139019012451172, "step": 1637} +{"info/global_step": 1638, "train_info/time_within_train_step": 2.6709182262420654, "step": 1638} +{"train_info/time_between_train_steps": 0.003070354461669922, "step": 1638} +{"info/global_step": 1639, "train_info/time_within_train_step": 2.6715314388275146, "step": 1639} +{"train_info/time_between_train_steps": 0.0032694339752197266, "step": 1639} +{"info/global_step": 1640, "train_info/time_within_train_step": 2.672097682952881, "step": 1640} +{"train_info/time_between_train_steps": 0.0032701492309570312, "step": 1640} +{"info/global_step": 1641, "train_info/time_within_train_step": 2.6719861030578613, "step": 1641} +{"train_info/time_between_train_steps": 0.003163576126098633, "step": 1641} +{"info/global_step": 1642, "train_info/time_within_train_step": 2.6712799072265625, "step": 1642} +{"train_info/time_between_train_steps": 0.0032110214233398438, "step": 1642} +{"info/global_step": 1643, "train_info/time_within_train_step": 2.6705384254455566, "step": 1643} +{"train_info/time_between_train_steps": 0.003244161605834961, "step": 1643} +{"info/global_step": 1644, "train_info/time_within_train_step": 2.672621488571167, "step": 1644} +{"train_info/time_between_train_steps": 0.0031697750091552734, "step": 1644} +{"info/global_step": 1645, "train_info/time_within_train_step": 2.67175030708313, "step": 1645} +{"train_info/time_between_train_steps": 0.003145456314086914, "step": 1645} +{"info/global_step": 1646, "train_info/time_within_train_step": 2.6715474128723145, "step": 1646} +{"train_info/time_between_train_steps": 0.003139972686767578, "step": 1646} +{"info/global_step": 1647, "train_info/time_within_train_step": 2.6719892024993896, "step": 1647} +{"train_info/time_between_train_steps": 0.0031468868255615234, "step": 1647} +{"info/global_step": 1648, "train_info/time_within_train_step": 2.6709036827087402, "step": 1648} +{"train_info/time_between_train_steps": 0.003113269805908203, "step": 1648} +{"info/global_step": 1649, "train_info/time_within_train_step": 2.671698808670044, "step": 1649} +{"train_info/time_between_train_steps": 0.0031232833862304688, "step": 1649} +{"info/global_step": 1650, "train_info/time_within_train_step": 2.6715009212493896, "step": 1650} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746207969, "_runtime": 4741}, "step": 1650} +{"logs": {"train/loss": 4.2504, "train/learning_rate": 0.0003, "train/epoch": 1.26, "_timestamp": 1746207969, "_runtime": 4741}, "step": 1650} +{"train_info/time_between_train_steps": 0.02451300621032715, "step": 1650} +{"info/global_step": 1651, "train_info/time_within_train_step": 2.671355962753296, "step": 1651} +{"train_info/time_between_train_steps": 0.0030975341796875, "step": 1651} +{"info/global_step": 1652, "train_info/time_within_train_step": 2.671651601791382, "step": 1652} +{"train_info/time_between_train_steps": 0.0031142234802246094, "step": 1652} +{"info/global_step": 1653, "train_info/time_within_train_step": 2.6721129417419434, "step": 1653} +{"train_info/time_between_train_steps": 0.0031604766845703125, "step": 1653} +{"info/global_step": 1654, "train_info/time_within_train_step": 2.6709721088409424, "step": 1654} +{"train_info/time_between_train_steps": 0.0032036304473876953, "step": 1654} +{"info/global_step": 1655, "train_info/time_within_train_step": 2.6700901985168457, "step": 1655} +{"train_info/time_between_train_steps": 0.003160715103149414, "step": 1655} +{"info/global_step": 1656, "train_info/time_within_train_step": 2.6707699298858643, "step": 1656} +{"train_info/time_between_train_steps": 0.003226041793823242, "step": 1656} +{"info/global_step": 1657, "train_info/time_within_train_step": 2.67097544670105, "step": 1657} +{"train_info/time_between_train_steps": 0.0031630992889404297, "step": 1657} +{"info/global_step": 1658, "train_info/time_within_train_step": 2.67111873626709, "step": 1658} +{"train_info/time_between_train_steps": 0.0031905174255371094, "step": 1658} +{"info/global_step": 1659, "train_info/time_within_train_step": 2.671407699584961, "step": 1659} +{"train_info/time_between_train_steps": 0.0031197071075439453, "step": 1659} +{"info/global_step": 1660, "train_info/time_within_train_step": 2.6710472106933594, "step": 1660} +{"train_info/time_between_train_steps": 0.0031995773315429688, "step": 1660} +{"info/global_step": 1661, "train_info/time_within_train_step": 2.6714651584625244, "step": 1661} +{"train_info/time_between_train_steps": 0.0030868053436279297, "step": 1661} +{"info/global_step": 1662, "train_info/time_within_train_step": 2.670663833618164, "step": 1662} +{"train_info/time_between_train_steps": 0.0031461715698242188, "step": 1662} +{"info/global_step": 1663, "train_info/time_within_train_step": 2.67209529876709, "step": 1663} +{"train_info/time_between_train_steps": 0.003098011016845703, "step": 1663} +{"info/global_step": 1664, "train_info/time_within_train_step": 2.67151141166687, "step": 1664} +{"train_info/time_between_train_steps": 0.0030994415283203125, "step": 1664} +{"info/global_step": 1665, "train_info/time_within_train_step": 2.6698849201202393, "step": 1665} +{"train_info/time_between_train_steps": 0.003094196319580078, "step": 1665} +{"info/global_step": 1666, "train_info/time_within_train_step": 2.7713582515716553, "step": 1666} +{"train_info/time_between_train_steps": 0.0029964447021484375, "step": 1666} +{"info/global_step": 1667, "train_info/time_within_train_step": 2.669830799102783, "step": 1667} +{"train_info/time_between_train_steps": 0.002991914749145508, "step": 1667} +{"info/global_step": 1668, "train_info/time_within_train_step": 2.6699211597442627, "step": 1668} +{"train_info/time_between_train_steps": 0.0029478073120117188, "step": 1668} +{"info/global_step": 1669, "train_info/time_within_train_step": 2.6698005199432373, "step": 1669} +{"train_info/time_between_train_steps": 0.0029833316802978516, "step": 1669} +{"info/global_step": 1670, "train_info/time_within_train_step": 2.6709823608398438, "step": 1670} +{"train_info/time_between_train_steps": 0.0030307769775390625, "step": 1670} +{"info/global_step": 1671, "train_info/time_within_train_step": 2.6687850952148438, "step": 1671} +{"train_info/time_between_train_steps": 0.0029599666595458984, "step": 1671} +{"info/global_step": 1672, "train_info/time_within_train_step": 2.669084072113037, "step": 1672} +{"train_info/time_between_train_steps": 0.0030143260955810547, "step": 1672} +{"info/global_step": 1673, "train_info/time_within_train_step": 2.6708178520202637, "step": 1673} +{"train_info/time_between_train_steps": 0.003038644790649414, "step": 1673} +{"info/global_step": 1674, "train_info/time_within_train_step": 2.6702353954315186, "step": 1674} +{"train_info/time_between_train_steps": 0.002950906753540039, "step": 1674} +{"info/global_step": 1675, "train_info/time_within_train_step": 2.6693949699401855, "step": 1675} +{"train_info/time_between_train_steps": 0.0031135082244873047, "step": 1675} +{"info/global_step": 1676, "train_info/time_within_train_step": 2.6695327758789062, "step": 1676} +{"train_info/time_between_train_steps": 0.0029888153076171875, "step": 1676} +{"info/global_step": 1677, "train_info/time_within_train_step": 2.6695146560668945, "step": 1677} +{"train_info/time_between_train_steps": 0.003016233444213867, "step": 1677} +{"info/global_step": 1678, "train_info/time_within_train_step": 2.6700820922851562, "step": 1678} +{"train_info/time_between_train_steps": 0.002965688705444336, "step": 1678} +{"info/global_step": 1679, "train_info/time_within_train_step": 2.6698145866394043, "step": 1679} +{"train_info/time_between_train_steps": 0.0030739307403564453, "step": 1679} +{"info/global_step": 1680, "train_info/time_within_train_step": 2.6701998710632324, "step": 1680} +{"train_info/time_between_train_steps": 0.0029675960540771484, "step": 1680} +{"info/global_step": 1681, "train_info/time_within_train_step": 2.669813394546509, "step": 1681} +{"train_info/time_between_train_steps": 0.0029516220092773438, "step": 1681} +{"info/global_step": 1682, "train_info/time_within_train_step": 2.6702301502227783, "step": 1682} +{"train_info/time_between_train_steps": 0.0029773712158203125, "step": 1682} +{"info/global_step": 1683, "train_info/time_within_train_step": 2.6692631244659424, "step": 1683} +{"train_info/time_between_train_steps": 0.0029523372650146484, "step": 1683} +{"info/global_step": 1684, "train_info/time_within_train_step": 2.6707851886749268, "step": 1684} +{"train_info/time_between_train_steps": 0.0029821395874023438, "step": 1684} +{"info/global_step": 1685, "train_info/time_within_train_step": 2.670274496078491, "step": 1685} +{"train_info/time_between_train_steps": 0.003070354461669922, "step": 1685} +{"info/global_step": 1686, "train_info/time_within_train_step": 2.6706676483154297, "step": 1686} +{"train_info/time_between_train_steps": 0.003002643585205078, "step": 1686} +{"info/global_step": 1687, "train_info/time_within_train_step": 2.6713881492614746, "step": 1687} +{"train_info/time_between_train_steps": 0.003034830093383789, "step": 1687} +{"info/global_step": 1688, "train_info/time_within_train_step": 2.6713712215423584, "step": 1688} +{"train_info/time_between_train_steps": 0.003034830093383789, "step": 1688} +{"info/global_step": 1689, "train_info/time_within_train_step": 2.670764684677124, "step": 1689} +{"train_info/time_between_train_steps": 0.003270864486694336, "step": 1689} +{"info/global_step": 1690, "train_info/time_within_train_step": 2.671617031097412, "step": 1690} +{"train_info/time_between_train_steps": 0.003069162368774414, "step": 1690} +{"info/global_step": 1691, "train_info/time_within_train_step": 2.72163987159729, "step": 1691} +{"train_info/time_between_train_steps": 0.003000974655151367, "step": 1691} +{"info/global_step": 1692, "train_info/time_within_train_step": 2.670358180999756, "step": 1692} +{"train_info/time_between_train_steps": 0.002987384796142578, "step": 1692} +{"info/global_step": 1693, "train_info/time_within_train_step": 2.6706626415252686, "step": 1693} +{"train_info/time_between_train_steps": 0.0030002593994140625, "step": 1693} +{"info/global_step": 1694, "train_info/time_within_train_step": 2.6694693565368652, "step": 1694} +{"train_info/time_between_train_steps": 0.0029828548431396484, "step": 1694} +{"info/global_step": 1695, "train_info/time_within_train_step": 2.6691677570343018, "step": 1695} +{"train_info/time_between_train_steps": 0.0030679702758789062, "step": 1695} +{"info/global_step": 1696, "train_info/time_within_train_step": 2.6696290969848633, "step": 1696} +{"train_info/time_between_train_steps": 0.003009319305419922, "step": 1696} +{"info/global_step": 1697, "train_info/time_within_train_step": 2.668625831604004, "step": 1697} +{"train_info/time_between_train_steps": 0.003011941909790039, "step": 1697} +{"info/global_step": 1698, "train_info/time_within_train_step": 2.6698403358459473, "step": 1698} +{"train_info/time_between_train_steps": 0.003011465072631836, "step": 1698} +{"info/global_step": 1699, "train_info/time_within_train_step": 2.6693663597106934, "step": 1699} +{"train_info/time_between_train_steps": 0.003011941909790039, "step": 1699} +{"info/global_step": 1700, "train_info/time_within_train_step": 2.669243335723877, "step": 1700} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746208103, "_runtime": 4875}, "step": 1700} +{"logs": {"train/loss": 4.2337, "train/learning_rate": 0.0002888888888888888, "train/epoch": 1.28, "_timestamp": 1746208103, "_runtime": 4875}, "step": 1700} +{"train_info/time_between_train_steps": 13.14522123336792, "step": 1700} +{"info/global_step": 1701, "train_info/time_within_train_step": 2.4691591262817383, "step": 1701} +{"train_info/time_between_train_steps": 0.0030345916748046875, "step": 1701} +{"info/global_step": 1702, "train_info/time_within_train_step": 2.458085536956787, "step": 1702} +{"train_info/time_between_train_steps": 0.0030117034912109375, "step": 1702} +{"info/global_step": 1703, "train_info/time_within_train_step": 2.5154361724853516, "step": 1703} +{"train_info/time_between_train_steps": 0.0031516551971435547, "step": 1703} +{"info/global_step": 1704, "train_info/time_within_train_step": 2.667337656021118, "step": 1704} +{"train_info/time_between_train_steps": 0.003313779830932617, "step": 1704} +{"info/global_step": 1705, "train_info/time_within_train_step": 2.6717677116394043, "step": 1705} +{"train_info/time_between_train_steps": 0.003245830535888672, "step": 1705} +{"info/global_step": 1706, "train_info/time_within_train_step": 2.6702561378479004, "step": 1706} +{"train_info/time_between_train_steps": 0.002988576889038086, "step": 1706} +{"info/global_step": 1707, "train_info/time_within_train_step": 2.6707534790039062, "step": 1707} +{"train_info/time_between_train_steps": 0.003008127212524414, "step": 1707} +{"info/global_step": 1708, "train_info/time_within_train_step": 2.6698760986328125, "step": 1708} +{"train_info/time_between_train_steps": 0.0031380653381347656, "step": 1708} +{"info/global_step": 1709, "train_info/time_within_train_step": 2.6705527305603027, "step": 1709} +{"train_info/time_between_train_steps": 0.003080129623413086, "step": 1709} +{"info/global_step": 1710, "train_info/time_within_train_step": 2.6700379848480225, "step": 1710} +{"train_info/time_between_train_steps": 0.003137826919555664, "step": 1710} +{"info/global_step": 1711, "train_info/time_within_train_step": 2.671241283416748, "step": 1711} +{"train_info/time_between_train_steps": 0.0032455921173095703, "step": 1711} +{"info/global_step": 1712, "train_info/time_within_train_step": 2.6724607944488525, "step": 1712} +{"train_info/time_between_train_steps": 0.0033872127532958984, "step": 1712} +{"info/global_step": 1713, "train_info/time_within_train_step": 2.6728928089141846, "step": 1713} +{"train_info/time_between_train_steps": 0.0033249855041503906, "step": 1713} +{"info/global_step": 1714, "train_info/time_within_train_step": 2.673959732055664, "step": 1714} +{"train_info/time_between_train_steps": 0.003243684768676758, "step": 1714} +{"info/global_step": 1715, "train_info/time_within_train_step": 2.6730644702911377, "step": 1715} +{"train_info/time_between_train_steps": 0.003186464309692383, "step": 1715} +{"info/global_step": 1716, "train_info/time_within_train_step": 2.6747875213623047, "step": 1716} +{"train_info/time_between_train_steps": 0.0031893253326416016, "step": 1716} +{"info/global_step": 1717, "train_info/time_within_train_step": 2.7237179279327393, "step": 1717} +{"train_info/time_between_train_steps": 0.003361940383911133, "step": 1717} +{"info/global_step": 1718, "train_info/time_within_train_step": 2.67321515083313, "step": 1718} +{"train_info/time_between_train_steps": 0.003215312957763672, "step": 1718} +{"info/global_step": 1719, "train_info/time_within_train_step": 2.6734302043914795, "step": 1719} +{"train_info/time_between_train_steps": 0.003290414810180664, "step": 1719} +{"info/global_step": 1720, "train_info/time_within_train_step": 2.6729588508605957, "step": 1720} +{"train_info/time_between_train_steps": 0.0032799243927001953, "step": 1720} +{"info/global_step": 1721, "train_info/time_within_train_step": 2.6729989051818848, "step": 1721} +{"train_info/time_between_train_steps": 0.0034847259521484375, "step": 1721} +{"info/global_step": 1722, "train_info/time_within_train_step": 2.672572135925293, "step": 1722} +{"train_info/time_between_train_steps": 0.003475189208984375, "step": 1722} +{"info/global_step": 1723, "train_info/time_within_train_step": 2.6727023124694824, "step": 1723} +{"train_info/time_between_train_steps": 0.003543376922607422, "step": 1723} +{"info/global_step": 1724, "train_info/time_within_train_step": 2.6719698905944824, "step": 1724} +{"train_info/time_between_train_steps": 0.0035636425018310547, "step": 1724} +{"info/global_step": 1725, "train_info/time_within_train_step": 2.6728179454803467, "step": 1725} +{"train_info/time_between_train_steps": 0.00394129753112793, "step": 1725} +{"info/global_step": 1726, "train_info/time_within_train_step": 2.6747801303863525, "step": 1726} +{"train_info/time_between_train_steps": 0.0036695003509521484, "step": 1726} +{"info/global_step": 1727, "train_info/time_within_train_step": 2.673034429550171, "step": 1727} +{"train_info/time_between_train_steps": 0.003679037094116211, "step": 1727} +{"info/global_step": 1728, "train_info/time_within_train_step": 2.6736714839935303, "step": 1728} +{"train_info/time_between_train_steps": 0.0034635066986083984, "step": 1728} +{"train_info/time_between_train_steps": 2.3512256145477295, "step": 1728} +{"info/global_step": 1729, "train_info/time_within_train_step": 2.910949230194092, "step": 1729} +{"train_info/time_between_train_steps": 0.0032629966735839844, "step": 1729} +{"info/global_step": 1730, "train_info/time_within_train_step": 2.7217440605163574, "step": 1730} +{"train_info/time_between_train_steps": 0.0032041072845458984, "step": 1730} +{"info/global_step": 1731, "train_info/time_within_train_step": 2.6709578037261963, "step": 1731} +{"train_info/time_between_train_steps": 0.003173828125, "step": 1731} +{"info/global_step": 1732, "train_info/time_within_train_step": 2.6714680194854736, "step": 1732} +{"train_info/time_between_train_steps": 0.003179311752319336, "step": 1732} +{"info/global_step": 1733, "train_info/time_within_train_step": 2.6718623638153076, "step": 1733} +{"train_info/time_between_train_steps": 0.003221750259399414, "step": 1733} +{"info/global_step": 1734, "train_info/time_within_train_step": 2.671285629272461, "step": 1734} +{"train_info/time_between_train_steps": 0.003173828125, "step": 1734} +{"info/global_step": 1735, "train_info/time_within_train_step": 2.670900344848633, "step": 1735} +{"train_info/time_between_train_steps": 0.003175497055053711, "step": 1735} +{"info/global_step": 1736, "train_info/time_within_train_step": 2.6735599040985107, "step": 1736} +{"train_info/time_between_train_steps": 0.003215789794921875, "step": 1736} +{"info/global_step": 1737, "train_info/time_within_train_step": 2.672349691390991, "step": 1737} +{"train_info/time_between_train_steps": 0.003244161605834961, "step": 1737} +{"info/global_step": 1738, "train_info/time_within_train_step": 2.672337532043457, "step": 1738} +{"train_info/time_between_train_steps": 0.003169536590576172, "step": 1738} +{"info/global_step": 1739, "train_info/time_within_train_step": 2.6719565391540527, "step": 1739} +{"train_info/time_between_train_steps": 0.003335237503051758, "step": 1739} +{"info/global_step": 1740, "train_info/time_within_train_step": 2.671396255493164, "step": 1740} +{"train_info/time_between_train_steps": 0.0034105777740478516, "step": 1740} +{"info/global_step": 1741, "train_info/time_within_train_step": 2.6724448204040527, "step": 1741} +{"train_info/time_between_train_steps": 0.003515481948852539, "step": 1741} +{"info/global_step": 1742, "train_info/time_within_train_step": 2.674163818359375, "step": 1742} +{"train_info/time_between_train_steps": 0.003640890121459961, "step": 1742} +{"info/global_step": 1743, "train_info/time_within_train_step": 2.6712522506713867, "step": 1743} +{"train_info/time_between_train_steps": 0.003520965576171875, "step": 1743} +{"info/global_step": 1744, "train_info/time_within_train_step": 2.7107367515563965, "step": 1744} +{"train_info/time_between_train_steps": 0.003542184829711914, "step": 1744} +{"info/global_step": 1745, "train_info/time_within_train_step": 2.6724252700805664, "step": 1745} +{"train_info/time_between_train_steps": 0.0034399032592773438, "step": 1745} +{"info/global_step": 1746, "train_info/time_within_train_step": 2.671314239501953, "step": 1746} +{"train_info/time_between_train_steps": 0.0034821033477783203, "step": 1746} +{"info/global_step": 1747, "train_info/time_within_train_step": 2.67230224609375, "step": 1747} +{"train_info/time_between_train_steps": 0.0033829212188720703, "step": 1747} +{"info/global_step": 1748, "train_info/time_within_train_step": 2.6726646423339844, "step": 1748} +{"train_info/time_between_train_steps": 0.0034689903259277344, "step": 1748} +{"info/global_step": 1749, "train_info/time_within_train_step": 2.6732866764068604, "step": 1749} +{"train_info/time_between_train_steps": 0.0035147666931152344, "step": 1749} +{"info/global_step": 1750, "train_info/time_within_train_step": 3.250312089920044, "step": 1750} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746208254, "_runtime": 5026}, "step": 1750} +{"logs": {"train/loss": 4.2348, "train/learning_rate": 0.0002777777777777778, "train/epoch": 2.01, "_timestamp": 1746208254, "_runtime": 5026}, "step": 1750} +{"train_info/time_between_train_steps": 0.025243043899536133, "step": 1750} +{"info/global_step": 1751, "train_info/time_within_train_step": 2.671491861343384, "step": 1751} +{"train_info/time_between_train_steps": 0.0034322738647460938, "step": 1751} +{"info/global_step": 1752, "train_info/time_within_train_step": 2.6713058948516846, "step": 1752} +{"train_info/time_between_train_steps": 0.0034711360931396484, "step": 1752} +{"info/global_step": 1753, "train_info/time_within_train_step": 2.6718671321868896, "step": 1753} +{"train_info/time_between_train_steps": 0.003452777862548828, "step": 1753} +{"info/global_step": 1754, "train_info/time_within_train_step": 2.6721034049987793, "step": 1754} +{"train_info/time_between_train_steps": 0.003565073013305664, "step": 1754} +{"info/global_step": 1755, "train_info/time_within_train_step": 2.6718461513519287, "step": 1755} +{"train_info/time_between_train_steps": 0.0035233497619628906, "step": 1755} +{"info/global_step": 1756, "train_info/time_within_train_step": 2.671767234802246, "step": 1756} +{"train_info/time_between_train_steps": 0.005029201507568359, "step": 1756} +{"info/global_step": 1757, "train_info/time_within_train_step": 2.6731154918670654, "step": 1757} +{"train_info/time_between_train_steps": 0.0035238265991210938, "step": 1757} +{"info/global_step": 1758, "train_info/time_within_train_step": 2.673306465148926, "step": 1758} +{"train_info/time_between_train_steps": 0.0035758018493652344, "step": 1758} +{"info/global_step": 1759, "train_info/time_within_train_step": 2.6727285385131836, "step": 1759} +{"train_info/time_between_train_steps": 0.003499746322631836, "step": 1759} +{"info/global_step": 1760, "train_info/time_within_train_step": 2.6734201908111572, "step": 1760} +{"train_info/time_between_train_steps": 0.0035970211029052734, "step": 1760} +{"info/global_step": 1761, "train_info/time_within_train_step": 2.6735823154449463, "step": 1761} +{"train_info/time_between_train_steps": 0.003469705581665039, "step": 1761} +{"info/global_step": 1762, "train_info/time_within_train_step": 2.672016143798828, "step": 1762} +{"train_info/time_between_train_steps": 0.0035555362701416016, "step": 1762} +{"info/global_step": 1763, "train_info/time_within_train_step": 2.6732380390167236, "step": 1763} +{"train_info/time_between_train_steps": 0.003518342971801758, "step": 1763} +{"info/global_step": 1764, "train_info/time_within_train_step": 2.6742641925811768, "step": 1764} +{"train_info/time_between_train_steps": 0.0034558773040771484, "step": 1764} +{"info/global_step": 1765, "train_info/time_within_train_step": 2.6734464168548584, "step": 1765} +{"train_info/time_between_train_steps": 0.0035254955291748047, "step": 1765} +{"info/global_step": 1766, "train_info/time_within_train_step": 2.6728758811950684, "step": 1766} +{"train_info/time_between_train_steps": 0.003506898880004883, "step": 1766} +{"info/global_step": 1767, "train_info/time_within_train_step": 2.672232151031494, "step": 1767} +{"train_info/time_between_train_steps": 0.0034906864166259766, "step": 1767} +{"info/global_step": 1768, "train_info/time_within_train_step": 2.6742300987243652, "step": 1768} +{"train_info/time_between_train_steps": 0.0035398006439208984, "step": 1768} +{"info/global_step": 1769, "train_info/time_within_train_step": 2.6722559928894043, "step": 1769} +{"train_info/time_between_train_steps": 0.003442525863647461, "step": 1769} +{"info/global_step": 1770, "train_info/time_within_train_step": 2.673048734664917, "step": 1770} +{"train_info/time_between_train_steps": 0.003488779067993164, "step": 1770} +{"info/global_step": 1771, "train_info/time_within_train_step": 2.6725049018859863, "step": 1771} +{"train_info/time_between_train_steps": 0.003503561019897461, "step": 1771} +{"info/global_step": 1772, "train_info/time_within_train_step": 2.67244291305542, "step": 1772} +{"train_info/time_between_train_steps": 0.0035021305084228516, "step": 1772} +{"info/global_step": 1773, "train_info/time_within_train_step": 2.672450542449951, "step": 1773} +{"train_info/time_between_train_steps": 0.003502368927001953, "step": 1773} +{"info/global_step": 1774, "train_info/time_within_train_step": 2.673257350921631, "step": 1774} +{"train_info/time_between_train_steps": 0.0034983158111572266, "step": 1774} +{"info/global_step": 1775, "train_info/time_within_train_step": 2.6741113662719727, "step": 1775} +{"train_info/time_between_train_steps": 0.003552675247192383, "step": 1775} +{"info/global_step": 1776, "train_info/time_within_train_step": 2.673001766204834, "step": 1776} +{"train_info/time_between_train_steps": 0.003528118133544922, "step": 1776} +{"info/global_step": 1777, "train_info/time_within_train_step": 2.673956871032715, "step": 1777} +{"train_info/time_between_train_steps": 0.003518342971801758, "step": 1777} +{"info/global_step": 1778, "train_info/time_within_train_step": 2.675250291824341, "step": 1778} +{"train_info/time_between_train_steps": 0.0035436153411865234, "step": 1778} +{"info/global_step": 1779, "train_info/time_within_train_step": 2.67558217048645, "step": 1779} +{"train_info/time_between_train_steps": 0.0034711360931396484, "step": 1779} +{"info/global_step": 1780, "train_info/time_within_train_step": 2.6742212772369385, "step": 1780} +{"train_info/time_between_train_steps": 0.00412440299987793, "step": 1780} +{"info/global_step": 1781, "train_info/time_within_train_step": 2.673421859741211, "step": 1781} +{"train_info/time_between_train_steps": 0.003501415252685547, "step": 1781} +{"info/global_step": 1782, "train_info/time_within_train_step": 2.673938035964966, "step": 1782} +{"train_info/time_between_train_steps": 0.0034847259521484375, "step": 1782} +{"info/global_step": 1783, "train_info/time_within_train_step": 2.9901201725006104, "step": 1783} +{"train_info/time_between_train_steps": 0.003348827362060547, "step": 1783} +{"info/global_step": 1784, "train_info/time_within_train_step": 2.6769702434539795, "step": 1784} +{"train_info/time_between_train_steps": 0.003269672393798828, "step": 1784} +{"info/global_step": 1785, "train_info/time_within_train_step": 2.6724112033843994, "step": 1785} +{"train_info/time_between_train_steps": 0.003282308578491211, "step": 1785} +{"info/global_step": 1786, "train_info/time_within_train_step": 2.6716761589050293, "step": 1786} +{"train_info/time_between_train_steps": 0.003252744674682617, "step": 1786} +{"info/global_step": 1787, "train_info/time_within_train_step": 2.671795606613159, "step": 1787} +{"train_info/time_between_train_steps": 0.003275632858276367, "step": 1787} +{"info/global_step": 1788, "train_info/time_within_train_step": 2.671426773071289, "step": 1788} +{"train_info/time_between_train_steps": 0.003230571746826172, "step": 1788} +{"info/global_step": 1789, "train_info/time_within_train_step": 2.672689199447632, "step": 1789} +{"train_info/time_between_train_steps": 0.003256082534790039, "step": 1789} +{"info/global_step": 1790, "train_info/time_within_train_step": 2.672495126724243, "step": 1790} +{"train_info/time_between_train_steps": 0.004463911056518555, "step": 1790} +{"info/global_step": 1791, "train_info/time_within_train_step": 2.8393142223358154, "step": 1791} +{"train_info/time_between_train_steps": 0.0033626556396484375, "step": 1791} +{"info/global_step": 1792, "train_info/time_within_train_step": 2.6726346015930176, "step": 1792} +{"train_info/time_between_train_steps": 0.0033431053161621094, "step": 1792} +{"info/global_step": 1793, "train_info/time_within_train_step": 2.6721086502075195, "step": 1793} +{"train_info/time_between_train_steps": 0.003353118896484375, "step": 1793} +{"info/global_step": 1794, "train_info/time_within_train_step": 2.673673152923584, "step": 1794} +{"train_info/time_between_train_steps": 0.003332853317260742, "step": 1794} +{"info/global_step": 1795, "train_info/time_within_train_step": 2.672344207763672, "step": 1795} +{"train_info/time_between_train_steps": 0.0033342838287353516, "step": 1795} +{"info/global_step": 1796, "train_info/time_within_train_step": 2.672569513320923, "step": 1796} +{"train_info/time_between_train_steps": 0.003286123275756836, "step": 1796} +{"info/global_step": 1797, "train_info/time_within_train_step": 2.6725447177886963, "step": 1797} +{"train_info/time_between_train_steps": 0.0033469200134277344, "step": 1797} +{"info/global_step": 1798, "train_info/time_within_train_step": 2.6728267669677734, "step": 1798} +{"train_info/time_between_train_steps": 0.003417491912841797, "step": 1798} +{"info/global_step": 1799, "train_info/time_within_train_step": 2.672259569168091, "step": 1799} +{"train_info/time_between_train_steps": 0.003306865692138672, "step": 1799} +{"info/global_step": 1800, "train_info/time_within_train_step": 2.672694206237793, "step": 1800} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746208389, "_runtime": 5161}, "step": 1800} +{"logs": {"train/loss": 4.1786, "train/learning_rate": 0.0002666666666666666, "train/epoch": 2.02, "_timestamp": 1746208389, "_runtime": 5161}, "step": 1800} +{"train_info/time_between_train_steps": 14.369325399398804, "step": 1800} +{"info/global_step": 1801, "train_info/time_within_train_step": 2.4726181030273438, "step": 1801} +{"train_info/time_between_train_steps": 0.003348112106323242, "step": 1801} +{"info/global_step": 1802, "train_info/time_within_train_step": 2.4581384658813477, "step": 1802} +{"train_info/time_between_train_steps": 0.003390789031982422, "step": 1802} +{"info/global_step": 1803, "train_info/time_within_train_step": 2.4597110748291016, "step": 1803} +{"train_info/time_between_train_steps": 0.0035543441772460938, "step": 1803} +{"info/global_step": 1804, "train_info/time_within_train_step": 2.6377081871032715, "step": 1804} +{"train_info/time_between_train_steps": 0.0035560131072998047, "step": 1804} +{"info/global_step": 1805, "train_info/time_within_train_step": 2.6752681732177734, "step": 1805} +{"train_info/time_between_train_steps": 0.0038726329803466797, "step": 1805} +{"info/global_step": 1806, "train_info/time_within_train_step": 2.676447868347168, "step": 1806} +{"train_info/time_between_train_steps": 0.0037491321563720703, "step": 1806} +{"info/global_step": 1807, "train_info/time_within_train_step": 2.673240900039673, "step": 1807} +{"train_info/time_between_train_steps": 0.0037147998809814453, "step": 1807} +{"info/global_step": 1808, "train_info/time_within_train_step": 2.673767566680908, "step": 1808} +{"train_info/time_between_train_steps": 0.0037322044372558594, "step": 1808} +{"info/global_step": 1809, "train_info/time_within_train_step": 2.6729907989501953, "step": 1809} +{"train_info/time_between_train_steps": 0.0035736560821533203, "step": 1809} +{"info/global_step": 1810, "train_info/time_within_train_step": 2.6729865074157715, "step": 1810} +{"train_info/time_between_train_steps": 0.0035173892974853516, "step": 1810} +{"info/global_step": 1811, "train_info/time_within_train_step": 2.674133539199829, "step": 1811} +{"train_info/time_between_train_steps": 0.0035359859466552734, "step": 1811} +{"info/global_step": 1812, "train_info/time_within_train_step": 2.6730356216430664, "step": 1812} +{"train_info/time_between_train_steps": 0.003610372543334961, "step": 1812} +{"info/global_step": 1813, "train_info/time_within_train_step": 2.6754555702209473, "step": 1813} +{"train_info/time_between_train_steps": 0.003676891326904297, "step": 1813} +{"info/global_step": 1814, "train_info/time_within_train_step": 2.6772234439849854, "step": 1814} +{"train_info/time_between_train_steps": 0.0038979053497314453, "step": 1814} +{"info/global_step": 1815, "train_info/time_within_train_step": 2.676302671432495, "step": 1815} +{"train_info/time_between_train_steps": 0.0037376880645751953, "step": 1815} +{"info/global_step": 1816, "train_info/time_within_train_step": 2.6758975982666016, "step": 1816} +{"train_info/time_between_train_steps": 0.0037136077880859375, "step": 1816} +{"info/global_step": 1817, "train_info/time_within_train_step": 2.6750409603118896, "step": 1817} +{"train_info/time_between_train_steps": 0.003737926483154297, "step": 1817} +{"info/global_step": 1818, "train_info/time_within_train_step": 2.6759564876556396, "step": 1818} +{"train_info/time_between_train_steps": 0.0037713050842285156, "step": 1818} +{"info/global_step": 1819, "train_info/time_within_train_step": 2.6764602661132812, "step": 1819} +{"train_info/time_between_train_steps": 0.0037186145782470703, "step": 1819} +{"info/global_step": 1820, "train_info/time_within_train_step": 2.677872896194458, "step": 1820} +{"train_info/time_between_train_steps": 0.003686666488647461, "step": 1820} +{"info/global_step": 1821, "train_info/time_within_train_step": 2.6745269298553467, "step": 1821} +{"train_info/time_between_train_steps": 0.0037186145782470703, "step": 1821} +{"info/global_step": 1822, "train_info/time_within_train_step": 2.6756491661071777, "step": 1822} +{"train_info/time_between_train_steps": 0.0036773681640625, "step": 1822} +{"info/global_step": 1823, "train_info/time_within_train_step": 2.6744558811187744, "step": 1823} +{"train_info/time_between_train_steps": 0.00370025634765625, "step": 1823} +{"info/global_step": 1824, "train_info/time_within_train_step": 2.675363779067993, "step": 1824} +{"train_info/time_between_train_steps": 0.0037202835083007812, "step": 1824} +{"info/global_step": 1825, "train_info/time_within_train_step": 2.6749048233032227, "step": 1825} +{"train_info/time_between_train_steps": 0.003711223602294922, "step": 1825} +{"info/global_step": 1826, "train_info/time_within_train_step": 2.676234483718872, "step": 1826} +{"train_info/time_between_train_steps": 0.0038068294525146484, "step": 1826} +{"info/global_step": 1827, "train_info/time_within_train_step": 2.675028085708618, "step": 1827} +{"train_info/time_between_train_steps": 0.0037050247192382812, "step": 1827} +{"info/global_step": 1828, "train_info/time_within_train_step": 2.6761314868927, "step": 1828} +{"train_info/time_between_train_steps": 0.0037031173706054688, "step": 1828} +{"info/global_step": 1829, "train_info/time_within_train_step": 2.6755244731903076, "step": 1829} +{"train_info/time_between_train_steps": 0.0036783218383789062, "step": 1829} +{"info/global_step": 1830, "train_info/time_within_train_step": 2.6753718852996826, "step": 1830} +{"train_info/time_between_train_steps": 0.003668069839477539, "step": 1830} +{"info/global_step": 1831, "train_info/time_within_train_step": 2.6762754917144775, "step": 1831} +{"train_info/time_between_train_steps": 0.0036575794219970703, "step": 1831} +{"info/global_step": 1832, "train_info/time_within_train_step": 2.675424575805664, "step": 1832} +{"train_info/time_between_train_steps": 0.0036776065826416016, "step": 1832} +{"info/global_step": 1833, "train_info/time_within_train_step": 2.674996852874756, "step": 1833} +{"train_info/time_between_train_steps": 0.0036733150482177734, "step": 1833} +{"info/global_step": 1834, "train_info/time_within_train_step": 2.67399263381958, "step": 1834} +{"train_info/time_between_train_steps": 0.003706216812133789, "step": 1834} +{"info/global_step": 1835, "train_info/time_within_train_step": 2.67688250541687, "step": 1835} +{"train_info/time_between_train_steps": 0.004011869430541992, "step": 1835} +{"info/global_step": 1836, "train_info/time_within_train_step": 2.675950765609741, "step": 1836} +{"train_info/time_between_train_steps": 0.0036733150482177734, "step": 1836} +{"info/global_step": 1837, "train_info/time_within_train_step": 2.673780918121338, "step": 1837} +{"train_info/time_between_train_steps": 0.0036797523498535156, "step": 1837} +{"info/global_step": 1838, "train_info/time_within_train_step": 2.673861503601074, "step": 1838} +{"train_info/time_between_train_steps": 0.003750324249267578, "step": 1838} +{"info/global_step": 1839, "train_info/time_within_train_step": 2.6746184825897217, "step": 1839} +{"train_info/time_between_train_steps": 0.0036656856536865234, "step": 1839} +{"info/global_step": 1840, "train_info/time_within_train_step": 2.6750450134277344, "step": 1840} +{"train_info/time_between_train_steps": 0.0036764144897460938, "step": 1840} +{"info/global_step": 1841, "train_info/time_within_train_step": 2.6745309829711914, "step": 1841} +{"train_info/time_between_train_steps": 0.0036513805389404297, "step": 1841} +{"info/global_step": 1842, "train_info/time_within_train_step": 2.6742749214172363, "step": 1842} +{"train_info/time_between_train_steps": 0.0036725997924804688, "step": 1842} +{"info/global_step": 1843, "train_info/time_within_train_step": 2.6756060123443604, "step": 1843} +{"train_info/time_between_train_steps": 0.0037338733673095703, "step": 1843} +{"info/global_step": 1844, "train_info/time_within_train_step": 2.67478609085083, "step": 1844} +{"train_info/time_between_train_steps": 0.003662109375, "step": 1844} +{"info/global_step": 1845, "train_info/time_within_train_step": 2.6748697757720947, "step": 1845} +{"train_info/time_between_train_steps": 0.0038514137268066406, "step": 1845} +{"info/global_step": 1846, "train_info/time_within_train_step": 2.6736996173858643, "step": 1846} +{"train_info/time_between_train_steps": 0.0035207271575927734, "step": 1846} +{"info/global_step": 1847, "train_info/time_within_train_step": 2.671523332595825, "step": 1847} +{"train_info/time_between_train_steps": 0.0035080909729003906, "step": 1847} +{"info/global_step": 1848, "train_info/time_within_train_step": 2.672140121459961, "step": 1848} +{"train_info/time_between_train_steps": 0.0034651756286621094, "step": 1848} +{"info/global_step": 1849, "train_info/time_within_train_step": 2.67248272895813, "step": 1849} +{"train_info/time_between_train_steps": 0.0035676956176757812, "step": 1849} +{"info/global_step": 1850, "train_info/time_within_train_step": 2.674370765686035, "step": 1850} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746208538, "_runtime": 5310}, "step": 1850} +{"logs": {"train/loss": 4.1702, "train/learning_rate": 0.00025555555555555553, "train/epoch": 2.04, "_timestamp": 1746208538, "_runtime": 5310}, "step": 1850} +{"train_info/time_between_train_steps": 0.025768280029296875, "step": 1850} +{"info/global_step": 1851, "train_info/time_within_train_step": 2.674462080001831, "step": 1851} +{"train_info/time_between_train_steps": 0.003672361373901367, "step": 1851} +{"info/global_step": 1852, "train_info/time_within_train_step": 2.6739652156829834, "step": 1852} +{"train_info/time_between_train_steps": 0.003643035888671875, "step": 1852} +{"info/global_step": 1853, "train_info/time_within_train_step": 2.67290997505188, "step": 1853} +{"train_info/time_between_train_steps": 0.21445631980895996, "step": 1853} +{"info/global_step": 1854, "train_info/time_within_train_step": 2.6724441051483154, "step": 1854} +{"train_info/time_between_train_steps": 0.004131793975830078, "step": 1854} +{"info/global_step": 1855, "train_info/time_within_train_step": 2.673457384109497, "step": 1855} +{"train_info/time_between_train_steps": 0.0034651756286621094, "step": 1855} +{"info/global_step": 1856, "train_info/time_within_train_step": 3.0600225925445557, "step": 1856} +{"train_info/time_between_train_steps": 0.0037200450897216797, "step": 1856} +{"info/global_step": 1857, "train_info/time_within_train_step": 2.674454689025879, "step": 1857} +{"train_info/time_between_train_steps": 0.003656148910522461, "step": 1857} +{"info/global_step": 1858, "train_info/time_within_train_step": 2.6727700233459473, "step": 1858} +{"train_info/time_between_train_steps": 0.0036423206329345703, "step": 1858} +{"info/global_step": 1859, "train_info/time_within_train_step": 2.672903060913086, "step": 1859} +{"train_info/time_between_train_steps": 0.003690481185913086, "step": 1859} +{"info/global_step": 1860, "train_info/time_within_train_step": 2.672314405441284, "step": 1860} +{"train_info/time_between_train_steps": 0.0036573410034179688, "step": 1860} +{"info/global_step": 1861, "train_info/time_within_train_step": 2.6724627017974854, "step": 1861} +{"train_info/time_between_train_steps": 0.0037546157836914062, "step": 1861} +{"info/global_step": 1862, "train_info/time_within_train_step": 2.6717169284820557, "step": 1862} +{"train_info/time_between_train_steps": 0.003743410110473633, "step": 1862} +{"info/global_step": 1863, "train_info/time_within_train_step": 2.6738944053649902, "step": 1863} +{"train_info/time_between_train_steps": 0.0036673545837402344, "step": 1863} +{"info/global_step": 1864, "train_info/time_within_train_step": 2.6726090908050537, "step": 1864} +{"train_info/time_between_train_steps": 0.0035965442657470703, "step": 1864} +{"info/global_step": 1865, "train_info/time_within_train_step": 2.6737656593322754, "step": 1865} +{"train_info/time_between_train_steps": 0.0036869049072265625, "step": 1865} +{"info/global_step": 1866, "train_info/time_within_train_step": 2.673335075378418, "step": 1866} +{"train_info/time_between_train_steps": 0.003648996353149414, "step": 1866} +{"info/global_step": 1867, "train_info/time_within_train_step": 2.672816514968872, "step": 1867} +{"train_info/time_between_train_steps": 0.0036683082580566406, "step": 1867} +{"info/global_step": 1868, "train_info/time_within_train_step": 2.672778367996216, "step": 1868} +{"train_info/time_between_train_steps": 0.0037078857421875, "step": 1868} +{"info/global_step": 1869, "train_info/time_within_train_step": 2.673670530319214, "step": 1869} +{"train_info/time_between_train_steps": 0.0036995410919189453, "step": 1869} +{"info/global_step": 1870, "train_info/time_within_train_step": 2.67498779296875, "step": 1870} +{"train_info/time_between_train_steps": 0.0037331581115722656, "step": 1870} +{"info/global_step": 1871, "train_info/time_within_train_step": 2.675424814224243, "step": 1871} +{"train_info/time_between_train_steps": 0.0037469863891601562, "step": 1871} +{"info/global_step": 1872, "train_info/time_within_train_step": 2.6747324466705322, "step": 1872} +{"train_info/time_between_train_steps": 0.0036478042602539062, "step": 1872} +{"info/global_step": 1873, "train_info/time_within_train_step": 2.6746768951416016, "step": 1873} +{"train_info/time_between_train_steps": 0.003808736801147461, "step": 1873} +{"info/global_step": 1874, "train_info/time_within_train_step": 2.6752853393554688, "step": 1874} +{"train_info/time_between_train_steps": 0.0037822723388671875, "step": 1874} +{"info/global_step": 1875, "train_info/time_within_train_step": 2.6757724285125732, "step": 1875} +{"train_info/time_between_train_steps": 0.0038356781005859375, "step": 1875} +{"info/global_step": 1876, "train_info/time_within_train_step": 2.6752195358276367, "step": 1876} +{"train_info/time_between_train_steps": 0.003911018371582031, "step": 1876} +{"info/global_step": 1877, "train_info/time_within_train_step": 2.674410820007324, "step": 1877} +{"train_info/time_between_train_steps": 0.004110813140869141, "step": 1877} +{"info/global_step": 1878, "train_info/time_within_train_step": 2.6742441654205322, "step": 1878} +{"train_info/time_between_train_steps": 0.003911256790161133, "step": 1878} +{"info/global_step": 1879, "train_info/time_within_train_step": 2.6723875999450684, "step": 1879} +{"train_info/time_between_train_steps": 0.0039789676666259766, "step": 1879} +{"info/global_step": 1880, "train_info/time_within_train_step": 2.674374580383301, "step": 1880} +{"train_info/time_between_train_steps": 0.003943920135498047, "step": 1880} +{"info/global_step": 1881, "train_info/time_within_train_step": 2.6749331951141357, "step": 1881} +{"train_info/time_between_train_steps": 0.003779172897338867, "step": 1881} +{"info/global_step": 1882, "train_info/time_within_train_step": 2.676703453063965, "step": 1882} +{"train_info/time_between_train_steps": 0.0037689208984375, "step": 1882} +{"info/global_step": 1883, "train_info/time_within_train_step": 2.6733007431030273, "step": 1883} +{"train_info/time_between_train_steps": 0.0036857128143310547, "step": 1883} +{"info/global_step": 1884, "train_info/time_within_train_step": 2.6738548278808594, "step": 1884} +{"train_info/time_between_train_steps": 0.0036313533782958984, "step": 1884} +{"info/global_step": 1885, "train_info/time_within_train_step": 2.6739466190338135, "step": 1885} +{"train_info/time_between_train_steps": 0.0037360191345214844, "step": 1885} +{"info/global_step": 1886, "train_info/time_within_train_step": 2.673525333404541, "step": 1886} +{"train_info/time_between_train_steps": 0.004397153854370117, "step": 1886} +{"info/global_step": 1887, "train_info/time_within_train_step": 2.6718838214874268, "step": 1887} +{"train_info/time_between_train_steps": 0.0036954879760742188, "step": 1887} +{"info/global_step": 1888, "train_info/time_within_train_step": 2.672926425933838, "step": 1888} +{"train_info/time_between_train_steps": 0.0037178993225097656, "step": 1888} +{"info/global_step": 1889, "train_info/time_within_train_step": 2.6732447147369385, "step": 1889} +{"train_info/time_between_train_steps": 0.0038297176361083984, "step": 1889} +{"info/global_step": 1890, "train_info/time_within_train_step": 2.677532911300659, "step": 1890} +{"train_info/time_between_train_steps": 0.0035736560821533203, "step": 1890} +{"info/global_step": 1891, "train_info/time_within_train_step": 2.6718878746032715, "step": 1891} +{"train_info/time_between_train_steps": 0.0036818981170654297, "step": 1891} +{"info/global_step": 1892, "train_info/time_within_train_step": 2.6719822883605957, "step": 1892} +{"train_info/time_between_train_steps": 0.0035626888275146484, "step": 1892} +{"info/global_step": 1893, "train_info/time_within_train_step": 2.671816110610962, "step": 1893} +{"train_info/time_between_train_steps": 0.0035300254821777344, "step": 1893} +{"info/global_step": 1894, "train_info/time_within_train_step": 2.6746842861175537, "step": 1894} +{"train_info/time_between_train_steps": 0.0038459300994873047, "step": 1894} +{"info/global_step": 1895, "train_info/time_within_train_step": 2.673978328704834, "step": 1895} +{"train_info/time_between_train_steps": 0.0036385059356689453, "step": 1895} +{"info/global_step": 1896, "train_info/time_within_train_step": 2.6723833084106445, "step": 1896} +{"train_info/time_between_train_steps": 0.003643512725830078, "step": 1896} +{"info/global_step": 1897, "train_info/time_within_train_step": 2.673449993133545, "step": 1897} +{"train_info/time_between_train_steps": 0.0035812854766845703, "step": 1897} +{"info/global_step": 1898, "train_info/time_within_train_step": 2.673583984375, "step": 1898} +{"train_info/time_between_train_steps": 0.0036280155181884766, "step": 1898} +{"info/global_step": 1899, "train_info/time_within_train_step": 2.674617052078247, "step": 1899} +{"train_info/time_between_train_steps": 0.0036585330963134766, "step": 1899} +{"info/global_step": 1900, "train_info/time_within_train_step": 2.674501657485962, "step": 1900} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746208674, "_runtime": 5446}, "step": 1900} +{"logs": {"train/loss": 4.1602, "train/learning_rate": 0.00024444444444444443, "train/epoch": 2.06, "_timestamp": 1746208674, "_runtime": 5446}, "step": 1900} +{"train_info/time_between_train_steps": 12.873475074768066, "step": 1900} +{"info/global_step": 1901, "train_info/time_within_train_step": 2.4765872955322266, "step": 1901} +{"train_info/time_between_train_steps": 0.0034503936767578125, "step": 1901} +{"info/global_step": 1902, "train_info/time_within_train_step": 2.457956075668335, "step": 1902} +{"train_info/time_between_train_steps": 0.003496408462524414, "step": 1902} +{"info/global_step": 1903, "train_info/time_within_train_step": 2.470698595046997, "step": 1903} +{"train_info/time_between_train_steps": 0.0035402774810791016, "step": 1903} +{"info/global_step": 1904, "train_info/time_within_train_step": 2.6517393589019775, "step": 1904} +{"train_info/time_between_train_steps": 0.003725290298461914, "step": 1904} +{"info/global_step": 1905, "train_info/time_within_train_step": 2.6704483032226562, "step": 1905} +{"train_info/time_between_train_steps": 0.003520965576171875, "step": 1905} +{"info/global_step": 1906, "train_info/time_within_train_step": 3.0593109130859375, "step": 1906} +{"train_info/time_between_train_steps": 0.0033707618713378906, "step": 1906} +{"info/global_step": 1907, "train_info/time_within_train_step": 2.670971155166626, "step": 1907} +{"train_info/time_between_train_steps": 0.0033211708068847656, "step": 1907} +{"info/global_step": 1908, "train_info/time_within_train_step": 2.671356678009033, "step": 1908} +{"train_info/time_between_train_steps": 0.0032846927642822266, "step": 1908} +{"info/global_step": 1909, "train_info/time_within_train_step": 2.6729846000671387, "step": 1909} +{"train_info/time_between_train_steps": 0.003292083740234375, "step": 1909} +{"info/global_step": 1910, "train_info/time_within_train_step": 2.6738715171813965, "step": 1910} +{"train_info/time_between_train_steps": 0.0035202503204345703, "step": 1910} +{"info/global_step": 1911, "train_info/time_within_train_step": 2.6819510459899902, "step": 1911} +{"train_info/time_between_train_steps": 0.003469228744506836, "step": 1911} +{"info/global_step": 1912, "train_info/time_within_train_step": 2.6759607791900635, "step": 1912} +{"train_info/time_between_train_steps": 0.005876779556274414, "step": 1912} +{"info/global_step": 1913, "train_info/time_within_train_step": 2.6758625507354736, "step": 1913} +{"train_info/time_between_train_steps": 0.0038084983825683594, "step": 1913} +{"info/global_step": 1914, "train_info/time_within_train_step": 2.676805257797241, "step": 1914} +{"train_info/time_between_train_steps": 0.003804445266723633, "step": 1914} +{"info/global_step": 1915, "train_info/time_within_train_step": 2.677062749862671, "step": 1915} +{"train_info/time_between_train_steps": 0.0037679672241210938, "step": 1915} +{"info/global_step": 1916, "train_info/time_within_train_step": 2.8769726753234863, "step": 1916} +{"train_info/time_between_train_steps": 0.0035741329193115234, "step": 1916} +{"info/global_step": 1917, "train_info/time_within_train_step": 2.6751010417938232, "step": 1917} +{"train_info/time_between_train_steps": 0.0035300254821777344, "step": 1917} +{"info/global_step": 1918, "train_info/time_within_train_step": 2.675166368484497, "step": 1918} +{"train_info/time_between_train_steps": 0.003545999526977539, "step": 1918} +{"info/global_step": 1919, "train_info/time_within_train_step": 2.677932024002075, "step": 1919} +{"train_info/time_between_train_steps": 0.0035271644592285156, "step": 1919} +{"info/global_step": 1920, "train_info/time_within_train_step": 2.674867868423462, "step": 1920} +{"train_info/time_between_train_steps": 0.0035223960876464844, "step": 1920} +{"info/global_step": 1921, "train_info/time_within_train_step": 2.675781011581421, "step": 1921} +{"train_info/time_between_train_steps": 0.0034804344177246094, "step": 1921} +{"info/global_step": 1922, "train_info/time_within_train_step": 2.6756720542907715, "step": 1922} +{"train_info/time_between_train_steps": 0.0035092830657958984, "step": 1922} +{"info/global_step": 1923, "train_info/time_within_train_step": 2.675942897796631, "step": 1923} +{"train_info/time_between_train_steps": 0.003519296646118164, "step": 1923} +{"info/global_step": 1924, "train_info/time_within_train_step": 2.6751341819763184, "step": 1924} +{"train_info/time_between_train_steps": 0.0035309791564941406, "step": 1924} +{"info/global_step": 1925, "train_info/time_within_train_step": 2.6744284629821777, "step": 1925} +{"train_info/time_between_train_steps": 0.0035762786865234375, "step": 1925} +{"info/global_step": 1926, "train_info/time_within_train_step": 2.673340082168579, "step": 1926} +{"train_info/time_between_train_steps": 0.0034995079040527344, "step": 1926} +{"info/global_step": 1927, "train_info/time_within_train_step": 2.675367593765259, "step": 1927} +{"train_info/time_between_train_steps": 0.0035452842712402344, "step": 1927} +{"info/global_step": 1928, "train_info/time_within_train_step": 2.675302028656006, "step": 1928} +{"train_info/time_between_train_steps": 0.003720998764038086, "step": 1928} +{"info/global_step": 1929, "train_info/time_within_train_step": 2.6781163215637207, "step": 1929} +{"train_info/time_between_train_steps": 0.003627300262451172, "step": 1929} +{"info/global_step": 1930, "train_info/time_within_train_step": 2.6767799854278564, "step": 1930} +{"train_info/time_between_train_steps": 0.0035512447357177734, "step": 1930} +{"info/global_step": 1931, "train_info/time_within_train_step": 2.674482583999634, "step": 1931} +{"train_info/time_between_train_steps": 0.0034301280975341797, "step": 1931} +{"info/global_step": 1932, "train_info/time_within_train_step": 2.673663854598999, "step": 1932} +{"train_info/time_between_train_steps": 0.00362396240234375, "step": 1932} +{"info/global_step": 1933, "train_info/time_within_train_step": 2.675368309020996, "step": 1933} +{"train_info/time_between_train_steps": 0.0036537647247314453, "step": 1933} +{"info/global_step": 1934, "train_info/time_within_train_step": 2.6753432750701904, "step": 1934} +{"train_info/time_between_train_steps": 0.0034999847412109375, "step": 1934} +{"info/global_step": 1935, "train_info/time_within_train_step": 2.675464153289795, "step": 1935} +{"train_info/time_between_train_steps": 0.003742694854736328, "step": 1935} +{"info/global_step": 1936, "train_info/time_within_train_step": 2.6773312091827393, "step": 1936} +{"train_info/time_between_train_steps": 0.0036704540252685547, "step": 1936} +{"info/global_step": 1937, "train_info/time_within_train_step": 2.677290439605713, "step": 1937} +{"train_info/time_between_train_steps": 0.003641843795776367, "step": 1937} +{"info/global_step": 1938, "train_info/time_within_train_step": 2.6760401725769043, "step": 1938} +{"train_info/time_between_train_steps": 0.0035049915313720703, "step": 1938} +{"info/global_step": 1939, "train_info/time_within_train_step": 2.6765618324279785, "step": 1939} +{"train_info/time_between_train_steps": 0.003492593765258789, "step": 1939} +{"info/global_step": 1940, "train_info/time_within_train_step": 2.677536725997925, "step": 1940} +{"train_info/time_between_train_steps": 0.0036165714263916016, "step": 1940} +{"info/global_step": 1941, "train_info/time_within_train_step": 2.6760387420654297, "step": 1941} +{"train_info/time_between_train_steps": 0.003683328628540039, "step": 1941} +{"info/global_step": 1942, "train_info/time_within_train_step": 2.6747443675994873, "step": 1942} +{"train_info/time_between_train_steps": 0.0036575794219970703, "step": 1942} +{"info/global_step": 1943, "train_info/time_within_train_step": 2.675290584564209, "step": 1943} +{"train_info/time_between_train_steps": 0.0035927295684814453, "step": 1943} +{"info/global_step": 1944, "train_info/time_within_train_step": 2.6759674549102783, "step": 1944} +{"train_info/time_between_train_steps": 0.0035643577575683594, "step": 1944} +{"info/global_step": 1945, "train_info/time_within_train_step": 3.09519624710083, "step": 1945} +{"train_info/time_between_train_steps": 0.0033152103424072266, "step": 1945} +{"info/global_step": 1946, "train_info/time_within_train_step": 2.673001766204834, "step": 1946} +{"train_info/time_between_train_steps": 0.0033185482025146484, "step": 1946} +{"info/global_step": 1947, "train_info/time_within_train_step": 2.6718719005584717, "step": 1947} +{"train_info/time_between_train_steps": 0.003270387649536133, "step": 1947} +{"info/global_step": 1948, "train_info/time_within_train_step": 2.672412157058716, "step": 1948} +{"train_info/time_between_train_steps": 0.003255128860473633, "step": 1948} +{"info/global_step": 1949, "train_info/time_within_train_step": 2.6727001667022705, "step": 1949} +{"train_info/time_between_train_steps": 0.0032515525817871094, "step": 1949} +{"info/global_step": 1950, "train_info/time_within_train_step": 2.673935890197754, "step": 1950} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746208822, "_runtime": 5594}, "step": 1950} +{"logs": {"train/loss": 4.1409, "train/learning_rate": 0.0002333333333333333, "train/epoch": 2.07, "_timestamp": 1746208822, "_runtime": 5594}, "step": 1950} +{"train_info/time_between_train_steps": 0.024290084838867188, "step": 1950} +{"info/global_step": 1951, "train_info/time_within_train_step": 2.6732258796691895, "step": 1951} +{"train_info/time_between_train_steps": 0.003927469253540039, "step": 1951} +{"info/global_step": 1952, "train_info/time_within_train_step": 2.6721367835998535, "step": 1952} +{"train_info/time_between_train_steps": 0.003243684768676758, "step": 1952} +{"info/global_step": 1953, "train_info/time_within_train_step": 2.6723875999450684, "step": 1953} +{"train_info/time_between_train_steps": 0.003292560577392578, "step": 1953} +{"info/global_step": 1954, "train_info/time_within_train_step": 2.6727938652038574, "step": 1954} +{"train_info/time_between_train_steps": 0.0032851696014404297, "step": 1954} +{"info/global_step": 1955, "train_info/time_within_train_step": 2.672611713409424, "step": 1955} +{"train_info/time_between_train_steps": 0.0033025741577148438, "step": 1955} +{"info/global_step": 1956, "train_info/time_within_train_step": 2.6768839359283447, "step": 1956} +{"train_info/time_between_train_steps": 0.0033278465270996094, "step": 1956} +{"info/global_step": 1957, "train_info/time_within_train_step": 2.6714398860931396, "step": 1957} +{"train_info/time_between_train_steps": 0.003293275833129883, "step": 1957} +{"info/global_step": 1958, "train_info/time_within_train_step": 2.6723251342773438, "step": 1958} +{"train_info/time_between_train_steps": 0.0032629966735839844, "step": 1958} +{"info/global_step": 1959, "train_info/time_within_train_step": 2.671152114868164, "step": 1959} +{"train_info/time_between_train_steps": 0.0032842159271240234, "step": 1959} +{"info/global_step": 1960, "train_info/time_within_train_step": 2.6722054481506348, "step": 1960} +{"train_info/time_between_train_steps": 0.0032415390014648438, "step": 1960} +{"info/global_step": 1961, "train_info/time_within_train_step": 2.6726455688476562, "step": 1961} +{"train_info/time_between_train_steps": 0.0032939910888671875, "step": 1961} +{"info/global_step": 1962, "train_info/time_within_train_step": 2.6723766326904297, "step": 1962} +{"train_info/time_between_train_steps": 0.0032651424407958984, "step": 1962} +{"info/global_step": 1963, "train_info/time_within_train_step": 2.672698497772217, "step": 1963} +{"train_info/time_between_train_steps": 0.0032987594604492188, "step": 1963} +{"info/global_step": 1964, "train_info/time_within_train_step": 2.6725337505340576, "step": 1964} +{"train_info/time_between_train_steps": 0.003244161605834961, "step": 1964} +{"info/global_step": 1965, "train_info/time_within_train_step": 2.673630475997925, "step": 1965} +{"train_info/time_between_train_steps": 0.0033583641052246094, "step": 1965} +{"info/global_step": 1966, "train_info/time_within_train_step": 2.672332525253296, "step": 1966} +{"train_info/time_between_train_steps": 0.0032367706298828125, "step": 1966} +{"info/global_step": 1967, "train_info/time_within_train_step": 2.6732900142669678, "step": 1967} +{"train_info/time_between_train_steps": 0.0032160282135009766, "step": 1967} +{"info/global_step": 1968, "train_info/time_within_train_step": 2.672370672225952, "step": 1968} +{"train_info/time_between_train_steps": 0.0032262802124023438, "step": 1968} +{"info/global_step": 1969, "train_info/time_within_train_step": 2.6707963943481445, "step": 1969} +{"train_info/time_between_train_steps": 0.003256082534790039, "step": 1969} +{"info/global_step": 1970, "train_info/time_within_train_step": 2.6729485988616943, "step": 1970} +{"train_info/time_between_train_steps": 0.0032210350036621094, "step": 1970} +{"info/global_step": 1971, "train_info/time_within_train_step": 2.6719377040863037, "step": 1971} +{"train_info/time_between_train_steps": 0.0032074451446533203, "step": 1971} +{"info/global_step": 1972, "train_info/time_within_train_step": 2.671377420425415, "step": 1972} +{"train_info/time_between_train_steps": 0.0032846927642822266, "step": 1972} +{"info/global_step": 1973, "train_info/time_within_train_step": 2.671078681945801, "step": 1973} +{"train_info/time_between_train_steps": 0.003224611282348633, "step": 1973} +{"info/global_step": 1974, "train_info/time_within_train_step": 2.672671318054199, "step": 1974} +{"train_info/time_between_train_steps": 0.0032813549041748047, "step": 1974} +{"info/global_step": 1975, "train_info/time_within_train_step": 2.671943187713623, "step": 1975} +{"train_info/time_between_train_steps": 0.00322723388671875, "step": 1975} +{"info/global_step": 1976, "train_info/time_within_train_step": 2.6722028255462646, "step": 1976} +{"train_info/time_between_train_steps": 0.0032389163970947266, "step": 1976} +{"info/global_step": 1977, "train_info/time_within_train_step": 2.671902894973755, "step": 1977} +{"train_info/time_between_train_steps": 0.003326416015625, "step": 1977} +{"info/global_step": 1978, "train_info/time_within_train_step": 2.672527313232422, "step": 1978} +{"train_info/time_between_train_steps": 0.13592791557312012, "step": 1978} +{"info/global_step": 1979, "train_info/time_within_train_step": 2.672630548477173, "step": 1979} +{"train_info/time_between_train_steps": 0.003269672393798828, "step": 1979} +{"info/global_step": 1980, "train_info/time_within_train_step": 2.6710000038146973, "step": 1980} +{"train_info/time_between_train_steps": 0.0033135414123535156, "step": 1980} +{"info/global_step": 1981, "train_info/time_within_train_step": 2.670736074447632, "step": 1981} +{"train_info/time_between_train_steps": 0.0032558441162109375, "step": 1981} +{"info/global_step": 1982, "train_info/time_within_train_step": 2.67036771774292, "step": 1982} +{"train_info/time_between_train_steps": 0.0032472610473632812, "step": 1982} +{"info/global_step": 1983, "train_info/time_within_train_step": 2.6717636585235596, "step": 1983} +{"train_info/time_between_train_steps": 0.0032460689544677734, "step": 1983} +{"info/global_step": 1984, "train_info/time_within_train_step": 2.671463966369629, "step": 1984} +{"train_info/time_between_train_steps": 0.0032548904418945312, "step": 1984} +{"info/global_step": 1985, "train_info/time_within_train_step": 2.6718637943267822, "step": 1985} +{"train_info/time_between_train_steps": 0.003298521041870117, "step": 1985} +{"info/global_step": 1986, "train_info/time_within_train_step": 2.9746901988983154, "step": 1986} +{"train_info/time_between_train_steps": 0.0032782554626464844, "step": 1986} +{"info/global_step": 1987, "train_info/time_within_train_step": 2.6714770793914795, "step": 1987} +{"train_info/time_between_train_steps": 0.003312826156616211, "step": 1987} +{"info/global_step": 1988, "train_info/time_within_train_step": 2.6706860065460205, "step": 1988} +{"train_info/time_between_train_steps": 0.0032541751861572266, "step": 1988} +{"info/global_step": 1989, "train_info/time_within_train_step": 2.7251763343811035, "step": 1989} +{"train_info/time_between_train_steps": 0.003279447555541992, "step": 1989} +{"info/global_step": 1990, "train_info/time_within_train_step": 2.671354293823242, "step": 1990} +{"train_info/time_between_train_steps": 0.0032300949096679688, "step": 1990} +{"info/global_step": 1991, "train_info/time_within_train_step": 2.672076463699341, "step": 1991} +{"train_info/time_between_train_steps": 0.003309488296508789, "step": 1991} +{"info/global_step": 1992, "train_info/time_within_train_step": 2.6714189052581787, "step": 1992} +{"train_info/time_between_train_steps": 0.003282785415649414, "step": 1992} +{"info/global_step": 1993, "train_info/time_within_train_step": 2.6724026203155518, "step": 1993} +{"train_info/time_between_train_steps": 0.003248453140258789, "step": 1993} +{"info/global_step": 1994, "train_info/time_within_train_step": 2.6719138622283936, "step": 1994} +{"train_info/time_between_train_steps": 0.003283977508544922, "step": 1994} +{"info/global_step": 1995, "train_info/time_within_train_step": 2.672440528869629, "step": 1995} +{"train_info/time_between_train_steps": 0.003297090530395508, "step": 1995} +{"info/global_step": 1996, "train_info/time_within_train_step": 2.672297716140747, "step": 1996} +{"train_info/time_between_train_steps": 0.0032715797424316406, "step": 1996} +{"info/global_step": 1997, "train_info/time_within_train_step": 2.6719746589660645, "step": 1997} +{"train_info/time_between_train_steps": 0.003236055374145508, "step": 1997} +{"info/global_step": 1998, "train_info/time_within_train_step": 2.671644449234009, "step": 1998} +{"train_info/time_between_train_steps": 0.0032494068145751953, "step": 1998} +{"info/global_step": 1999, "train_info/time_within_train_step": 2.6705610752105713, "step": 1999} +{"train_info/time_between_train_steps": 0.0032529830932617188, "step": 1999} +{"info/global_step": 2000, "train_info/time_within_train_step": 3.242499351501465, "step": 2000} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746208958, "_runtime": 5730}, "step": 2000} +{"logs": {"train/loss": 4.1139, "train/learning_rate": 0.00022222222222222218, "train/epoch": 2.09, "_timestamp": 1746208958, "_runtime": 5730}, "step": 2000} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746208963, "_runtime": 5735}, "step": 2000} +{"logs": {"eval/loss": 4.485419750213623, "eval/runtime": 5.5917, "eval/samples_per_second": 36.125, "eval/steps_per_second": 1.252, "train/epoch": 2.09, "_timestamp": 1746208963, "_runtime": 5735}, "step": 2000} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746208963, "_runtime": 5735}, "step": 2000} +{"logs": {"eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_loss": 4.485419750213623, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_ppl": 88.71418079510764, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_runtime": 5.5917, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_samples_per_second": 36.125, "train/epoch": 2.09, "_timestamp": 1746208963, "_runtime": 5735}, "step": 2000} +{"train_info/time_between_train_steps": 18.598517894744873, "step": 2000} +{"info/global_step": 2001, "train_info/time_within_train_step": 2.4773964881896973, "step": 2001} +{"train_info/time_between_train_steps": 0.0032677650451660156, "step": 2001} +{"info/global_step": 2002, "train_info/time_within_train_step": 2.45674204826355, "step": 2002} +{"train_info/time_between_train_steps": 0.0035982131958007812, "step": 2002} +{"info/global_step": 2003, "train_info/time_within_train_step": 2.4650521278381348, "step": 2003} +{"train_info/time_between_train_steps": 0.003260374069213867, "step": 2003} +{"info/global_step": 2004, "train_info/time_within_train_step": 2.645087718963623, "step": 2004} +{"train_info/time_between_train_steps": 0.0032596588134765625, "step": 2004} +{"info/global_step": 2005, "train_info/time_within_train_step": 2.6713452339172363, "step": 2005} +{"train_info/time_between_train_steps": 0.0032453536987304688, "step": 2005} +{"info/global_step": 2006, "train_info/time_within_train_step": 2.6712114810943604, "step": 2006} +{"train_info/time_between_train_steps": 0.0032460689544677734, "step": 2006} +{"info/global_step": 2007, "train_info/time_within_train_step": 2.6716930866241455, "step": 2007} +{"train_info/time_between_train_steps": 0.003242015838623047, "step": 2007} +{"info/global_step": 2008, "train_info/time_within_train_step": 2.6711416244506836, "step": 2008} +{"train_info/time_between_train_steps": 0.0032465457916259766, "step": 2008} +{"info/global_step": 2009, "train_info/time_within_train_step": 2.671719789505005, "step": 2009} +{"train_info/time_between_train_steps": 0.003235340118408203, "step": 2009} +{"info/global_step": 2010, "train_info/time_within_train_step": 2.6726109981536865, "step": 2010} +{"train_info/time_between_train_steps": 0.0032863616943359375, "step": 2010} +{"info/global_step": 2011, "train_info/time_within_train_step": 2.673830509185791, "step": 2011} +{"train_info/time_between_train_steps": 0.003245115280151367, "step": 2011} +{"info/global_step": 2012, "train_info/time_within_train_step": 2.6780099868774414, "step": 2012} +{"train_info/time_between_train_steps": 0.003264904022216797, "step": 2012} +{"info/global_step": 2013, "train_info/time_within_train_step": 2.6725528240203857, "step": 2013} +{"train_info/time_between_train_steps": 0.003243684768676758, "step": 2013} +{"info/global_step": 2014, "train_info/time_within_train_step": 2.673604726791382, "step": 2014} +{"train_info/time_between_train_steps": 0.0032911300659179688, "step": 2014} +{"info/global_step": 2015, "train_info/time_within_train_step": 2.67343807220459, "step": 2015} +{"train_info/time_between_train_steps": 0.0032591819763183594, "step": 2015} +{"info/global_step": 2016, "train_info/time_within_train_step": 2.6771514415740967, "step": 2016} +{"train_info/time_between_train_steps": 0.0032782554626464844, "step": 2016} +{"info/global_step": 2017, "train_info/time_within_train_step": 2.710287570953369, "step": 2017} +{"train_info/time_between_train_steps": 0.003261089324951172, "step": 2017} +{"info/global_step": 2018, "train_info/time_within_train_step": 2.6736998558044434, "step": 2018} +{"train_info/time_between_train_steps": 0.003242969512939453, "step": 2018} +{"info/global_step": 2019, "train_info/time_within_train_step": 2.6728479862213135, "step": 2019} +{"train_info/time_between_train_steps": 0.0032265186309814453, "step": 2019} +{"info/global_step": 2020, "train_info/time_within_train_step": 2.673245429992676, "step": 2020} +{"train_info/time_between_train_steps": 0.0034477710723876953, "step": 2020} +{"info/global_step": 2021, "train_info/time_within_train_step": 2.6738011837005615, "step": 2021} +{"train_info/time_between_train_steps": 0.0034456253051757812, "step": 2021} +{"info/global_step": 2022, "train_info/time_within_train_step": 2.6737096309661865, "step": 2022} +{"train_info/time_between_train_steps": 0.0033941268920898438, "step": 2022} +{"info/global_step": 2023, "train_info/time_within_train_step": 2.674837827682495, "step": 2023} +{"train_info/time_between_train_steps": 0.003493070602416992, "step": 2023} +{"info/global_step": 2024, "train_info/time_within_train_step": 2.672501564025879, "step": 2024} +{"train_info/time_between_train_steps": 0.003607034683227539, "step": 2024} +{"info/global_step": 2025, "train_info/time_within_train_step": 2.673510789871216, "step": 2025} +{"train_info/time_between_train_steps": 0.0035588741302490234, "step": 2025} +{"info/global_step": 2026, "train_info/time_within_train_step": 2.6741600036621094, "step": 2026} +{"train_info/time_between_train_steps": 0.003525972366333008, "step": 2026} +{"info/global_step": 2027, "train_info/time_within_train_step": 2.673478126525879, "step": 2027} +{"train_info/time_between_train_steps": 0.0035300254821777344, "step": 2027} +{"info/global_step": 2028, "train_info/time_within_train_step": 2.6732382774353027, "step": 2028} +{"train_info/time_between_train_steps": 0.0035643577575683594, "step": 2028} +{"info/global_step": 2029, "train_info/time_within_train_step": 2.674168109893799, "step": 2029} +{"train_info/time_between_train_steps": 0.00360107421875, "step": 2029} +{"info/global_step": 2030, "train_info/time_within_train_step": 2.6742470264434814, "step": 2030} +{"train_info/time_between_train_steps": 0.003555774688720703, "step": 2030} +{"info/global_step": 2031, "train_info/time_within_train_step": 2.6738381385803223, "step": 2031} +{"train_info/time_between_train_steps": 0.003678560256958008, "step": 2031} +{"info/global_step": 2032, "train_info/time_within_train_step": 2.673330783843994, "step": 2032} +{"train_info/time_between_train_steps": 0.0035066604614257812, "step": 2032} +{"info/global_step": 2033, "train_info/time_within_train_step": 2.671675205230713, "step": 2033} +{"train_info/time_between_train_steps": 0.003559112548828125, "step": 2033} +{"info/global_step": 2034, "train_info/time_within_train_step": 2.674820899963379, "step": 2034} +{"train_info/time_between_train_steps": 0.0034942626953125, "step": 2034} +{"info/global_step": 2035, "train_info/time_within_train_step": 2.672800064086914, "step": 2035} +{"train_info/time_between_train_steps": 0.0033805370330810547, "step": 2035} +{"info/global_step": 2036, "train_info/time_within_train_step": 2.6738760471343994, "step": 2036} +{"train_info/time_between_train_steps": 0.003490447998046875, "step": 2036} +{"info/global_step": 2037, "train_info/time_within_train_step": 2.6732070446014404, "step": 2037} +{"train_info/time_between_train_steps": 0.0033736228942871094, "step": 2037} +{"info/global_step": 2038, "train_info/time_within_train_step": 2.6718485355377197, "step": 2038} +{"train_info/time_between_train_steps": 0.0035135746002197266, "step": 2038} +{"info/global_step": 2039, "train_info/time_within_train_step": 2.6721725463867188, "step": 2039} +{"train_info/time_between_train_steps": 0.0035715103149414062, "step": 2039} +{"info/global_step": 2040, "train_info/time_within_train_step": 2.674299716949463, "step": 2040} +{"train_info/time_between_train_steps": 0.0034933090209960938, "step": 2040} +{"info/global_step": 2041, "train_info/time_within_train_step": 2.8505165576934814, "step": 2041} +{"train_info/time_between_train_steps": 0.0033354759216308594, "step": 2041} +{"info/global_step": 2042, "train_info/time_within_train_step": 2.672377824783325, "step": 2042} +{"train_info/time_between_train_steps": 0.003329753875732422, "step": 2042} +{"info/global_step": 2043, "train_info/time_within_train_step": 3.0540506839752197, "step": 2043} +{"train_info/time_between_train_steps": 0.0032911300659179688, "step": 2043} +{"info/global_step": 2044, "train_info/time_within_train_step": 2.6724443435668945, "step": 2044} +{"train_info/time_between_train_steps": 0.0032432079315185547, "step": 2044} +{"info/global_step": 2045, "train_info/time_within_train_step": 2.671812057495117, "step": 2045} +{"train_info/time_between_train_steps": 0.003299236297607422, "step": 2045} +{"info/global_step": 2046, "train_info/time_within_train_step": 2.67086124420166, "step": 2046} +{"train_info/time_between_train_steps": 0.003277301788330078, "step": 2046} +{"info/global_step": 2047, "train_info/time_within_train_step": 2.6713414192199707, "step": 2047} +{"train_info/time_between_train_steps": 0.0032515525817871094, "step": 2047} +{"info/global_step": 2048, "train_info/time_within_train_step": 2.6712725162506104, "step": 2048} +{"train_info/time_between_train_steps": 0.003226757049560547, "step": 2048} +{"info/global_step": 2049, "train_info/time_within_train_step": 2.6723015308380127, "step": 2049} +{"train_info/time_between_train_steps": 0.0032722949981689453, "step": 2049} +{"info/global_step": 2050, "train_info/time_within_train_step": 2.6704750061035156, "step": 2050} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746209111, "_runtime": 5883}, "step": 2050} +{"logs": {"train/loss": 4.1113, "train/learning_rate": 0.0002111111111111111, "train/epoch": 2.11, "_timestamp": 1746209111, "_runtime": 5883}, "step": 2050} +{"train_info/time_between_train_steps": 0.02485823631286621, "step": 2050} +{"info/global_step": 2051, "train_info/time_within_train_step": 2.6713180541992188, "step": 2051} +{"train_info/time_between_train_steps": 0.0032324790954589844, "step": 2051} +{"info/global_step": 2052, "train_info/time_within_train_step": 2.669545888900757, "step": 2052} +{"train_info/time_between_train_steps": 0.003307342529296875, "step": 2052} +{"info/global_step": 2053, "train_info/time_within_train_step": 2.669715642929077, "step": 2053} +{"train_info/time_between_train_steps": 0.003235340118408203, "step": 2053} +{"info/global_step": 2054, "train_info/time_within_train_step": 2.6696770191192627, "step": 2054} +{"train_info/time_between_train_steps": 0.0032575130462646484, "step": 2054} +{"info/global_step": 2055, "train_info/time_within_train_step": 2.671147584915161, "step": 2055} +{"train_info/time_between_train_steps": 0.0032491683959960938, "step": 2055} +{"info/global_step": 2056, "train_info/time_within_train_step": 2.6714892387390137, "step": 2056} +{"train_info/time_between_train_steps": 0.0038907527923583984, "step": 2056} +{"info/global_step": 2057, "train_info/time_within_train_step": 2.672659397125244, "step": 2057} +{"train_info/time_between_train_steps": 0.0033278465270996094, "step": 2057} +{"info/global_step": 2058, "train_info/time_within_train_step": 2.673754930496216, "step": 2058} +{"train_info/time_between_train_steps": 0.003351926803588867, "step": 2058} +{"info/global_step": 2059, "train_info/time_within_train_step": 2.6747138500213623, "step": 2059} +{"train_info/time_between_train_steps": 0.003491640090942383, "step": 2059} +{"info/global_step": 2060, "train_info/time_within_train_step": 2.6743171215057373, "step": 2060} +{"train_info/time_between_train_steps": 0.003334522247314453, "step": 2060} +{"info/global_step": 2061, "train_info/time_within_train_step": 2.6730551719665527, "step": 2061} +{"train_info/time_between_train_steps": 0.0033462047576904297, "step": 2061} +{"info/global_step": 2062, "train_info/time_within_train_step": 2.674098014831543, "step": 2062} +{"train_info/time_between_train_steps": 0.0034112930297851562, "step": 2062} +{"info/global_step": 2063, "train_info/time_within_train_step": 2.6740758419036865, "step": 2063} +{"train_info/time_between_train_steps": 0.0034317970275878906, "step": 2063} +{"info/global_step": 2064, "train_info/time_within_train_step": 2.6740193367004395, "step": 2064} +{"train_info/time_between_train_steps": 0.003383159637451172, "step": 2064} +{"info/global_step": 2065, "train_info/time_within_train_step": 2.672715425491333, "step": 2065} +{"train_info/time_between_train_steps": 0.003358125686645508, "step": 2065} +{"info/global_step": 2066, "train_info/time_within_train_step": 2.6734609603881836, "step": 2066} +{"train_info/time_between_train_steps": 0.003417491912841797, "step": 2066} +{"info/global_step": 2067, "train_info/time_within_train_step": 2.673651695251465, "step": 2067} +{"train_info/time_between_train_steps": 0.0038650035858154297, "step": 2067} +{"info/global_step": 2068, "train_info/time_within_train_step": 2.6732685565948486, "step": 2068} +{"train_info/time_between_train_steps": 0.003742218017578125, "step": 2068} +{"info/global_step": 2069, "train_info/time_within_train_step": 2.6740500926971436, "step": 2069} +{"train_info/time_between_train_steps": 0.0038242340087890625, "step": 2069} +{"info/global_step": 2070, "train_info/time_within_train_step": 2.673921585083008, "step": 2070} +{"train_info/time_between_train_steps": 0.0036678314208984375, "step": 2070} +{"info/global_step": 2071, "train_info/time_within_train_step": 2.6727652549743652, "step": 2071} +{"train_info/time_between_train_steps": 0.003753185272216797, "step": 2071} +{"info/global_step": 2072, "train_info/time_within_train_step": 2.6723320484161377, "step": 2072} +{"train_info/time_between_train_steps": 0.0036907196044921875, "step": 2072} +{"info/global_step": 2073, "train_info/time_within_train_step": 2.6743545532226562, "step": 2073} +{"train_info/time_between_train_steps": 0.0036749839782714844, "step": 2073} +{"info/global_step": 2074, "train_info/time_within_train_step": 2.6734182834625244, "step": 2074} +{"train_info/time_between_train_steps": 0.0036842823028564453, "step": 2074} +{"info/global_step": 2075, "train_info/time_within_train_step": 2.674415349960327, "step": 2075} +{"train_info/time_between_train_steps": 0.0037996768951416016, "step": 2075} +{"info/global_step": 2076, "train_info/time_within_train_step": 2.6736655235290527, "step": 2076} +{"train_info/time_between_train_steps": 0.003700733184814453, "step": 2076} +{"info/global_step": 2077, "train_info/time_within_train_step": 2.6731863021850586, "step": 2077} +{"train_info/time_between_train_steps": 0.0036935806274414062, "step": 2077} +{"info/global_step": 2078, "train_info/time_within_train_step": 2.6742234230041504, "step": 2078} +{"train_info/time_between_train_steps": 0.0037279129028320312, "step": 2078} +{"info/global_step": 2079, "train_info/time_within_train_step": 2.6778764724731445, "step": 2079} +{"train_info/time_between_train_steps": 0.0036592483520507812, "step": 2079} +{"info/global_step": 2080, "train_info/time_within_train_step": 2.6732516288757324, "step": 2080} +{"train_info/time_between_train_steps": 0.0036318302154541016, "step": 2080} +{"info/global_step": 2081, "train_info/time_within_train_step": 2.6746344566345215, "step": 2081} +{"train_info/time_between_train_steps": 0.003776073455810547, "step": 2081} +{"info/global_step": 2082, "train_info/time_within_train_step": 3.0926036834716797, "step": 2082} +{"train_info/time_between_train_steps": 0.003492593765258789, "step": 2082} +{"info/global_step": 2083, "train_info/time_within_train_step": 2.6722047328948975, "step": 2083} +{"train_info/time_between_train_steps": 0.003386974334716797, "step": 2083} +{"info/global_step": 2084, "train_info/time_within_train_step": 2.671034336090088, "step": 2084} +{"train_info/time_between_train_steps": 0.003371000289916992, "step": 2084} +{"info/global_step": 2085, "train_info/time_within_train_step": 2.6723294258117676, "step": 2085} +{"train_info/time_between_train_steps": 0.0034339427947998047, "step": 2085} +{"info/global_step": 2086, "train_info/time_within_train_step": 2.6727733612060547, "step": 2086} +{"train_info/time_between_train_steps": 0.003417491912841797, "step": 2086} +{"info/global_step": 2087, "train_info/time_within_train_step": 2.6726670265197754, "step": 2087} +{"train_info/time_between_train_steps": 0.0033686161041259766, "step": 2087} +{"info/global_step": 2088, "train_info/time_within_train_step": 2.6717703342437744, "step": 2088} +{"train_info/time_between_train_steps": 0.0033855438232421875, "step": 2088} +{"info/global_step": 2089, "train_info/time_within_train_step": 2.673004627227783, "step": 2089} +{"train_info/time_between_train_steps": 0.003415346145629883, "step": 2089} +{"info/global_step": 2090, "train_info/time_within_train_step": 2.6716084480285645, "step": 2090} +{"train_info/time_between_train_steps": 0.003368854522705078, "step": 2090} +{"info/global_step": 2091, "train_info/time_within_train_step": 2.6714375019073486, "step": 2091} +{"train_info/time_between_train_steps": 0.0033638477325439453, "step": 2091} +{"info/global_step": 2092, "train_info/time_within_train_step": 2.6727476119995117, "step": 2092} +{"train_info/time_between_train_steps": 0.0034379959106445312, "step": 2092} +{"info/global_step": 2093, "train_info/time_within_train_step": 2.671344757080078, "step": 2093} +{"train_info/time_between_train_steps": 0.0033936500549316406, "step": 2093} +{"info/global_step": 2094, "train_info/time_within_train_step": 2.6720449924468994, "step": 2094} +{"train_info/time_between_train_steps": 0.003335237503051758, "step": 2094} +{"info/global_step": 2095, "train_info/time_within_train_step": 2.672269582748413, "step": 2095} +{"train_info/time_between_train_steps": 0.00334930419921875, "step": 2095} +{"info/global_step": 2096, "train_info/time_within_train_step": 2.672823905944824, "step": 2096} +{"train_info/time_between_train_steps": 0.003383159637451172, "step": 2096} +{"info/global_step": 2097, "train_info/time_within_train_step": 2.673999786376953, "step": 2097} +{"train_info/time_between_train_steps": 0.0033721923828125, "step": 2097} +{"info/global_step": 2098, "train_info/time_within_train_step": 2.673065662384033, "step": 2098} +{"train_info/time_between_train_steps": 0.0033788681030273438, "step": 2098} +{"info/global_step": 2099, "train_info/time_within_train_step": 2.6727287769317627, "step": 2099} +{"train_info/time_between_train_steps": 0.0035092830657958984, "step": 2099} +{"info/global_step": 2100, "train_info/time_within_train_step": 2.675548553466797, "step": 2100} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746209246, "_runtime": 6018}, "step": 2100} +{"logs": {"train/loss": 4.0869, "train/learning_rate": 0.00019999999999999998, "train/epoch": 2.12, "_timestamp": 1746209246, "_runtime": 6018}, "step": 2100} +{"train_info/time_between_train_steps": 26.0439395904541, "step": 2100} +{"info/global_step": 2101, "train_info/time_within_train_step": 2.46915864944458, "step": 2101} +{"train_info/time_between_train_steps": 0.0033826828002929688, "step": 2101} +{"info/global_step": 2102, "train_info/time_within_train_step": 2.4558324813842773, "step": 2102} +{"train_info/time_between_train_steps": 0.0034949779510498047, "step": 2102} +{"info/global_step": 2103, "train_info/time_within_train_step": 2.4568135738372803, "step": 2103} +{"train_info/time_between_train_steps": 0.1492316722869873, "step": 2103} +{"info/global_step": 2104, "train_info/time_within_train_step": 2.6155738830566406, "step": 2104} +{"train_info/time_between_train_steps": 0.0034165382385253906, "step": 2104} +{"info/global_step": 2105, "train_info/time_within_train_step": 2.664973258972168, "step": 2105} +{"train_info/time_between_train_steps": 0.003693819046020508, "step": 2105} +{"info/global_step": 2106, "train_info/time_within_train_step": 2.6744725704193115, "step": 2106} +{"train_info/time_between_train_steps": 0.0036652088165283203, "step": 2106} +{"info/global_step": 2107, "train_info/time_within_train_step": 2.6747326850891113, "step": 2107} +{"train_info/time_between_train_steps": 0.0036211013793945312, "step": 2107} +{"info/global_step": 2108, "train_info/time_within_train_step": 2.67484188079834, "step": 2108} +{"train_info/time_between_train_steps": 0.0038220882415771484, "step": 2108} +{"info/global_step": 2109, "train_info/time_within_train_step": 2.6759235858917236, "step": 2109} +{"train_info/time_between_train_steps": 0.0037412643432617188, "step": 2109} +{"info/global_step": 2110, "train_info/time_within_train_step": 2.6758008003234863, "step": 2110} +{"train_info/time_between_train_steps": 0.0037512779235839844, "step": 2110} +{"info/global_step": 2111, "train_info/time_within_train_step": 2.67598819732666, "step": 2111} +{"train_info/time_between_train_steps": 0.003732442855834961, "step": 2111} +{"info/global_step": 2112, "train_info/time_within_train_step": 2.6756551265716553, "step": 2112} +{"train_info/time_between_train_steps": 0.0037391185760498047, "step": 2112} +{"info/global_step": 2113, "train_info/time_within_train_step": 2.6758227348327637, "step": 2113} +{"train_info/time_between_train_steps": 0.0038683414459228516, "step": 2113} +{"info/global_step": 2114, "train_info/time_within_train_step": 2.6754567623138428, "step": 2114} +{"train_info/time_between_train_steps": 0.003847837448120117, "step": 2114} +{"info/global_step": 2115, "train_info/time_within_train_step": 2.6768407821655273, "step": 2115} +{"train_info/time_between_train_steps": 0.0037469863891601562, "step": 2115} +{"info/global_step": 2116, "train_info/time_within_train_step": 2.6753978729248047, "step": 2116} +{"train_info/time_between_train_steps": 0.003654003143310547, "step": 2116} +{"info/global_step": 2117, "train_info/time_within_train_step": 2.677903413772583, "step": 2117} +{"train_info/time_between_train_steps": 0.0038194656372070312, "step": 2117} +{"info/global_step": 2118, "train_info/time_within_train_step": 2.6758787631988525, "step": 2118} +{"train_info/time_between_train_steps": 0.0036437511444091797, "step": 2118} +{"info/global_step": 2119, "train_info/time_within_train_step": 2.6759579181671143, "step": 2119} +{"train_info/time_between_train_steps": 0.0037806034088134766, "step": 2119} +{"info/global_step": 2120, "train_info/time_within_train_step": 2.6756041049957275, "step": 2120} +{"train_info/time_between_train_steps": 0.0036923885345458984, "step": 2120} +{"info/global_step": 2121, "train_info/time_within_train_step": 2.6756153106689453, "step": 2121} +{"train_info/time_between_train_steps": 0.0037288665771484375, "step": 2121} +{"info/global_step": 2122, "train_info/time_within_train_step": 2.6751482486724854, "step": 2122} +{"train_info/time_between_train_steps": 0.0037202835083007812, "step": 2122} +{"info/global_step": 2123, "train_info/time_within_train_step": 2.67553973197937, "step": 2123} +{"train_info/time_between_train_steps": 0.003670930862426758, "step": 2123} +{"info/global_step": 2124, "train_info/time_within_train_step": 2.6746041774749756, "step": 2124} +{"train_info/time_between_train_steps": 0.0037147998809814453, "step": 2124} +{"info/global_step": 2125, "train_info/time_within_train_step": 2.6745338439941406, "step": 2125} +{"train_info/time_between_train_steps": 0.003756284713745117, "step": 2125} +{"info/global_step": 2126, "train_info/time_within_train_step": 2.673945665359497, "step": 2126} +{"train_info/time_between_train_steps": 0.0036385059356689453, "step": 2126} +{"info/global_step": 2127, "train_info/time_within_train_step": 2.6752572059631348, "step": 2127} +{"train_info/time_between_train_steps": 0.003657817840576172, "step": 2127} +{"info/global_step": 2128, "train_info/time_within_train_step": 2.6765902042388916, "step": 2128} +{"train_info/time_between_train_steps": 0.0036401748657226562, "step": 2128} +{"info/global_step": 2129, "train_info/time_within_train_step": 2.675771713256836, "step": 2129} +{"train_info/time_between_train_steps": 0.0036656856536865234, "step": 2129} +{"info/global_step": 2130, "train_info/time_within_train_step": 2.6764066219329834, "step": 2130} +{"train_info/time_between_train_steps": 0.003717660903930664, "step": 2130} +{"info/global_step": 2131, "train_info/time_within_train_step": 2.676292657852173, "step": 2131} +{"train_info/time_between_train_steps": 0.0037882328033447266, "step": 2131} +{"info/global_step": 2132, "train_info/time_within_train_step": 2.6768639087677, "step": 2132} +{"train_info/time_between_train_steps": 0.003718852996826172, "step": 2132} +{"info/global_step": 2133, "train_info/time_within_train_step": 2.676710367202759, "step": 2133} +{"train_info/time_between_train_steps": 0.003786802291870117, "step": 2133} +{"info/global_step": 2134, "train_info/time_within_train_step": 2.6761627197265625, "step": 2134} +{"train_info/time_between_train_steps": 0.003739595413208008, "step": 2134} +{"info/global_step": 2135, "train_info/time_within_train_step": 2.6750874519348145, "step": 2135} +{"train_info/time_between_train_steps": 0.0037758350372314453, "step": 2135} +{"info/global_step": 2136, "train_info/time_within_train_step": 2.675987958908081, "step": 2136} +{"train_info/time_between_train_steps": 0.0036835670471191406, "step": 2136} +{"info/global_step": 2137, "train_info/time_within_train_step": 2.6754822731018066, "step": 2137} +{"train_info/time_between_train_steps": 0.0038034915924072266, "step": 2137} +{"info/global_step": 2138, "train_info/time_within_train_step": 2.674321413040161, "step": 2138} +{"train_info/time_between_train_steps": 0.003746509552001953, "step": 2138} +{"info/global_step": 2139, "train_info/time_within_train_step": 2.6753504276275635, "step": 2139} +{"train_info/time_between_train_steps": 0.0036978721618652344, "step": 2139} +{"info/global_step": 2140, "train_info/time_within_train_step": 2.674792528152466, "step": 2140} +{"train_info/time_between_train_steps": 0.0037534236907958984, "step": 2140} +{"info/global_step": 2141, "train_info/time_within_train_step": 2.674278497695923, "step": 2141} +{"train_info/time_between_train_steps": 0.003875255584716797, "step": 2141} +{"info/global_step": 2142, "train_info/time_within_train_step": 2.6769561767578125, "step": 2142} +{"train_info/time_between_train_steps": 0.003643512725830078, "step": 2142} +{"info/global_step": 2143, "train_info/time_within_train_step": 2.6807103157043457, "step": 2143} +{"train_info/time_between_train_steps": 0.0035982131958007812, "step": 2143} +{"info/global_step": 2144, "train_info/time_within_train_step": 2.6751697063446045, "step": 2144} +{"train_info/time_between_train_steps": 0.0036287307739257812, "step": 2144} +{"info/global_step": 2145, "train_info/time_within_train_step": 3.030313014984131, "step": 2145} +{"train_info/time_between_train_steps": 0.0034246444702148438, "step": 2145} +{"info/global_step": 2146, "train_info/time_within_train_step": 2.6762263774871826, "step": 2146} +{"train_info/time_between_train_steps": 0.0045490264892578125, "step": 2146} +{"info/global_step": 2147, "train_info/time_within_train_step": 2.675546646118164, "step": 2147} +{"train_info/time_between_train_steps": 0.003470897674560547, "step": 2147} +{"info/global_step": 2148, "train_info/time_within_train_step": 2.673800468444824, "step": 2148} +{"train_info/time_between_train_steps": 0.0034232139587402344, "step": 2148} +{"info/global_step": 2149, "train_info/time_within_train_step": 2.6748244762420654, "step": 2149} +{"train_info/time_between_train_steps": 0.0035545825958251953, "step": 2149} +{"info/global_step": 2150, "train_info/time_within_train_step": 2.6763737201690674, "step": 2150} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746209407, "_runtime": 6179}, "step": 2150} +{"logs": {"train/loss": 4.0756, "train/learning_rate": 0.00018888888888888888, "train/epoch": 2.14, "_timestamp": 1746209407, "_runtime": 6179}, "step": 2150} +{"train_info/time_between_train_steps": 0.024495840072631836, "step": 2150} +{"info/global_step": 2151, "train_info/time_within_train_step": 2.6769537925720215, "step": 2151} +{"train_info/time_between_train_steps": 0.003587961196899414, "step": 2151} +{"info/global_step": 2152, "train_info/time_within_train_step": 2.6755948066711426, "step": 2152} +{"train_info/time_between_train_steps": 0.0036935806274414062, "step": 2152} +{"info/global_step": 2153, "train_info/time_within_train_step": 2.677135944366455, "step": 2153} +{"train_info/time_between_train_steps": 0.0037949085235595703, "step": 2153} +{"info/global_step": 2154, "train_info/time_within_train_step": 2.675696849822998, "step": 2154} +{"train_info/time_between_train_steps": 0.0036859512329101562, "step": 2154} +{"info/global_step": 2155, "train_info/time_within_train_step": 2.6757256984710693, "step": 2155} +{"train_info/time_between_train_steps": 0.003656148910522461, "step": 2155} +{"info/global_step": 2156, "train_info/time_within_train_step": 2.6770362854003906, "step": 2156} +{"train_info/time_between_train_steps": 0.0038347244262695312, "step": 2156} +{"info/global_step": 2157, "train_info/time_within_train_step": 2.6731255054473877, "step": 2157} +{"train_info/time_between_train_steps": 0.0037279129028320312, "step": 2157} +{"info/global_step": 2158, "train_info/time_within_train_step": 2.6738128662109375, "step": 2158} +{"train_info/time_between_train_steps": 0.0037314891815185547, "step": 2158} +{"info/global_step": 2159, "train_info/time_within_train_step": 2.6742193698883057, "step": 2159} +{"train_info/time_between_train_steps": 0.0037584304809570312, "step": 2159} +{"info/global_step": 2160, "train_info/time_within_train_step": 2.6796181201934814, "step": 2160} +{"train_info/time_between_train_steps": 0.0037374496459960938, "step": 2160} +{"info/global_step": 2161, "train_info/time_within_train_step": 2.683802366256714, "step": 2161} +{"train_info/time_between_train_steps": 0.003638029098510742, "step": 2161} +{"info/global_step": 2162, "train_info/time_within_train_step": 2.6756489276885986, "step": 2162} +{"train_info/time_between_train_steps": 0.0037097930908203125, "step": 2162} +{"info/global_step": 2163, "train_info/time_within_train_step": 2.6754305362701416, "step": 2163} +{"train_info/time_between_train_steps": 0.003660440444946289, "step": 2163} +{"info/global_step": 2164, "train_info/time_within_train_step": 2.675687313079834, "step": 2164} +{"train_info/time_between_train_steps": 0.004271745681762695, "step": 2164} +{"info/global_step": 2165, "train_info/time_within_train_step": 2.674903631210327, "step": 2165} +{"train_info/time_between_train_steps": 0.004015684127807617, "step": 2165} +{"info/global_step": 2166, "train_info/time_within_train_step": 2.8869009017944336, "step": 2166} +{"train_info/time_between_train_steps": 0.0035364627838134766, "step": 2166} +{"info/global_step": 2167, "train_info/time_within_train_step": 2.7100255489349365, "step": 2167} +{"train_info/time_between_train_steps": 0.0035600662231445312, "step": 2167} +{"info/global_step": 2168, "train_info/time_within_train_step": 2.6754727363586426, "step": 2168} +{"train_info/time_between_train_steps": 0.003599882125854492, "step": 2168} +{"info/global_step": 2169, "train_info/time_within_train_step": 2.6745686531066895, "step": 2169} +{"train_info/time_between_train_steps": 0.003572225570678711, "step": 2169} +{"info/global_step": 2170, "train_info/time_within_train_step": 2.6728556156158447, "step": 2170} +{"train_info/time_between_train_steps": 0.0037267208099365234, "step": 2170} +{"info/global_step": 2171, "train_info/time_within_train_step": 2.677637815475464, "step": 2171} +{"train_info/time_between_train_steps": 0.004354715347290039, "step": 2171} +{"info/global_step": 2172, "train_info/time_within_train_step": 2.675858974456787, "step": 2172} +{"train_info/time_between_train_steps": 0.004157304763793945, "step": 2172} +{"info/global_step": 2173, "train_info/time_within_train_step": 2.7279887199401855, "step": 2173} +{"train_info/time_between_train_steps": 0.0035855770111083984, "step": 2173} +{"info/global_step": 2174, "train_info/time_within_train_step": 2.6755454540252686, "step": 2174} +{"train_info/time_between_train_steps": 0.003639698028564453, "step": 2174} +{"info/global_step": 2175, "train_info/time_within_train_step": 2.6758477687835693, "step": 2175} +{"train_info/time_between_train_steps": 0.003673076629638672, "step": 2175} +{"info/global_step": 2176, "train_info/time_within_train_step": 2.674513101577759, "step": 2176} +{"train_info/time_between_train_steps": 0.0038230419158935547, "step": 2176} +{"info/global_step": 2177, "train_info/time_within_train_step": 2.6769216060638428, "step": 2177} +{"train_info/time_between_train_steps": 0.0037567615509033203, "step": 2177} +{"info/global_step": 2178, "train_info/time_within_train_step": 2.6765713691711426, "step": 2178} +{"train_info/time_between_train_steps": 0.0036106109619140625, "step": 2178} +{"info/global_step": 2179, "train_info/time_within_train_step": 2.67472243309021, "step": 2179} +{"train_info/time_between_train_steps": 0.0036597251892089844, "step": 2179} +{"info/global_step": 2180, "train_info/time_within_train_step": 2.6747636795043945, "step": 2180} +{"train_info/time_between_train_steps": 0.0037262439727783203, "step": 2180} +{"info/global_step": 2181, "train_info/time_within_train_step": 2.6756370067596436, "step": 2181} +{"train_info/time_between_train_steps": 0.00365447998046875, "step": 2181} +{"info/global_step": 2182, "train_info/time_within_train_step": 2.6742310523986816, "step": 2182} +{"train_info/time_between_train_steps": 0.003640413284301758, "step": 2182} +{"info/global_step": 2183, "train_info/time_within_train_step": 2.6744015216827393, "step": 2183} +{"train_info/time_between_train_steps": 0.0037021636962890625, "step": 2183} +{"info/global_step": 2184, "train_info/time_within_train_step": 2.6760127544403076, "step": 2184} +{"train_info/time_between_train_steps": 0.003688812255859375, "step": 2184} +{"info/global_step": 2185, "train_info/time_within_train_step": 2.6752045154571533, "step": 2185} +{"train_info/time_between_train_steps": 0.0036585330963134766, "step": 2185} +{"info/global_step": 2186, "train_info/time_within_train_step": 2.6745858192443848, "step": 2186} +{"train_info/time_between_train_steps": 0.003627300262451172, "step": 2186} +{"info/global_step": 2187, "train_info/time_within_train_step": 2.6749000549316406, "step": 2187} +{"train_info/time_between_train_steps": 0.003596067428588867, "step": 2187} +{"info/global_step": 2188, "train_info/time_within_train_step": 2.6758458614349365, "step": 2188} +{"train_info/time_between_train_steps": 0.003626108169555664, "step": 2188} +{"info/global_step": 2189, "train_info/time_within_train_step": 2.674556255340576, "step": 2189} +{"train_info/time_between_train_steps": 0.003693819046020508, "step": 2189} +{"info/global_step": 2190, "train_info/time_within_train_step": 2.677104949951172, "step": 2190} +{"train_info/time_between_train_steps": 0.003802776336669922, "step": 2190} +{"info/global_step": 2191, "train_info/time_within_train_step": 2.6754891872406006, "step": 2191} +{"train_info/time_between_train_steps": 0.0037364959716796875, "step": 2191} +{"info/global_step": 2192, "train_info/time_within_train_step": 2.6757516860961914, "step": 2192} +{"train_info/time_between_train_steps": 0.0038585662841796875, "step": 2192} +{"info/global_step": 2193, "train_info/time_within_train_step": 2.6763057708740234, "step": 2193} +{"train_info/time_between_train_steps": 0.0036017894744873047, "step": 2193} +{"info/global_step": 2194, "train_info/time_within_train_step": 2.6738829612731934, "step": 2194} +{"train_info/time_between_train_steps": 0.003621339797973633, "step": 2194} +{"info/global_step": 2195, "train_info/time_within_train_step": 2.6740455627441406, "step": 2195} +{"train_info/time_between_train_steps": 0.003587007522583008, "step": 2195} +{"info/global_step": 2196, "train_info/time_within_train_step": 2.6745011806488037, "step": 2196} +{"train_info/time_between_train_steps": 0.007235527038574219, "step": 2196} +{"info/global_step": 2197, "train_info/time_within_train_step": 2.6754708290100098, "step": 2197} +{"train_info/time_between_train_steps": 0.007201671600341797, "step": 2197} +{"info/global_step": 2198, "train_info/time_within_train_step": 2.676241159439087, "step": 2198} +{"train_info/time_between_train_steps": 0.0036504268646240234, "step": 2198} +{"info/global_step": 2199, "train_info/time_within_train_step": 2.6758720874786377, "step": 2199} +{"train_info/time_between_train_steps": 0.0036144256591796875, "step": 2199} +{"info/global_step": 2200, "train_info/time_within_train_step": 2.6768851280212402, "step": 2200} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746209542, "_runtime": 6314}, "step": 2200} +{"logs": {"train/loss": 4.0538, "train/learning_rate": 0.00017777777777777776, "train/epoch": 2.16, "_timestamp": 1746209542, "_runtime": 6314}, "step": 2200} +{"train_info/time_between_train_steps": 13.218204259872437, "step": 2200} +{"info/global_step": 2201, "train_info/time_within_train_step": 2.4710211753845215, "step": 2201} +{"train_info/time_between_train_steps": 0.0037980079650878906, "step": 2201} +{"info/global_step": 2202, "train_info/time_within_train_step": 2.4587669372558594, "step": 2202} +{"train_info/time_between_train_steps": 0.0037992000579833984, "step": 2202} +{"info/global_step": 2203, "train_info/time_within_train_step": 2.477938175201416, "step": 2203} +{"train_info/time_between_train_steps": 0.0037441253662109375, "step": 2203} +{"info/global_step": 2204, "train_info/time_within_train_step": 2.6568763256073, "step": 2204} +{"train_info/time_between_train_steps": 0.0037164688110351562, "step": 2204} +{"info/global_step": 2205, "train_info/time_within_train_step": 2.6733381748199463, "step": 2205} +{"train_info/time_between_train_steps": 0.0037603378295898438, "step": 2205} +{"info/global_step": 2206, "train_info/time_within_train_step": 2.6728920936584473, "step": 2206} +{"train_info/time_between_train_steps": 0.004001140594482422, "step": 2206} +{"info/global_step": 2207, "train_info/time_within_train_step": 2.7147014141082764, "step": 2207} +{"train_info/time_between_train_steps": 0.0037932395935058594, "step": 2207} +{"info/global_step": 2208, "train_info/time_within_train_step": 2.6747803688049316, "step": 2208} +{"train_info/time_between_train_steps": 0.003778219223022461, "step": 2208} +{"info/global_step": 2209, "train_info/time_within_train_step": 2.675442695617676, "step": 2209} +{"train_info/time_between_train_steps": 0.0037810802459716797, "step": 2209} +{"info/global_step": 2210, "train_info/time_within_train_step": 2.675759792327881, "step": 2210} +{"train_info/time_between_train_steps": 0.0037047863006591797, "step": 2210} +{"info/global_step": 2211, "train_info/time_within_train_step": 2.6753292083740234, "step": 2211} +{"train_info/time_between_train_steps": 0.003666400909423828, "step": 2211} +{"info/global_step": 2212, "train_info/time_within_train_step": 2.6754536628723145, "step": 2212} +{"train_info/time_between_train_steps": 0.0037233829498291016, "step": 2212} +{"info/global_step": 2213, "train_info/time_within_train_step": 2.725048542022705, "step": 2213} +{"train_info/time_between_train_steps": 0.0041103363037109375, "step": 2213} +{"info/global_step": 2214, "train_info/time_within_train_step": 3.067335605621338, "step": 2214} +{"train_info/time_between_train_steps": 0.003412961959838867, "step": 2214} +{"info/global_step": 2215, "train_info/time_within_train_step": 2.6762683391571045, "step": 2215} +{"train_info/time_between_train_steps": 0.003454446792602539, "step": 2215} +{"info/global_step": 2216, "train_info/time_within_train_step": 2.675605535507202, "step": 2216} +{"train_info/time_between_train_steps": 0.003387451171875, "step": 2216} +{"info/global_step": 2217, "train_info/time_within_train_step": 2.6756508350372314, "step": 2217} +{"train_info/time_between_train_steps": 0.003677845001220703, "step": 2217} +{"info/global_step": 2218, "train_info/time_within_train_step": 2.6759445667266846, "step": 2218} +{"train_info/time_between_train_steps": 0.0036361217498779297, "step": 2218} +{"info/global_step": 2219, "train_info/time_within_train_step": 2.675975799560547, "step": 2219} +{"train_info/time_between_train_steps": 0.003882169723510742, "step": 2219} +{"info/global_step": 2220, "train_info/time_within_train_step": 2.6769773960113525, "step": 2220} +{"train_info/time_between_train_steps": 0.0037326812744140625, "step": 2220} +{"info/global_step": 2221, "train_info/time_within_train_step": 2.6756181716918945, "step": 2221} +{"train_info/time_between_train_steps": 0.0036840438842773438, "step": 2221} +{"info/global_step": 2222, "train_info/time_within_train_step": 2.6780312061309814, "step": 2222} +{"train_info/time_between_train_steps": 0.003988504409790039, "step": 2222} +{"info/global_step": 2223, "train_info/time_within_train_step": 2.6777451038360596, "step": 2223} +{"train_info/time_between_train_steps": 0.004126787185668945, "step": 2223} +{"info/global_step": 2224, "train_info/time_within_train_step": 2.678356885910034, "step": 2224} +{"train_info/time_between_train_steps": 0.004082441329956055, "step": 2224} +{"info/global_step": 2225, "train_info/time_within_train_step": 2.679037094116211, "step": 2225} +{"train_info/time_between_train_steps": 0.004254579544067383, "step": 2225} +{"info/global_step": 2226, "train_info/time_within_train_step": 2.678370475769043, "step": 2226} +{"train_info/time_between_train_steps": 0.004046440124511719, "step": 2226} +{"info/global_step": 2227, "train_info/time_within_train_step": 2.677142858505249, "step": 2227} +{"train_info/time_between_train_steps": 0.0040166378021240234, "step": 2227} +{"info/global_step": 2228, "train_info/time_within_train_step": 2.6813931465148926, "step": 2228} +{"train_info/time_between_train_steps": 0.21664881706237793, "step": 2228} +{"info/global_step": 2229, "train_info/time_within_train_step": 2.719552993774414, "step": 2229} +{"train_info/time_between_train_steps": 0.0038580894470214844, "step": 2229} +{"info/global_step": 2230, "train_info/time_within_train_step": 2.6741464138031006, "step": 2230} +{"train_info/time_between_train_steps": 0.0035369396209716797, "step": 2230} +{"info/global_step": 2231, "train_info/time_within_train_step": 2.6744003295898438, "step": 2231} +{"train_info/time_between_train_steps": 0.0036334991455078125, "step": 2231} +{"info/global_step": 2232, "train_info/time_within_train_step": 2.6741418838500977, "step": 2232} +{"train_info/time_between_train_steps": 0.003492593765258789, "step": 2232} +{"info/global_step": 2233, "train_info/time_within_train_step": 2.6749823093414307, "step": 2233} +{"train_info/time_between_train_steps": 0.003607511520385742, "step": 2233} +{"info/global_step": 2234, "train_info/time_within_train_step": 2.6764309406280518, "step": 2234} +{"train_info/time_between_train_steps": 0.0037190914154052734, "step": 2234} +{"info/global_step": 2235, "train_info/time_within_train_step": 2.727694511413574, "step": 2235} +{"train_info/time_between_train_steps": 0.0037336349487304688, "step": 2235} +{"info/global_step": 2236, "train_info/time_within_train_step": 2.6751723289489746, "step": 2236} +{"train_info/time_between_train_steps": 0.003697633743286133, "step": 2236} +{"info/global_step": 2237, "train_info/time_within_train_step": 2.675894021987915, "step": 2237} +{"train_info/time_between_train_steps": 0.003817319869995117, "step": 2237} +{"info/global_step": 2238, "train_info/time_within_train_step": 2.676449775695801, "step": 2238} +{"train_info/time_between_train_steps": 0.003917217254638672, "step": 2238} +{"info/global_step": 2239, "train_info/time_within_train_step": 2.67553973197937, "step": 2239} +{"train_info/time_between_train_steps": 0.003901243209838867, "step": 2239} +{"info/global_step": 2240, "train_info/time_within_train_step": 2.67777156829834, "step": 2240} +{"train_info/time_between_train_steps": 0.003979206085205078, "step": 2240} +{"info/global_step": 2241, "train_info/time_within_train_step": 2.6765832901000977, "step": 2241} +{"train_info/time_between_train_steps": 0.00408625602722168, "step": 2241} +{"info/global_step": 2242, "train_info/time_within_train_step": 2.6757776737213135, "step": 2242} +{"train_info/time_between_train_steps": 0.003740549087524414, "step": 2242} +{"info/global_step": 2243, "train_info/time_within_train_step": 2.675363779067993, "step": 2243} +{"train_info/time_between_train_steps": 0.0038442611694335938, "step": 2243} +{"info/global_step": 2244, "train_info/time_within_train_step": 2.674715757369995, "step": 2244} +{"train_info/time_between_train_steps": 0.003884553909301758, "step": 2244} +{"info/global_step": 2245, "train_info/time_within_train_step": 2.6765191555023193, "step": 2245} +{"train_info/time_between_train_steps": 0.003812551498413086, "step": 2245} +{"info/global_step": 2246, "train_info/time_within_train_step": 2.6752681732177734, "step": 2246} +{"train_info/time_between_train_steps": 0.003890514373779297, "step": 2246} +{"info/global_step": 2247, "train_info/time_within_train_step": 2.675987720489502, "step": 2247} +{"train_info/time_between_train_steps": 0.0037567615509033203, "step": 2247} +{"info/global_step": 2248, "train_info/time_within_train_step": 2.6753652095794678, "step": 2248} +{"train_info/time_between_train_steps": 0.00386810302734375, "step": 2248} +{"info/global_step": 2249, "train_info/time_within_train_step": 2.6769351959228516, "step": 2249} +{"train_info/time_between_train_steps": 0.003955841064453125, "step": 2249} +{"info/global_step": 2250, "train_info/time_within_train_step": 3.2425479888916016, "step": 2250} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746209691, "_runtime": 6463}, "step": 2250} +{"logs": {"train/loss": 4.0301, "train/learning_rate": 0.00016666666666666666, "train/epoch": 2.17, "_timestamp": 1746209691, "_runtime": 6463}, "step": 2250} +{"train_info/time_between_train_steps": 0.024904251098632812, "step": 2250} +{"info/global_step": 2251, "train_info/time_within_train_step": 2.7143962383270264, "step": 2251} +{"train_info/time_between_train_steps": 0.0039255619049072266, "step": 2251} +{"info/global_step": 2252, "train_info/time_within_train_step": 2.6763157844543457, "step": 2252} +{"train_info/time_between_train_steps": 0.003922462463378906, "step": 2252} +{"info/global_step": 2253, "train_info/time_within_train_step": 2.6746866703033447, "step": 2253} +{"train_info/time_between_train_steps": 0.003748178482055664, "step": 2253} +{"info/global_step": 2254, "train_info/time_within_train_step": 2.6728079319000244, "step": 2254} +{"train_info/time_between_train_steps": 0.0037474632263183594, "step": 2254} +{"info/global_step": 2255, "train_info/time_within_train_step": 2.6734838485717773, "step": 2255} +{"train_info/time_between_train_steps": 0.0038056373596191406, "step": 2255} +{"info/global_step": 2256, "train_info/time_within_train_step": 2.6774871349334717, "step": 2256} +{"train_info/time_between_train_steps": 0.003803730010986328, "step": 2256} +{"info/global_step": 2257, "train_info/time_within_train_step": 2.7275924682617188, "step": 2257} +{"train_info/time_between_train_steps": 0.004055500030517578, "step": 2257} +{"info/global_step": 2258, "train_info/time_within_train_step": 2.675821304321289, "step": 2258} +{"train_info/time_between_train_steps": 0.0039174556732177734, "step": 2258} +{"info/global_step": 2259, "train_info/time_within_train_step": 2.6773767471313477, "step": 2259} +{"train_info/time_between_train_steps": 0.0038526058197021484, "step": 2259} +{"info/global_step": 2260, "train_info/time_within_train_step": 2.67805552482605, "step": 2260} +{"train_info/time_between_train_steps": 0.0038657188415527344, "step": 2260} +{"info/global_step": 2261, "train_info/time_within_train_step": 2.677882194519043, "step": 2261} +{"train_info/time_between_train_steps": 0.00398707389831543, "step": 2261} +{"info/global_step": 2262, "train_info/time_within_train_step": 2.679607391357422, "step": 2262} +{"train_info/time_between_train_steps": 0.00403904914855957, "step": 2262} +{"info/global_step": 2263, "train_info/time_within_train_step": 2.674544334411621, "step": 2263} +{"train_info/time_between_train_steps": 0.003786802291870117, "step": 2263} +{"info/global_step": 2264, "train_info/time_within_train_step": 2.6736884117126465, "step": 2264} +{"train_info/time_between_train_steps": 0.004166841506958008, "step": 2264} +{"info/global_step": 2265, "train_info/time_within_train_step": 2.6757259368896484, "step": 2265} +{"train_info/time_between_train_steps": 0.003998517990112305, "step": 2265} +{"info/global_step": 2266, "train_info/time_within_train_step": 2.675344228744507, "step": 2266} +{"train_info/time_between_train_steps": 0.0040857791900634766, "step": 2266} +{"info/global_step": 2267, "train_info/time_within_train_step": 2.6744556427001953, "step": 2267} +{"train_info/time_between_train_steps": 0.004072666168212891, "step": 2267} +{"info/global_step": 2268, "train_info/time_within_train_step": 2.676072835922241, "step": 2268} +{"train_info/time_between_train_steps": 0.0041925907135009766, "step": 2268} +{"info/global_step": 2269, "train_info/time_within_train_step": 2.677443742752075, "step": 2269} +{"train_info/time_between_train_steps": 0.004218339920043945, "step": 2269} +{"info/global_step": 2270, "train_info/time_within_train_step": 2.6765549182891846, "step": 2270} +{"train_info/time_between_train_steps": 0.0038862228393554688, "step": 2270} +{"info/global_step": 2271, "train_info/time_within_train_step": 2.6780643463134766, "step": 2271} +{"train_info/time_between_train_steps": 0.0038099288940429688, "step": 2271} +{"info/global_step": 2272, "train_info/time_within_train_step": 2.675440788269043, "step": 2272} +{"train_info/time_between_train_steps": 0.0038840770721435547, "step": 2272} +{"info/global_step": 2273, "train_info/time_within_train_step": 2.677245855331421, "step": 2273} +{"train_info/time_between_train_steps": 0.0038073062896728516, "step": 2273} +{"info/global_step": 2274, "train_info/time_within_train_step": 2.6738851070404053, "step": 2274} +{"train_info/time_between_train_steps": 0.0038106441497802734, "step": 2274} +{"info/global_step": 2275, "train_info/time_within_train_step": 2.6750893592834473, "step": 2275} +{"train_info/time_between_train_steps": 0.003746509552001953, "step": 2275} +{"info/global_step": 2276, "train_info/time_within_train_step": 2.6740925312042236, "step": 2276} +{"train_info/time_between_train_steps": 0.003869771957397461, "step": 2276} +{"info/global_step": 2277, "train_info/time_within_train_step": 2.6737818717956543, "step": 2277} +{"train_info/time_between_train_steps": 0.0037555694580078125, "step": 2277} +{"info/global_step": 2278, "train_info/time_within_train_step": 2.674827814102173, "step": 2278} +{"train_info/time_between_train_steps": 0.003924131393432617, "step": 2278} +{"info/global_step": 2279, "train_info/time_within_train_step": 2.676060438156128, "step": 2279} +{"train_info/time_between_train_steps": 0.0038814544677734375, "step": 2279} +{"info/global_step": 2280, "train_info/time_within_train_step": 2.727450132369995, "step": 2280} +{"train_info/time_between_train_steps": 0.003425121307373047, "step": 2280} +{"info/global_step": 2281, "train_info/time_within_train_step": 2.6748170852661133, "step": 2281} +{"train_info/time_between_train_steps": 0.003192424774169922, "step": 2281} +{"info/global_step": 2282, "train_info/time_within_train_step": 2.6744942665100098, "step": 2282} +{"train_info/time_between_train_steps": 0.0032606124877929688, "step": 2282} +{"info/global_step": 2283, "train_info/time_within_train_step": 2.6741983890533447, "step": 2283} +{"train_info/time_between_train_steps": 0.003262758255004883, "step": 2283} +{"info/global_step": 2284, "train_info/time_within_train_step": 2.675865650177002, "step": 2284} +{"train_info/time_between_train_steps": 0.003245830535888672, "step": 2284} +{"info/global_step": 2285, "train_info/time_within_train_step": 2.676056146621704, "step": 2285} +{"train_info/time_between_train_steps": 0.003448486328125, "step": 2285} +{"info/global_step": 2286, "train_info/time_within_train_step": 2.6766345500946045, "step": 2286} +{"train_info/time_between_train_steps": 0.0033147335052490234, "step": 2286} +{"info/global_step": 2287, "train_info/time_within_train_step": 2.675687074661255, "step": 2287} +{"train_info/time_between_train_steps": 0.0033719539642333984, "step": 2287} +{"info/global_step": 2288, "train_info/time_within_train_step": 2.676449775695801, "step": 2288} +{"train_info/time_between_train_steps": 0.0033638477325439453, "step": 2288} +{"info/global_step": 2289, "train_info/time_within_train_step": 2.674888849258423, "step": 2289} +{"train_info/time_between_train_steps": 0.003272533416748047, "step": 2289} +{"info/global_step": 2290, "train_info/time_within_train_step": 2.6719157695770264, "step": 2290} +{"train_info/time_between_train_steps": 0.003124713897705078, "step": 2290} +{"info/global_step": 2291, "train_info/time_within_train_step": 2.672616720199585, "step": 2291} +{"train_info/time_between_train_steps": 0.003215789794921875, "step": 2291} +{"info/global_step": 2292, "train_info/time_within_train_step": 2.675734758377075, "step": 2292} +{"train_info/time_between_train_steps": 0.0033082962036132812, "step": 2292} +{"info/global_step": 2293, "train_info/time_within_train_step": 2.6739652156829834, "step": 2293} +{"train_info/time_between_train_steps": 0.003215312957763672, "step": 2293} +{"info/global_step": 2294, "train_info/time_within_train_step": 2.6747806072235107, "step": 2294} +{"train_info/time_between_train_steps": 0.0033142566680908203, "step": 2294} +{"info/global_step": 2295, "train_info/time_within_train_step": 2.6739988327026367, "step": 2295} +{"train_info/time_between_train_steps": 0.0032384395599365234, "step": 2295} +{"info/global_step": 2296, "train_info/time_within_train_step": 2.673565626144409, "step": 2296} +{"train_info/time_between_train_steps": 0.003580808639526367, "step": 2296} +{"info/global_step": 2297, "train_info/time_within_train_step": 2.675421953201294, "step": 2297} +{"train_info/time_between_train_steps": 0.003409862518310547, "step": 2297} +{"info/global_step": 2298, "train_info/time_within_train_step": 2.6740591526031494, "step": 2298} +{"train_info/time_between_train_steps": 0.0033376216888427734, "step": 2298} +{"info/global_step": 2299, "train_info/time_within_train_step": 2.674804925918579, "step": 2299} +{"train_info/time_between_train_steps": 0.0034084320068359375, "step": 2299} +{"info/global_step": 2300, "train_info/time_within_train_step": 2.6747772693634033, "step": 2300} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746209826, "_runtime": 6598}, "step": 2300} +{"logs": {"train/loss": 4.0314, "train/learning_rate": 0.00015555555555555554, "train/epoch": 2.19, "_timestamp": 1746209826, "_runtime": 6598}, "step": 2300} +{"train_info/time_between_train_steps": 13.083020210266113, "step": 2300} +{"info/global_step": 2301, "train_info/time_within_train_step": 2.4801459312438965, "step": 2301} +{"train_info/time_between_train_steps": 0.003682374954223633, "step": 2301} +{"info/global_step": 2302, "train_info/time_within_train_step": 2.862156391143799, "step": 2302} +{"train_info/time_between_train_steps": 0.0031938552856445312, "step": 2302} +{"info/global_step": 2303, "train_info/time_within_train_step": 2.4648144245147705, "step": 2303} +{"train_info/time_between_train_steps": 0.003202199935913086, "step": 2303} +{"info/global_step": 2304, "train_info/time_within_train_step": 2.6363422870635986, "step": 2304} +{"train_info/time_between_train_steps": 0.0033521652221679688, "step": 2304} +{"info/global_step": 2305, "train_info/time_within_train_step": 2.6729893684387207, "step": 2305} +{"train_info/time_between_train_steps": 0.003353118896484375, "step": 2305} +{"info/global_step": 2306, "train_info/time_within_train_step": 2.6729178428649902, "step": 2306} +{"train_info/time_between_train_steps": 0.003318309783935547, "step": 2306} +{"info/global_step": 2307, "train_info/time_within_train_step": 2.673396110534668, "step": 2307} +{"train_info/time_between_train_steps": 0.0033538341522216797, "step": 2307} +{"info/global_step": 2308, "train_info/time_within_train_step": 2.6733930110931396, "step": 2308} +{"train_info/time_between_train_steps": 0.0032339096069335938, "step": 2308} +{"info/global_step": 2309, "train_info/time_within_train_step": 2.674138069152832, "step": 2309} +{"train_info/time_between_train_steps": 0.003267526626586914, "step": 2309} +{"info/global_step": 2310, "train_info/time_within_train_step": 2.6759142875671387, "step": 2310} +{"train_info/time_between_train_steps": 0.003368377685546875, "step": 2310} +{"info/global_step": 2311, "train_info/time_within_train_step": 2.675045967102051, "step": 2311} +{"train_info/time_between_train_steps": 0.0033347606658935547, "step": 2311} +{"info/global_step": 2312, "train_info/time_within_train_step": 2.675157070159912, "step": 2312} +{"train_info/time_between_train_steps": 0.0032787322998046875, "step": 2312} +{"info/global_step": 2313, "train_info/time_within_train_step": 2.6763734817504883, "step": 2313} +{"train_info/time_between_train_steps": 0.0032858848571777344, "step": 2313} +{"info/global_step": 2314, "train_info/time_within_train_step": 2.674802303314209, "step": 2314} +{"train_info/time_between_train_steps": 0.0032758712768554688, "step": 2314} +{"info/global_step": 2315, "train_info/time_within_train_step": 2.675645351409912, "step": 2315} +{"train_info/time_between_train_steps": 0.0033025741577148438, "step": 2315} +{"info/global_step": 2316, "train_info/time_within_train_step": 2.6757426261901855, "step": 2316} +{"train_info/time_between_train_steps": 0.0033130645751953125, "step": 2316} +{"info/global_step": 2317, "train_info/time_within_train_step": 2.6740951538085938, "step": 2317} +{"train_info/time_between_train_steps": 0.0032324790954589844, "step": 2317} +{"info/global_step": 2318, "train_info/time_within_train_step": 2.675323963165283, "step": 2318} +{"train_info/time_between_train_steps": 0.0032701492309570312, "step": 2318} +{"info/global_step": 2319, "train_info/time_within_train_step": 2.6753594875335693, "step": 2319} +{"train_info/time_between_train_steps": 0.003238677978515625, "step": 2319} +{"info/global_step": 2320, "train_info/time_within_train_step": 2.6738781929016113, "step": 2320} +{"train_info/time_between_train_steps": 0.003279447555541992, "step": 2320} +{"info/global_step": 2321, "train_info/time_within_train_step": 2.6757402420043945, "step": 2321} +{"train_info/time_between_train_steps": 0.0033206939697265625, "step": 2321} +{"info/global_step": 2322, "train_info/time_within_train_step": 2.6764259338378906, "step": 2322} +{"train_info/time_between_train_steps": 0.003304004669189453, "step": 2322} +{"info/global_step": 2323, "train_info/time_within_train_step": 2.675682544708252, "step": 2323} +{"train_info/time_between_train_steps": 0.0032205581665039062, "step": 2323} +{"info/global_step": 2324, "train_info/time_within_train_step": 2.674708604812622, "step": 2324} +{"train_info/time_between_train_steps": 0.003300905227661133, "step": 2324} +{"info/global_step": 2325, "train_info/time_within_train_step": 2.674095630645752, "step": 2325} +{"train_info/time_between_train_steps": 0.0032837390899658203, "step": 2325} +{"info/global_step": 2326, "train_info/time_within_train_step": 2.674614191055298, "step": 2326} +{"train_info/time_between_train_steps": 0.0032460689544677734, "step": 2326} +{"info/global_step": 2327, "train_info/time_within_train_step": 2.6734821796417236, "step": 2327} +{"train_info/time_between_train_steps": 0.0032944679260253906, "step": 2327} +{"info/global_step": 2328, "train_info/time_within_train_step": 2.674832582473755, "step": 2328} +{"train_info/time_between_train_steps": 0.003332376480102539, "step": 2328} +{"info/global_step": 2329, "train_info/time_within_train_step": 2.6747732162475586, "step": 2329} +{"train_info/time_between_train_steps": 0.003326416015625, "step": 2329} +{"info/global_step": 2330, "train_info/time_within_train_step": 2.6736483573913574, "step": 2330} +{"train_info/time_between_train_steps": 0.0032563209533691406, "step": 2330} +{"info/global_step": 2331, "train_info/time_within_train_step": 2.6749203205108643, "step": 2331} +{"train_info/time_between_train_steps": 0.003275156021118164, "step": 2331} +{"info/global_step": 2332, "train_info/time_within_train_step": 2.67332124710083, "step": 2332} +{"train_info/time_between_train_steps": 0.003228902816772461, "step": 2332} +{"info/global_step": 2333, "train_info/time_within_train_step": 2.6754567623138428, "step": 2333} +{"train_info/time_between_train_steps": 0.0032892227172851562, "step": 2333} +{"info/global_step": 2334, "train_info/time_within_train_step": 2.674717426300049, "step": 2334} +{"train_info/time_between_train_steps": 0.0033140182495117188, "step": 2334} +{"info/global_step": 2335, "train_info/time_within_train_step": 2.6755752563476562, "step": 2335} +{"train_info/time_between_train_steps": 0.003300905227661133, "step": 2335} +{"info/global_step": 2336, "train_info/time_within_train_step": 2.673893690109253, "step": 2336} +{"train_info/time_between_train_steps": 0.003318309783935547, "step": 2336} +{"info/global_step": 2337, "train_info/time_within_train_step": 2.6750125885009766, "step": 2337} +{"train_info/time_between_train_steps": 0.003263711929321289, "step": 2337} +{"info/global_step": 2338, "train_info/time_within_train_step": 2.6755309104919434, "step": 2338} +{"train_info/time_between_train_steps": 0.003403186798095703, "step": 2338} +{"info/global_step": 2339, "train_info/time_within_train_step": 2.6767780780792236, "step": 2339} +{"train_info/time_between_train_steps": 0.0034041404724121094, "step": 2339} +{"info/global_step": 2340, "train_info/time_within_train_step": 2.67372465133667, "step": 2340} +{"train_info/time_between_train_steps": 0.0032553672790527344, "step": 2340} +{"info/global_step": 2341, "train_info/time_within_train_step": 2.6733920574188232, "step": 2341} +{"train_info/time_between_train_steps": 0.0033102035522460938, "step": 2341} +{"info/global_step": 2342, "train_info/time_within_train_step": 2.6736552715301514, "step": 2342} +{"train_info/time_between_train_steps": 0.0032308101654052734, "step": 2342} +{"info/global_step": 2343, "train_info/time_within_train_step": 2.6738710403442383, "step": 2343} +{"train_info/time_between_train_steps": 0.003331899642944336, "step": 2343} +{"info/global_step": 2344, "train_info/time_within_train_step": 2.6745707988739014, "step": 2344} +{"train_info/time_between_train_steps": 0.003284454345703125, "step": 2344} +{"info/global_step": 2345, "train_info/time_within_train_step": 2.673037052154541, "step": 2345} +{"train_info/time_between_train_steps": 0.003276348114013672, "step": 2345} +{"info/global_step": 2346, "train_info/time_within_train_step": 2.6716437339782715, "step": 2346} +{"train_info/time_between_train_steps": 0.0032393932342529297, "step": 2346} +{"info/global_step": 2347, "train_info/time_within_train_step": 2.6731934547424316, "step": 2347} +{"train_info/time_between_train_steps": 0.003244638442993164, "step": 2347} +{"info/global_step": 2348, "train_info/time_within_train_step": 2.672560214996338, "step": 2348} +{"train_info/time_between_train_steps": 0.003417491912841797, "step": 2348} +{"info/global_step": 2349, "train_info/time_within_train_step": 2.6745259761810303, "step": 2349} +{"train_info/time_between_train_steps": 0.0033864974975585938, "step": 2349} +{"info/global_step": 2350, "train_info/time_within_train_step": 2.6734936237335205, "step": 2350} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746209974, "_runtime": 6746}, "step": 2350} +{"logs": {"train/loss": 4.0048, "train/learning_rate": 0.0001444444444444444, "train/epoch": 2.21, "_timestamp": 1746209974, "_runtime": 6746}, "step": 2350} +{"train_info/time_between_train_steps": 0.02404189109802246, "step": 2350} +{"info/global_step": 2351, "train_info/time_within_train_step": 2.673161029815674, "step": 2351} +{"train_info/time_between_train_steps": 0.00344085693359375, "step": 2351} +{"info/global_step": 2352, "train_info/time_within_train_step": 2.67372989654541, "step": 2352} +{"train_info/time_between_train_steps": 0.003373384475708008, "step": 2352} +{"info/global_step": 2353, "train_info/time_within_train_step": 2.6742098331451416, "step": 2353} +{"train_info/time_between_train_steps": 0.003284931182861328, "step": 2353} +{"info/global_step": 2354, "train_info/time_within_train_step": 2.677748680114746, "step": 2354} +{"train_info/time_between_train_steps": 0.0040874481201171875, "step": 2354} +{"info/global_step": 2355, "train_info/time_within_train_step": 2.67446231842041, "step": 2355} +{"train_info/time_between_train_steps": 0.003325223922729492, "step": 2355} +{"info/global_step": 2356, "train_info/time_within_train_step": 2.6734161376953125, "step": 2356} +{"train_info/time_between_train_steps": 0.0033447742462158203, "step": 2356} +{"info/global_step": 2357, "train_info/time_within_train_step": 2.6770029067993164, "step": 2357} +{"train_info/time_between_train_steps": 0.00424504280090332, "step": 2357} +{"info/global_step": 2358, "train_info/time_within_train_step": 2.6741065979003906, "step": 2358} +{"train_info/time_between_train_steps": 0.0033919811248779297, "step": 2358} +{"info/global_step": 2359, "train_info/time_within_train_step": 2.673931360244751, "step": 2359} +{"train_info/time_between_train_steps": 0.003566265106201172, "step": 2359} +{"info/global_step": 2360, "train_info/time_within_train_step": 2.673929452896118, "step": 2360} +{"train_info/time_between_train_steps": 0.003424406051635742, "step": 2360} +{"info/global_step": 2361, "train_info/time_within_train_step": 2.673447847366333, "step": 2361} +{"train_info/time_between_train_steps": 0.0034286975860595703, "step": 2361} +{"info/global_step": 2362, "train_info/time_within_train_step": 2.674405574798584, "step": 2362} +{"train_info/time_between_train_steps": 0.0033495426177978516, "step": 2362} +{"info/global_step": 2363, "train_info/time_within_train_step": 2.6715657711029053, "step": 2363} +{"train_info/time_between_train_steps": 0.00335693359375, "step": 2363} +{"info/global_step": 2364, "train_info/time_within_train_step": 2.673518419265747, "step": 2364} +{"train_info/time_between_train_steps": 0.0033190250396728516, "step": 2364} +{"info/global_step": 2365, "train_info/time_within_train_step": 2.6714210510253906, "step": 2365} +{"train_info/time_between_train_steps": 0.0032198429107666016, "step": 2365} +{"info/global_step": 2366, "train_info/time_within_train_step": 2.6712942123413086, "step": 2366} +{"train_info/time_between_train_steps": 0.0032455921173095703, "step": 2366} +{"info/global_step": 2367, "train_info/time_within_train_step": 2.6709442138671875, "step": 2367} +{"train_info/time_between_train_steps": 0.0033364295959472656, "step": 2367} +{"info/global_step": 2368, "train_info/time_within_train_step": 2.67354154586792, "step": 2368} +{"train_info/time_between_train_steps": 0.00335693359375, "step": 2368} +{"info/global_step": 2369, "train_info/time_within_train_step": 2.674548387527466, "step": 2369} +{"train_info/time_between_train_steps": 0.003332853317260742, "step": 2369} +{"info/global_step": 2370, "train_info/time_within_train_step": 2.6711175441741943, "step": 2370} +{"train_info/time_between_train_steps": 0.0032052993774414062, "step": 2370} +{"info/global_step": 2371, "train_info/time_within_train_step": 2.6726064682006836, "step": 2371} +{"train_info/time_between_train_steps": 0.003317117691040039, "step": 2371} +{"info/global_step": 2372, "train_info/time_within_train_step": 2.9988503456115723, "step": 2372} +{"train_info/time_between_train_steps": 0.003204822540283203, "step": 2372} +{"info/global_step": 2373, "train_info/time_within_train_step": 2.672837018966675, "step": 2373} +{"train_info/time_between_train_steps": 0.003134012222290039, "step": 2373} +{"info/global_step": 2374, "train_info/time_within_train_step": 2.672041177749634, "step": 2374} +{"train_info/time_between_train_steps": 0.003114938735961914, "step": 2374} +{"info/global_step": 2375, "train_info/time_within_train_step": 2.6722710132598877, "step": 2375} +{"train_info/time_between_train_steps": 0.003082275390625, "step": 2375} +{"info/global_step": 2376, "train_info/time_within_train_step": 2.675215005874634, "step": 2376} +{"train_info/time_between_train_steps": 0.003433704376220703, "step": 2376} +{"info/global_step": 2377, "train_info/time_within_train_step": 2.6743969917297363, "step": 2377} +{"train_info/time_between_train_steps": 0.003336668014526367, "step": 2377} +{"info/global_step": 2378, "train_info/time_within_train_step": 2.6770176887512207, "step": 2378} +{"train_info/time_between_train_steps": 0.003899812698364258, "step": 2378} +{"info/global_step": 2379, "train_info/time_within_train_step": 2.674590587615967, "step": 2379} +{"train_info/time_between_train_steps": 0.0036618709564208984, "step": 2379} +{"info/global_step": 2380, "train_info/time_within_train_step": 2.6753153800964355, "step": 2380} +{"train_info/time_between_train_steps": 0.003730297088623047, "step": 2380} +{"info/global_step": 2381, "train_info/time_within_train_step": 2.6743130683898926, "step": 2381} +{"train_info/time_between_train_steps": 0.003520488739013672, "step": 2381} +{"info/global_step": 2382, "train_info/time_within_train_step": 2.6737985610961914, "step": 2382} +{"train_info/time_between_train_steps": 0.003921985626220703, "step": 2382} +{"info/global_step": 2383, "train_info/time_within_train_step": 2.6757559776306152, "step": 2383} +{"train_info/time_between_train_steps": 0.0037119388580322266, "step": 2383} +{"info/global_step": 2384, "train_info/time_within_train_step": 2.6763522624969482, "step": 2384} +{"train_info/time_between_train_steps": 0.003728151321411133, "step": 2384} +{"info/global_step": 2385, "train_info/time_within_train_step": 2.6756668090820312, "step": 2385} +{"train_info/time_between_train_steps": 0.003732442855834961, "step": 2385} +{"info/global_step": 2386, "train_info/time_within_train_step": 2.7249958515167236, "step": 2386} +{"train_info/time_between_train_steps": 0.0036373138427734375, "step": 2386} +{"info/global_step": 2387, "train_info/time_within_train_step": 2.6754236221313477, "step": 2387} +{"train_info/time_between_train_steps": 0.006784677505493164, "step": 2387} +{"info/global_step": 2388, "train_info/time_within_train_step": 2.675320625305176, "step": 2388} +{"train_info/time_between_train_steps": 0.0033092498779296875, "step": 2388} +{"info/global_step": 2389, "train_info/time_within_train_step": 2.6732540130615234, "step": 2389} +{"train_info/time_between_train_steps": 0.0033500194549560547, "step": 2389} +{"info/global_step": 2390, "train_info/time_within_train_step": 2.6724295616149902, "step": 2390} +{"train_info/time_between_train_steps": 0.003505229949951172, "step": 2390} +{"info/global_step": 2391, "train_info/time_within_train_step": 2.6740477085113525, "step": 2391} +{"train_info/time_between_train_steps": 0.0036814212799072266, "step": 2391} +{"info/global_step": 2392, "train_info/time_within_train_step": 2.6744508743286133, "step": 2392} +{"train_info/time_between_train_steps": 0.003689289093017578, "step": 2392} +{"info/global_step": 2393, "train_info/time_within_train_step": 2.67435622215271, "step": 2393} +{"train_info/time_between_train_steps": 0.0037050247192382812, "step": 2393} +{"info/global_step": 2394, "train_info/time_within_train_step": 2.6738483905792236, "step": 2394} +{"train_info/time_between_train_steps": 0.003688812255859375, "step": 2394} +{"info/global_step": 2395, "train_info/time_within_train_step": 2.6736462116241455, "step": 2395} +{"train_info/time_between_train_steps": 0.0036056041717529297, "step": 2395} +{"info/global_step": 2396, "train_info/time_within_train_step": 2.6727800369262695, "step": 2396} +{"train_info/time_between_train_steps": 0.003372669219970703, "step": 2396} +{"info/global_step": 2397, "train_info/time_within_train_step": 2.6758129596710205, "step": 2397} +{"train_info/time_between_train_steps": 0.0036368370056152344, "step": 2397} +{"info/global_step": 2398, "train_info/time_within_train_step": 2.6755852699279785, "step": 2398} +{"train_info/time_between_train_steps": 0.003632068634033203, "step": 2398} +{"info/global_step": 2399, "train_info/time_within_train_step": 2.6737146377563477, "step": 2399} +{"train_info/time_between_train_steps": 0.003631591796875, "step": 2399} +{"info/global_step": 2400, "train_info/time_within_train_step": 2.6740310192108154, "step": 2400} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746210109, "_runtime": 6881}, "step": 2400} +{"logs": {"train/loss": 3.9918, "train/learning_rate": 0.0001333333333333333, "train/epoch": 2.22, "_timestamp": 1746210109, "_runtime": 6881}, "step": 2400} +{"train_info/time_between_train_steps": 12.853787183761597, "step": 2400} +{"info/global_step": 2401, "train_info/time_within_train_step": 2.4707744121551514, "step": 2401} +{"train_info/time_between_train_steps": 0.003564596176147461, "step": 2401} +{"info/global_step": 2402, "train_info/time_within_train_step": 2.4588265419006348, "step": 2402} +{"train_info/time_between_train_steps": 0.003556489944458008, "step": 2402} +{"info/global_step": 2403, "train_info/time_within_train_step": 2.512676239013672, "step": 2403} +{"train_info/time_between_train_steps": 0.003794431686401367, "step": 2403} +{"info/global_step": 2404, "train_info/time_within_train_step": 2.6694138050079346, "step": 2404} +{"train_info/time_between_train_steps": 0.0036668777465820312, "step": 2404} +{"info/global_step": 2405, "train_info/time_within_train_step": 2.6746110916137695, "step": 2405} +{"train_info/time_between_train_steps": 0.003698587417602539, "step": 2405} +{"info/global_step": 2406, "train_info/time_within_train_step": 2.675936698913574, "step": 2406} +{"train_info/time_between_train_steps": 0.003734111785888672, "step": 2406} +{"info/global_step": 2407, "train_info/time_within_train_step": 2.673536539077759, "step": 2407} +{"train_info/time_between_train_steps": 0.0035250186920166016, "step": 2407} +{"info/global_step": 2408, "train_info/time_within_train_step": 2.6737303733825684, "step": 2408} +{"train_info/time_between_train_steps": 0.003448963165283203, "step": 2408} +{"info/global_step": 2409, "train_info/time_within_train_step": 2.6756606101989746, "step": 2409} +{"train_info/time_between_train_steps": 0.0034570693969726562, "step": 2409} +{"info/global_step": 2410, "train_info/time_within_train_step": 2.675027370452881, "step": 2410} +{"train_info/time_between_train_steps": 0.003514528274536133, "step": 2410} +{"info/global_step": 2411, "train_info/time_within_train_step": 2.674320936203003, "step": 2411} +{"train_info/time_between_train_steps": 0.003517627716064453, "step": 2411} +{"info/global_step": 2412, "train_info/time_within_train_step": 2.986595869064331, "step": 2412} +{"train_info/time_between_train_steps": 0.003164052963256836, "step": 2412} +{"info/global_step": 2413, "train_info/time_within_train_step": 2.672715902328491, "step": 2413} +{"train_info/time_between_train_steps": 0.0031278133392333984, "step": 2413} +{"info/global_step": 2414, "train_info/time_within_train_step": 2.673278570175171, "step": 2414} +{"train_info/time_between_train_steps": 0.0031890869140625, "step": 2414} +{"info/global_step": 2415, "train_info/time_within_train_step": 2.6751906871795654, "step": 2415} +{"train_info/time_between_train_steps": 0.003492593765258789, "step": 2415} +{"info/global_step": 2416, "train_info/time_within_train_step": 2.673611640930176, "step": 2416} +{"train_info/time_between_train_steps": 0.0032808780670166016, "step": 2416} +{"info/global_step": 2417, "train_info/time_within_train_step": 2.6739211082458496, "step": 2417} +{"train_info/time_between_train_steps": 0.003309488296508789, "step": 2417} +{"info/global_step": 2418, "train_info/time_within_train_step": 2.673915147781372, "step": 2418} +{"train_info/time_between_train_steps": 0.0033380985260009766, "step": 2418} +{"info/global_step": 2419, "train_info/time_within_train_step": 2.674715280532837, "step": 2419} +{"train_info/time_between_train_steps": 0.003246307373046875, "step": 2419} +{"info/global_step": 2420, "train_info/time_within_train_step": 2.6741182804107666, "step": 2420} +{"train_info/time_between_train_steps": 0.0032329559326171875, "step": 2420} +{"info/global_step": 2421, "train_info/time_within_train_step": 2.67413592338562, "step": 2421} +{"train_info/time_between_train_steps": 0.0031757354736328125, "step": 2421} +{"info/global_step": 2422, "train_info/time_within_train_step": 2.6735482215881348, "step": 2422} +{"train_info/time_between_train_steps": 0.0032165050506591797, "step": 2422} +{"info/global_step": 2423, "train_info/time_within_train_step": 2.6752817630767822, "step": 2423} +{"train_info/time_between_train_steps": 0.003347635269165039, "step": 2423} +{"info/global_step": 2424, "train_info/time_within_train_step": 2.675293207168579, "step": 2424} +{"train_info/time_between_train_steps": 0.003384828567504883, "step": 2424} +{"info/global_step": 2425, "train_info/time_within_train_step": 2.6755292415618896, "step": 2425} +{"train_info/time_between_train_steps": 0.003244161605834961, "step": 2425} +{"info/global_step": 2426, "train_info/time_within_train_step": 2.7255876064300537, "step": 2426} +{"train_info/time_between_train_steps": 0.0033507347106933594, "step": 2426} +{"info/global_step": 2427, "train_info/time_within_train_step": 2.67505145072937, "step": 2427} +{"train_info/time_between_train_steps": 0.0032491683959960938, "step": 2427} +{"info/global_step": 2428, "train_info/time_within_train_step": 2.674346446990967, "step": 2428} +{"train_info/time_between_train_steps": 0.003240346908569336, "step": 2428} +{"info/global_step": 2429, "train_info/time_within_train_step": 2.6756174564361572, "step": 2429} +{"train_info/time_between_train_steps": 0.0034079551696777344, "step": 2429} +{"info/global_step": 2430, "train_info/time_within_train_step": 2.6756105422973633, "step": 2430} +{"train_info/time_between_train_steps": 0.0032587051391601562, "step": 2430} +{"info/global_step": 2431, "train_info/time_within_train_step": 2.6741669178009033, "step": 2431} +{"train_info/time_between_train_steps": 0.003308534622192383, "step": 2431} +{"info/global_step": 2432, "train_info/time_within_train_step": 2.6751513481140137, "step": 2432} +{"train_info/time_between_train_steps": 0.0033245086669921875, "step": 2432} +{"info/global_step": 2433, "train_info/time_within_train_step": 2.674464702606201, "step": 2433} +{"train_info/time_between_train_steps": 0.0033202171325683594, "step": 2433} +{"info/global_step": 2434, "train_info/time_within_train_step": 2.674738883972168, "step": 2434} +{"train_info/time_between_train_steps": 0.003258228302001953, "step": 2434} +{"info/global_step": 2435, "train_info/time_within_train_step": 2.6749720573425293, "step": 2435} +{"train_info/time_between_train_steps": 0.0033745765686035156, "step": 2435} +{"info/global_step": 2436, "train_info/time_within_train_step": 2.6739590167999268, "step": 2436} +{"train_info/time_between_train_steps": 0.0033037662506103516, "step": 2436} +{"info/global_step": 2437, "train_info/time_within_train_step": 2.6746201515197754, "step": 2437} +{"train_info/time_between_train_steps": 0.0033075809478759766, "step": 2437} +{"info/global_step": 2438, "train_info/time_within_train_step": 2.676231622695923, "step": 2438} +{"train_info/time_between_train_steps": 0.003242015838623047, "step": 2438} +{"info/global_step": 2439, "train_info/time_within_train_step": 2.674175500869751, "step": 2439} +{"train_info/time_between_train_steps": 0.0032329559326171875, "step": 2439} +{"info/global_step": 2440, "train_info/time_within_train_step": 2.6749613285064697, "step": 2440} +{"train_info/time_between_train_steps": 0.0032682418823242188, "step": 2440} +{"info/global_step": 2441, "train_info/time_within_train_step": 2.6738739013671875, "step": 2441} +{"train_info/time_between_train_steps": 0.0034313201904296875, "step": 2441} +{"info/global_step": 2442, "train_info/time_within_train_step": 2.673809051513672, "step": 2442} +{"train_info/time_between_train_steps": 0.0031843185424804688, "step": 2442} +{"info/global_step": 2443, "train_info/time_within_train_step": 2.6740994453430176, "step": 2443} +{"train_info/time_between_train_steps": 0.0031843185424804688, "step": 2443} +{"info/global_step": 2444, "train_info/time_within_train_step": 2.6753039360046387, "step": 2444} +{"train_info/time_between_train_steps": 0.0033257007598876953, "step": 2444} +{"info/global_step": 2445, "train_info/time_within_train_step": 2.673358201980591, "step": 2445} +{"train_info/time_between_train_steps": 0.003222942352294922, "step": 2445} +{"info/global_step": 2446, "train_info/time_within_train_step": 2.67372989654541, "step": 2446} +{"train_info/time_between_train_steps": 0.003141164779663086, "step": 2446} +{"info/global_step": 2447, "train_info/time_within_train_step": 2.6738786697387695, "step": 2447} +{"train_info/time_between_train_steps": 0.0032019615173339844, "step": 2447} +{"info/global_step": 2448, "train_info/time_within_train_step": 2.6752731800079346, "step": 2448} +{"train_info/time_between_train_steps": 0.003248453140258789, "step": 2448} +{"info/global_step": 2449, "train_info/time_within_train_step": 2.6763062477111816, "step": 2449} +{"train_info/time_between_train_steps": 0.0032951831817626953, "step": 2449} +{"info/global_step": 2450, "train_info/time_within_train_step": 2.6748433113098145, "step": 2450} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746210257, "_runtime": 7029}, "step": 2450} +{"logs": {"train/loss": 3.9806, "train/learning_rate": 0.00012222222222222221, "train/epoch": 2.24, "_timestamp": 1746210257, "_runtime": 7029}, "step": 2450} +{"train_info/time_between_train_steps": 0.024102449417114258, "step": 2450} +{"info/global_step": 2451, "train_info/time_within_train_step": 2.67466402053833, "step": 2451} +{"train_info/time_between_train_steps": 0.003302335739135742, "step": 2451} +{"info/global_step": 2452, "train_info/time_within_train_step": 2.6760518550872803, "step": 2452} +{"train_info/time_between_train_steps": 0.0031578540802001953, "step": 2452} +{"info/global_step": 2453, "train_info/time_within_train_step": 2.676468849182129, "step": 2453} +{"train_info/time_between_train_steps": 0.0033342838287353516, "step": 2453} +{"info/global_step": 2454, "train_info/time_within_train_step": 2.6767475605010986, "step": 2454} +{"train_info/time_between_train_steps": 0.0032880306243896484, "step": 2454} +{"info/global_step": 2455, "train_info/time_within_train_step": 2.6764578819274902, "step": 2455} +{"train_info/time_between_train_steps": 0.0032868385314941406, "step": 2455} +{"info/global_step": 2456, "train_info/time_within_train_step": 2.675769805908203, "step": 2456} +{"train_info/time_between_train_steps": 0.003222227096557617, "step": 2456} +{"info/global_step": 2457, "train_info/time_within_train_step": 2.675632953643799, "step": 2457} +{"train_info/time_between_train_steps": 0.0032892227172851562, "step": 2457} +{"info/global_step": 2458, "train_info/time_within_train_step": 2.6759369373321533, "step": 2458} +{"train_info/time_between_train_steps": 0.0033833980560302734, "step": 2458} +{"info/global_step": 2459, "train_info/time_within_train_step": 2.6747491359710693, "step": 2459} +{"train_info/time_between_train_steps": 0.0032820701599121094, "step": 2459} +{"info/global_step": 2460, "train_info/time_within_train_step": 2.674755096435547, "step": 2460} +{"train_info/time_between_train_steps": 0.003354310989379883, "step": 2460} +{"info/global_step": 2461, "train_info/time_within_train_step": 2.6754226684570312, "step": 2461} +{"train_info/time_between_train_steps": 0.0032889842987060547, "step": 2461} +{"info/global_step": 2462, "train_info/time_within_train_step": 2.673858404159546, "step": 2462} +{"train_info/time_between_train_steps": 0.0032651424407958984, "step": 2462} +{"info/global_step": 2463, "train_info/time_within_train_step": 2.6761136054992676, "step": 2463} +{"train_info/time_between_train_steps": 0.0032584667205810547, "step": 2463} +{"info/global_step": 2464, "train_info/time_within_train_step": 2.6746885776519775, "step": 2464} +{"train_info/time_between_train_steps": 0.003354310989379883, "step": 2464} +{"info/global_step": 2465, "train_info/time_within_train_step": 2.6750667095184326, "step": 2465} +{"train_info/time_between_train_steps": 0.0034050941467285156, "step": 2465} +{"info/global_step": 2466, "train_info/time_within_train_step": 2.675473690032959, "step": 2466} +{"train_info/time_between_train_steps": 0.003412008285522461, "step": 2466} +{"info/global_step": 2467, "train_info/time_within_train_step": 2.6748099327087402, "step": 2467} +{"train_info/time_between_train_steps": 0.0033800601959228516, "step": 2467} +{"info/global_step": 2468, "train_info/time_within_train_step": 2.676154613494873, "step": 2468} +{"train_info/time_between_train_steps": 0.0034334659576416016, "step": 2468} +{"info/global_step": 2469, "train_info/time_within_train_step": 2.675708770751953, "step": 2469} +{"train_info/time_between_train_steps": 0.003366708755493164, "step": 2469} +{"info/global_step": 2470, "train_info/time_within_train_step": 2.6755874156951904, "step": 2470} +{"train_info/time_between_train_steps": 0.003606557846069336, "step": 2470} +{"info/global_step": 2471, "train_info/time_within_train_step": 2.67486310005188, "step": 2471} +{"train_info/time_between_train_steps": 0.0036704540252685547, "step": 2471} +{"info/global_step": 2472, "train_info/time_within_train_step": 2.676363706588745, "step": 2472} +{"train_info/time_between_train_steps": 0.003582000732421875, "step": 2472} +{"info/global_step": 2473, "train_info/time_within_train_step": 2.6745169162750244, "step": 2473} +{"train_info/time_between_train_steps": 0.0035102367401123047, "step": 2473} +{"info/global_step": 2474, "train_info/time_within_train_step": 2.6757972240448, "step": 2474} +{"train_info/time_between_train_steps": 0.003632783889770508, "step": 2474} +{"info/global_step": 2475, "train_info/time_within_train_step": 2.676229953765869, "step": 2475} +{"train_info/time_between_train_steps": 0.0035991668701171875, "step": 2475} +{"info/global_step": 2476, "train_info/time_within_train_step": 2.676372766494751, "step": 2476} +{"train_info/time_between_train_steps": 0.00460052490234375, "step": 2476} +{"info/global_step": 2477, "train_info/time_within_train_step": 2.676879405975342, "step": 2477} +{"train_info/time_between_train_steps": 0.0034902095794677734, "step": 2477} +{"info/global_step": 2478, "train_info/time_within_train_step": 2.676950216293335, "step": 2478} +{"train_info/time_between_train_steps": 0.0035314559936523438, "step": 2478} +{"info/global_step": 2479, "train_info/time_within_train_step": 2.6752703189849854, "step": 2479} +{"train_info/time_between_train_steps": 0.0032911300659179688, "step": 2479} +{"info/global_step": 2480, "train_info/time_within_train_step": 2.6757490634918213, "step": 2480} +{"train_info/time_between_train_steps": 0.0033731460571289062, "step": 2480} +{"info/global_step": 2481, "train_info/time_within_train_step": 2.6754941940307617, "step": 2481} +{"train_info/time_between_train_steps": 0.003294229507446289, "step": 2481} +{"info/global_step": 2482, "train_info/time_within_train_step": 2.6748368740081787, "step": 2482} +{"train_info/time_between_train_steps": 0.0032444000244140625, "step": 2482} +{"info/global_step": 2483, "train_info/time_within_train_step": 2.6744771003723145, "step": 2483} +{"train_info/time_between_train_steps": 0.003347158432006836, "step": 2483} +{"info/global_step": 2484, "train_info/time_within_train_step": 2.674453020095825, "step": 2484} +{"train_info/time_between_train_steps": 0.0033826828002929688, "step": 2484} +{"info/global_step": 2485, "train_info/time_within_train_step": 2.676227569580078, "step": 2485} +{"train_info/time_between_train_steps": 0.003348112106323242, "step": 2485} +{"info/global_step": 2486, "train_info/time_within_train_step": 2.674414873123169, "step": 2486} +{"train_info/time_between_train_steps": 0.003237485885620117, "step": 2486} +{"info/global_step": 2487, "train_info/time_within_train_step": 2.6755077838897705, "step": 2487} +{"train_info/time_between_train_steps": 0.003369569778442383, "step": 2487} +{"info/global_step": 2488, "train_info/time_within_train_step": 2.6750242710113525, "step": 2488} +{"train_info/time_between_train_steps": 0.0032777786254882812, "step": 2488} +{"info/global_step": 2489, "train_info/time_within_train_step": 2.6761856079101562, "step": 2489} +{"train_info/time_between_train_steps": 0.0033164024353027344, "step": 2489} +{"info/global_step": 2490, "train_info/time_within_train_step": 2.674321174621582, "step": 2490} +{"train_info/time_between_train_steps": 0.0032906532287597656, "step": 2490} +{"info/global_step": 2491, "train_info/time_within_train_step": 2.676804304122925, "step": 2491} +{"train_info/time_between_train_steps": 0.003274202346801758, "step": 2491} +{"info/global_step": 2492, "train_info/time_within_train_step": 2.6756093502044678, "step": 2492} +{"train_info/time_between_train_steps": 0.0032286643981933594, "step": 2492} +{"info/global_step": 2493, "train_info/time_within_train_step": 2.6766724586486816, "step": 2493} +{"train_info/time_between_train_steps": 0.003232240676879883, "step": 2493} +{"info/global_step": 2494, "train_info/time_within_train_step": 2.6743850708007812, "step": 2494} +{"train_info/time_between_train_steps": 0.0032117366790771484, "step": 2494} +{"info/global_step": 2495, "train_info/time_within_train_step": 2.674945831298828, "step": 2495} +{"train_info/time_between_train_steps": 0.003224611282348633, "step": 2495} +{"info/global_step": 2496, "train_info/time_within_train_step": 2.675564765930176, "step": 2496} +{"train_info/time_between_train_steps": 0.0032134056091308594, "step": 2496} +{"info/global_step": 2497, "train_info/time_within_train_step": 2.6748011112213135, "step": 2497} +{"train_info/time_between_train_steps": 0.0033292770385742188, "step": 2497} +{"info/global_step": 2498, "train_info/time_within_train_step": 2.6743674278259277, "step": 2498} +{"train_info/time_between_train_steps": 0.003209829330444336, "step": 2498} +{"info/global_step": 2499, "train_info/time_within_train_step": 2.673780918121338, "step": 2499} +{"train_info/time_between_train_steps": 0.006435394287109375, "step": 2499} +{"info/global_step": 2500, "train_info/time_within_train_step": 3.23264479637146, "step": 2500} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746210392, "_runtime": 7164}, "step": 2500} +{"logs": {"train/loss": 3.9673, "train/learning_rate": 0.00011111111111111109, "train/epoch": 2.26, "_timestamp": 1746210392, "_runtime": 7164}, "step": 2500} +{"train_info/time_between_train_steps": 13.736678838729858, "step": 2500} +{"info/global_step": 2501, "train_info/time_within_train_step": 2.472421169281006, "step": 2501} +{"train_info/time_between_train_steps": 0.003180265426635742, "step": 2501} +{"info/global_step": 2502, "train_info/time_within_train_step": 2.4577410221099854, "step": 2502} +{"train_info/time_between_train_steps": 0.0031349658966064453, "step": 2502} +{"info/global_step": 2503, "train_info/time_within_train_step": 2.4694762229919434, "step": 2503} +{"train_info/time_between_train_steps": 0.0031991004943847656, "step": 2503} +{"info/global_step": 2504, "train_info/time_within_train_step": 2.7749457359313965, "step": 2504} +{"train_info/time_between_train_steps": 0.0030241012573242188, "step": 2504} +{"info/global_step": 2505, "train_info/time_within_train_step": 2.673896074295044, "step": 2505} +{"train_info/time_between_train_steps": 0.003200531005859375, "step": 2505} +{"info/global_step": 2506, "train_info/time_within_train_step": 2.6729278564453125, "step": 2506} +{"train_info/time_between_train_steps": 0.003092527389526367, "step": 2506} +{"info/global_step": 2507, "train_info/time_within_train_step": 2.673285722732544, "step": 2507} +{"train_info/time_between_train_steps": 0.003099203109741211, "step": 2507} +{"info/global_step": 2508, "train_info/time_within_train_step": 2.6750402450561523, "step": 2508} +{"train_info/time_between_train_steps": 0.0031566619873046875, "step": 2508} +{"info/global_step": 2509, "train_info/time_within_train_step": 2.67340350151062, "step": 2509} +{"train_info/time_between_train_steps": 0.003131389617919922, "step": 2509} +{"info/global_step": 2510, "train_info/time_within_train_step": 2.72391414642334, "step": 2510} +{"train_info/time_between_train_steps": 0.0032706260681152344, "step": 2510} +{"info/global_step": 2511, "train_info/time_within_train_step": 2.673905611038208, "step": 2511} +{"train_info/time_between_train_steps": 0.003209829330444336, "step": 2511} +{"info/global_step": 2512, "train_info/time_within_train_step": 2.673278331756592, "step": 2512} +{"train_info/time_between_train_steps": 0.003196239471435547, "step": 2512} +{"info/global_step": 2513, "train_info/time_within_train_step": 2.67317271232605, "step": 2513} +{"train_info/time_between_train_steps": 0.0032269954681396484, "step": 2513} +{"info/global_step": 2514, "train_info/time_within_train_step": 2.673278570175171, "step": 2514} +{"train_info/time_between_train_steps": 0.003190279006958008, "step": 2514} +{"info/global_step": 2515, "train_info/time_within_train_step": 2.6718571186065674, "step": 2515} +{"train_info/time_between_train_steps": 0.0031280517578125, "step": 2515} +{"info/global_step": 2516, "train_info/time_within_train_step": 2.674288034439087, "step": 2516} +{"train_info/time_between_train_steps": 0.0032634735107421875, "step": 2516} +{"info/global_step": 2517, "train_info/time_within_train_step": 2.673772096633911, "step": 2517} +{"train_info/time_between_train_steps": 0.003124237060546875, "step": 2517} +{"info/global_step": 2518, "train_info/time_within_train_step": 2.674041271209717, "step": 2518} +{"train_info/time_between_train_steps": 0.003170013427734375, "step": 2518} +{"info/global_step": 2519, "train_info/time_within_train_step": 2.674496650695801, "step": 2519} +{"train_info/time_between_train_steps": 0.003107786178588867, "step": 2519} +{"info/global_step": 2520, "train_info/time_within_train_step": 2.6747171878814697, "step": 2520} +{"train_info/time_between_train_steps": 0.0031042098999023438, "step": 2520} +{"info/global_step": 2521, "train_info/time_within_train_step": 2.6753427982330322, "step": 2521} +{"train_info/time_between_train_steps": 0.0031499862670898438, "step": 2521} +{"info/global_step": 2522, "train_info/time_within_train_step": 2.6725621223449707, "step": 2522} +{"train_info/time_between_train_steps": 0.003141164779663086, "step": 2522} +{"info/global_step": 2523, "train_info/time_within_train_step": 2.6737284660339355, "step": 2523} +{"train_info/time_between_train_steps": 0.003082752227783203, "step": 2523} +{"info/global_step": 2524, "train_info/time_within_train_step": 2.673799991607666, "step": 2524} +{"train_info/time_between_train_steps": 0.0031337738037109375, "step": 2524} +{"info/global_step": 2525, "train_info/time_within_train_step": 2.673274278640747, "step": 2525} +{"train_info/time_between_train_steps": 0.006365299224853516, "step": 2525} +{"info/global_step": 2526, "train_info/time_within_train_step": 2.6754117012023926, "step": 2526} +{"train_info/time_between_train_steps": 0.0063512325286865234, "step": 2526} +{"info/global_step": 2527, "train_info/time_within_train_step": 2.6772336959838867, "step": 2527} +{"train_info/time_between_train_steps": 0.0030846595764160156, "step": 2527} +{"info/global_step": 2528, "train_info/time_within_train_step": 2.6733291149139404, "step": 2528} +{"train_info/time_between_train_steps": 0.006193637847900391, "step": 2528} +{"info/global_step": 2529, "train_info/time_within_train_step": 2.6740217208862305, "step": 2529} +{"train_info/time_between_train_steps": 0.006256103515625, "step": 2529} +{"info/global_step": 2530, "train_info/time_within_train_step": 2.672708511352539, "step": 2530} +{"train_info/time_between_train_steps": 0.0030739307403564453, "step": 2530} +{"info/global_step": 2531, "train_info/time_within_train_step": 2.6737115383148193, "step": 2531} +{"train_info/time_between_train_steps": 0.0030753612518310547, "step": 2531} +{"info/global_step": 2532, "train_info/time_within_train_step": 2.6735568046569824, "step": 2532} +{"train_info/time_between_train_steps": 0.003055572509765625, "step": 2532} +{"info/global_step": 2533, "train_info/time_within_train_step": 2.672914505004883, "step": 2533} +{"train_info/time_between_train_steps": 0.0031914710998535156, "step": 2533} +{"info/global_step": 2534, "train_info/time_within_train_step": 2.673044204711914, "step": 2534} +{"train_info/time_between_train_steps": 0.003101348876953125, "step": 2534} +{"info/global_step": 2535, "train_info/time_within_train_step": 2.6727969646453857, "step": 2535} +{"train_info/time_between_train_steps": 0.0030815601348876953, "step": 2535} +{"info/global_step": 2536, "train_info/time_within_train_step": 2.673436164855957, "step": 2536} +{"train_info/time_between_train_steps": 0.0030705928802490234, "step": 2536} +{"info/global_step": 2537, "train_info/time_within_train_step": 2.672220230102539, "step": 2537} +{"train_info/time_between_train_steps": 0.0031328201293945312, "step": 2537} +{"info/global_step": 2538, "train_info/time_within_train_step": 2.672430992126465, "step": 2538} +{"train_info/time_between_train_steps": 0.003130197525024414, "step": 2538} +{"info/global_step": 2539, "train_info/time_within_train_step": 2.6740968227386475, "step": 2539} +{"train_info/time_between_train_steps": 0.0030858516693115234, "step": 2539} +{"info/global_step": 2540, "train_info/time_within_train_step": 2.6729583740234375, "step": 2540} +{"train_info/time_between_train_steps": 0.003150463104248047, "step": 2540} +{"info/global_step": 2541, "train_info/time_within_train_step": 2.7582435607910156, "step": 2541} +{"train_info/time_between_train_steps": 0.0030999183654785156, "step": 2541} +{"info/global_step": 2542, "train_info/time_within_train_step": 2.6727824211120605, "step": 2542} +{"train_info/time_between_train_steps": 0.002978086471557617, "step": 2542} +{"info/global_step": 2543, "train_info/time_within_train_step": 2.671576499938965, "step": 2543} +{"train_info/time_between_train_steps": 0.002955198287963867, "step": 2543} +{"info/global_step": 2544, "train_info/time_within_train_step": 2.6727211475372314, "step": 2544} +{"train_info/time_between_train_steps": 0.002991914749145508, "step": 2544} +{"info/global_step": 2545, "train_info/time_within_train_step": 2.671295642852783, "step": 2545} +{"train_info/time_between_train_steps": 0.0030274391174316406, "step": 2545} +{"info/global_step": 2546, "train_info/time_within_train_step": 2.670830488204956, "step": 2546} +{"train_info/time_between_train_steps": 0.0029289722442626953, "step": 2546} +{"info/global_step": 2547, "train_info/time_within_train_step": 2.672510862350464, "step": 2547} +{"train_info/time_between_train_steps": 0.002971649169921875, "step": 2547} +{"info/global_step": 2548, "train_info/time_within_train_step": 2.672435760498047, "step": 2548} +{"train_info/time_between_train_steps": 0.0030372142791748047, "step": 2548} +{"info/global_step": 2549, "train_info/time_within_train_step": 2.6723291873931885, "step": 2549} +{"train_info/time_between_train_steps": 0.0030448436737060547, "step": 2549} +{"info/global_step": 2550, "train_info/time_within_train_step": 2.6724112033843994, "step": 2550} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746210541, "_runtime": 7313}, "step": 2550} +{"logs": {"train/loss": 3.9575, "train/learning_rate": 9.999999999999999e-05, "train/epoch": 2.27, "_timestamp": 1746210541, "_runtime": 7313}, "step": 2550} +{"train_info/time_between_train_steps": 0.023311376571655273, "step": 2550} +{"info/global_step": 2551, "train_info/time_within_train_step": 2.6712403297424316, "step": 2551} +{"train_info/time_between_train_steps": 0.003183126449584961, "step": 2551} +{"info/global_step": 2552, "train_info/time_within_train_step": 2.6712381839752197, "step": 2552} +{"train_info/time_between_train_steps": 0.0030846595764160156, "step": 2552} +{"info/global_step": 2553, "train_info/time_within_train_step": 2.6709511280059814, "step": 2553} +{"train_info/time_between_train_steps": 0.003054380416870117, "step": 2553} +{"info/global_step": 2554, "train_info/time_within_train_step": 2.670224666595459, "step": 2554} +{"train_info/time_between_train_steps": 0.0029671192169189453, "step": 2554} +{"info/global_step": 2555, "train_info/time_within_train_step": 2.6698555946350098, "step": 2555} +{"train_info/time_between_train_steps": 0.0029747486114501953, "step": 2555} +{"info/global_step": 2556, "train_info/time_within_train_step": 2.6712863445281982, "step": 2556} +{"train_info/time_between_train_steps": 0.003075838088989258, "step": 2556} +{"info/global_step": 2557, "train_info/time_within_train_step": 2.6718947887420654, "step": 2557} +{"train_info/time_between_train_steps": 0.0030515193939208984, "step": 2557} +{"info/global_step": 2558, "train_info/time_within_train_step": 2.671717882156372, "step": 2558} +{"train_info/time_between_train_steps": 0.0030374526977539062, "step": 2558} +{"info/global_step": 2559, "train_info/time_within_train_step": 2.671414375305176, "step": 2559} +{"train_info/time_between_train_steps": 0.003072023391723633, "step": 2559} +{"info/global_step": 2560, "train_info/time_within_train_step": 2.671355724334717, "step": 2560} +{"train_info/time_between_train_steps": 0.003103017807006836, "step": 2560} +{"info/global_step": 2561, "train_info/time_within_train_step": 2.6729815006256104, "step": 2561} +{"train_info/time_between_train_steps": 0.0031251907348632812, "step": 2561} +{"info/global_step": 2562, "train_info/time_within_train_step": 2.6730103492736816, "step": 2562} +{"train_info/time_between_train_steps": 0.0030226707458496094, "step": 2562} +{"info/global_step": 2563, "train_info/time_within_train_step": 2.6729178428649902, "step": 2563} +{"train_info/time_between_train_steps": 0.0031311511993408203, "step": 2563} +{"info/global_step": 2564, "train_info/time_within_train_step": 2.6736302375793457, "step": 2564} +{"train_info/time_between_train_steps": 0.003102540969848633, "step": 2564} +{"info/global_step": 2565, "train_info/time_within_train_step": 2.6722540855407715, "step": 2565} +{"train_info/time_between_train_steps": 0.003042459487915039, "step": 2565} +{"info/global_step": 2566, "train_info/time_within_train_step": 2.670680046081543, "step": 2566} +{"train_info/time_between_train_steps": 0.003020763397216797, "step": 2566} +{"info/global_step": 2567, "train_info/time_within_train_step": 2.669672727584839, "step": 2567} +{"train_info/time_between_train_steps": 0.0030524730682373047, "step": 2567} +{"info/global_step": 2568, "train_info/time_within_train_step": 2.669635534286499, "step": 2568} +{"train_info/time_between_train_steps": 0.00304412841796875, "step": 2568} +{"info/global_step": 2569, "train_info/time_within_train_step": 2.6704790592193604, "step": 2569} +{"train_info/time_between_train_steps": 0.00299072265625, "step": 2569} +{"info/global_step": 2570, "train_info/time_within_train_step": 2.670903205871582, "step": 2570} +{"train_info/time_between_train_steps": 0.0030493736267089844, "step": 2570} +{"info/global_step": 2571, "train_info/time_within_train_step": 2.671005964279175, "step": 2571} +{"train_info/time_between_train_steps": 0.0031425952911376953, "step": 2571} +{"info/global_step": 2572, "train_info/time_within_train_step": 2.6705827713012695, "step": 2572} +{"train_info/time_between_train_steps": 0.0031719207763671875, "step": 2572} +{"info/global_step": 2573, "train_info/time_within_train_step": 2.6720640659332275, "step": 2573} +{"train_info/time_between_train_steps": 0.0031588077545166016, "step": 2573} +{"info/global_step": 2574, "train_info/time_within_train_step": 2.672450304031372, "step": 2574} +{"train_info/time_between_train_steps": 0.003202676773071289, "step": 2574} +{"info/global_step": 2575, "train_info/time_within_train_step": 2.671769857406616, "step": 2575} +{"train_info/time_between_train_steps": 0.003158092498779297, "step": 2575} +{"info/global_step": 2576, "train_info/time_within_train_step": 2.6718122959136963, "step": 2576} +{"train_info/time_between_train_steps": 0.0031719207763671875, "step": 2576} +{"info/global_step": 2577, "train_info/time_within_train_step": 2.7254903316497803, "step": 2577} +{"train_info/time_between_train_steps": 0.003344297409057617, "step": 2577} +{"info/global_step": 2578, "train_info/time_within_train_step": 2.6758439540863037, "step": 2578} +{"train_info/time_between_train_steps": 0.003286600112915039, "step": 2578} +{"info/global_step": 2579, "train_info/time_within_train_step": 2.674528121948242, "step": 2579} +{"train_info/time_between_train_steps": 0.003130674362182617, "step": 2579} +{"info/global_step": 2580, "train_info/time_within_train_step": 2.6719751358032227, "step": 2580} +{"train_info/time_between_train_steps": 0.003329038619995117, "step": 2580} +{"info/global_step": 2581, "train_info/time_within_train_step": 2.6711113452911377, "step": 2581} +{"train_info/time_between_train_steps": 0.003271818161010742, "step": 2581} +{"info/global_step": 2582, "train_info/time_within_train_step": 2.6729228496551514, "step": 2582} +{"train_info/time_between_train_steps": 0.0033516883850097656, "step": 2582} +{"info/global_step": 2583, "train_info/time_within_train_step": 2.671794891357422, "step": 2583} +{"train_info/time_between_train_steps": 0.003486156463623047, "step": 2583} +{"info/global_step": 2584, "train_info/time_within_train_step": 2.6733510494232178, "step": 2584} +{"train_info/time_between_train_steps": 0.0032525062561035156, "step": 2584} +{"info/global_step": 2585, "train_info/time_within_train_step": 2.6741139888763428, "step": 2585} +{"train_info/time_between_train_steps": 0.0036072731018066406, "step": 2585} +{"info/global_step": 2586, "train_info/time_within_train_step": 2.675304651260376, "step": 2586} +{"train_info/time_between_train_steps": 0.003511667251586914, "step": 2586} +{"info/global_step": 2587, "train_info/time_within_train_step": 2.675203323364258, "step": 2587} +{"train_info/time_between_train_steps": 0.0035724639892578125, "step": 2587} +{"info/global_step": 2588, "train_info/time_within_train_step": 2.6745481491088867, "step": 2588} +{"train_info/time_between_train_steps": 0.003495931625366211, "step": 2588} +{"info/global_step": 2589, "train_info/time_within_train_step": 2.675438165664673, "step": 2589} +{"train_info/time_between_train_steps": 0.0035982131958007812, "step": 2589} +{"info/global_step": 2590, "train_info/time_within_train_step": 2.6752169132232666, "step": 2590} +{"train_info/time_between_train_steps": 0.0035147666931152344, "step": 2590} +{"info/global_step": 2591, "train_info/time_within_train_step": 2.673825979232788, "step": 2591} +{"train_info/time_between_train_steps": 0.0035982131958007812, "step": 2591} +{"info/global_step": 2592, "train_info/time_within_train_step": 2.673553228378296, "step": 2592} +{"train_info/time_between_train_steps": 0.00331878662109375, "step": 2592} +{"train_info/time_between_train_steps": 2.578963279724121, "step": 2592} +{"info/global_step": 2593, "train_info/time_within_train_step": 2.5900046825408936, "step": 2593} +{"train_info/time_between_train_steps": 0.0032548904418945312, "step": 2593} +{"info/global_step": 2594, "train_info/time_within_train_step": 2.672269821166992, "step": 2594} +{"train_info/time_between_train_steps": 0.0032362937927246094, "step": 2594} +{"info/global_step": 2595, "train_info/time_within_train_step": 2.673154354095459, "step": 2595} +{"train_info/time_between_train_steps": 0.003311634063720703, "step": 2595} +{"info/global_step": 2596, "train_info/time_within_train_step": 2.675387144088745, "step": 2596} +{"train_info/time_between_train_steps": 0.003262758255004883, "step": 2596} +{"info/global_step": 2597, "train_info/time_within_train_step": 2.6726131439208984, "step": 2597} +{"train_info/time_between_train_steps": 0.003195047378540039, "step": 2597} +{"info/global_step": 2598, "train_info/time_within_train_step": 2.6725986003875732, "step": 2598} +{"train_info/time_between_train_steps": 0.0032901763916015625, "step": 2598} +{"info/global_step": 2599, "train_info/time_within_train_step": 2.6743874549865723, "step": 2599} +{"train_info/time_between_train_steps": 0.003357410430908203, "step": 2599} +{"info/global_step": 2600, "train_info/time_within_train_step": 2.6742475032806396, "step": 2600} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746210678, "_runtime": 7450}, "step": 2600} +{"logs": {"train/loss": 3.9602, "train/learning_rate": 8.888888888888888e-05, "train/epoch": 3.0, "_timestamp": 1746210678, "_runtime": 7450}, "step": 2600} +{"train_info/time_between_train_steps": 13.187776565551758, "step": 2600} +{"info/global_step": 2601, "train_info/time_within_train_step": 2.4755032062530518, "step": 2601} +{"train_info/time_between_train_steps": 0.0032444000244140625, "step": 2601} +{"info/global_step": 2602, "train_info/time_within_train_step": 2.459609270095825, "step": 2602} +{"train_info/time_between_train_steps": 0.0034399032592773438, "step": 2602} +{"info/global_step": 2603, "train_info/time_within_train_step": 2.522960662841797, "step": 2603} +{"train_info/time_between_train_steps": 0.003376483917236328, "step": 2603} +{"info/global_step": 2604, "train_info/time_within_train_step": 2.670532703399658, "step": 2604} +{"train_info/time_between_train_steps": 0.004011392593383789, "step": 2604} +{"info/global_step": 2605, "train_info/time_within_train_step": 2.676786184310913, "step": 2605} +{"train_info/time_between_train_steps": 0.0039033889770507812, "step": 2605} +{"info/global_step": 2606, "train_info/time_within_train_step": 2.672912359237671, "step": 2606} +{"train_info/time_between_train_steps": 0.0036339759826660156, "step": 2606} +{"info/global_step": 2607, "train_info/time_within_train_step": 2.6734719276428223, "step": 2607} +{"train_info/time_between_train_steps": 0.0036242008209228516, "step": 2607} +{"info/global_step": 2608, "train_info/time_within_train_step": 2.675945520401001, "step": 2608} +{"train_info/time_between_train_steps": 0.0036525726318359375, "step": 2608} +{"info/global_step": 2609, "train_info/time_within_train_step": 2.6762712001800537, "step": 2609} +{"train_info/time_between_train_steps": 0.0035104751586914062, "step": 2609} +{"info/global_step": 2610, "train_info/time_within_train_step": 2.677239179611206, "step": 2610} +{"train_info/time_between_train_steps": 0.0035805702209472656, "step": 2610} +{"info/global_step": 2611, "train_info/time_within_train_step": 2.678382396697998, "step": 2611} +{"train_info/time_between_train_steps": 0.003601551055908203, "step": 2611} +{"info/global_step": 2612, "train_info/time_within_train_step": 2.678570032119751, "step": 2612} +{"train_info/time_between_train_steps": 0.003562450408935547, "step": 2612} +{"info/global_step": 2613, "train_info/time_within_train_step": 2.676090717315674, "step": 2613} +{"train_info/time_between_train_steps": 0.0035037994384765625, "step": 2613} +{"info/global_step": 2614, "train_info/time_within_train_step": 2.6785247325897217, "step": 2614} +{"train_info/time_between_train_steps": 0.00359344482421875, "step": 2614} +{"info/global_step": 2615, "train_info/time_within_train_step": 2.675851583480835, "step": 2615} +{"train_info/time_between_train_steps": 0.00354766845703125, "step": 2615} +{"info/global_step": 2616, "train_info/time_within_train_step": 2.7262580394744873, "step": 2616} +{"train_info/time_between_train_steps": 0.0035429000854492188, "step": 2616} +{"info/global_step": 2617, "train_info/time_within_train_step": 2.675971508026123, "step": 2617} +{"train_info/time_between_train_steps": 0.003605365753173828, "step": 2617} +{"info/global_step": 2618, "train_info/time_within_train_step": 2.674084186553955, "step": 2618} +{"train_info/time_between_train_steps": 0.0035026073455810547, "step": 2618} +{"info/global_step": 2619, "train_info/time_within_train_step": 2.675248384475708, "step": 2619} +{"train_info/time_between_train_steps": 0.003509521484375, "step": 2619} +{"info/global_step": 2620, "train_info/time_within_train_step": 2.6737797260284424, "step": 2620} +{"train_info/time_between_train_steps": 0.003550291061401367, "step": 2620} +{"info/global_step": 2621, "train_info/time_within_train_step": 2.6762609481811523, "step": 2621} +{"train_info/time_between_train_steps": 0.007187366485595703, "step": 2621} +{"info/global_step": 2622, "train_info/time_within_train_step": 2.6777384281158447, "step": 2622} +{"train_info/time_between_train_steps": 0.007051944732666016, "step": 2622} +{"info/global_step": 2623, "train_info/time_within_train_step": 2.677461862564087, "step": 2623} +{"train_info/time_between_train_steps": 0.007096529006958008, "step": 2623} +{"info/global_step": 2624, "train_info/time_within_train_step": 2.6769564151763916, "step": 2624} +{"train_info/time_between_train_steps": 0.0036101341247558594, "step": 2624} +{"info/global_step": 2625, "train_info/time_within_train_step": 2.677908420562744, "step": 2625} +{"train_info/time_between_train_steps": 0.0035860538482666016, "step": 2625} +{"info/global_step": 2626, "train_info/time_within_train_step": 2.6751317977905273, "step": 2626} +{"train_info/time_between_train_steps": 0.003603219985961914, "step": 2626} +{"info/global_step": 2627, "train_info/time_within_train_step": 2.675471305847168, "step": 2627} +{"train_info/time_between_train_steps": 0.007032871246337891, "step": 2627} +{"info/global_step": 2628, "train_info/time_within_train_step": 2.675558567047119, "step": 2628} +{"train_info/time_between_train_steps": 0.007046699523925781, "step": 2628} +{"info/global_step": 2629, "train_info/time_within_train_step": 2.6758499145507812, "step": 2629} +{"train_info/time_between_train_steps": 0.007168292999267578, "step": 2629} +{"info/global_step": 2630, "train_info/time_within_train_step": 3.0048677921295166, "step": 2630} +{"train_info/time_between_train_steps": 0.006340503692626953, "step": 2630} +{"info/global_step": 2631, "train_info/time_within_train_step": 2.678539514541626, "step": 2631} +{"train_info/time_between_train_steps": 0.0033380985260009766, "step": 2631} +{"info/global_step": 2632, "train_info/time_within_train_step": 2.675870656967163, "step": 2632} +{"train_info/time_between_train_steps": 0.0033910274505615234, "step": 2632} +{"info/global_step": 2633, "train_info/time_within_train_step": 2.6756417751312256, "step": 2633} +{"train_info/time_between_train_steps": 0.003423452377319336, "step": 2633} +{"info/global_step": 2634, "train_info/time_within_train_step": 2.67622447013855, "step": 2634} +{"train_info/time_between_train_steps": 0.006688356399536133, "step": 2634} +{"info/global_step": 2635, "train_info/time_within_train_step": 2.6756365299224854, "step": 2635} +{"train_info/time_between_train_steps": 0.0033152103424072266, "step": 2635} +{"info/global_step": 2636, "train_info/time_within_train_step": 2.6792187690734863, "step": 2636} +{"train_info/time_between_train_steps": 0.0033981800079345703, "step": 2636} +{"info/global_step": 2637, "train_info/time_within_train_step": 2.675025224685669, "step": 2637} +{"train_info/time_between_train_steps": 0.0033278465270996094, "step": 2637} +{"info/global_step": 2638, "train_info/time_within_train_step": 2.6755259037017822, "step": 2638} +{"train_info/time_between_train_steps": 0.003364086151123047, "step": 2638} +{"info/global_step": 2639, "train_info/time_within_train_step": 2.682382583618164, "step": 2639} +{"train_info/time_between_train_steps": 0.003372669219970703, "step": 2639} +{"info/global_step": 2640, "train_info/time_within_train_step": 2.6789886951446533, "step": 2640} +{"train_info/time_between_train_steps": 0.0036268234252929688, "step": 2640} +{"info/global_step": 2641, "train_info/time_within_train_step": 2.6765127182006836, "step": 2641} +{"train_info/time_between_train_steps": 0.003485441207885742, "step": 2641} +{"info/global_step": 2642, "train_info/time_within_train_step": 2.6755664348602295, "step": 2642} +{"train_info/time_between_train_steps": 0.003564596176147461, "step": 2642} +{"info/global_step": 2643, "train_info/time_within_train_step": 2.678276777267456, "step": 2643} +{"train_info/time_between_train_steps": 0.003735065460205078, "step": 2643} +{"info/global_step": 2644, "train_info/time_within_train_step": 2.676274061203003, "step": 2644} +{"train_info/time_between_train_steps": 0.0035390853881835938, "step": 2644} +{"info/global_step": 2645, "train_info/time_within_train_step": 2.676387310028076, "step": 2645} +{"train_info/time_between_train_steps": 0.0035626888275146484, "step": 2645} +{"info/global_step": 2646, "train_info/time_within_train_step": 2.675788402557373, "step": 2646} +{"train_info/time_between_train_steps": 0.0069997310638427734, "step": 2646} +{"info/global_step": 2647, "train_info/time_within_train_step": 2.676781415939331, "step": 2647} +{"train_info/time_between_train_steps": 0.00699162483215332, "step": 2647} +{"info/global_step": 2648, "train_info/time_within_train_step": 2.6753480434417725, "step": 2648} +{"train_info/time_between_train_steps": 0.006963014602661133, "step": 2648} +{"info/global_step": 2649, "train_info/time_within_train_step": 2.673266649246216, "step": 2649} +{"train_info/time_between_train_steps": 0.0069599151611328125, "step": 2649} +{"info/global_step": 2650, "train_info/time_within_train_step": 2.673179864883423, "step": 2650} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746210826, "_runtime": 7598}, "step": 2650} +{"logs": {"train/loss": 3.9136, "train/learning_rate": 7.777777777777777e-05, "train/epoch": 3.02, "_timestamp": 1746210826, "_runtime": 7598}, "step": 2650} +{"train_info/time_between_train_steps": 0.025639772415161133, "step": 2650} +{"info/global_step": 2651, "train_info/time_within_train_step": 2.6744861602783203, "step": 2651} +{"train_info/time_between_train_steps": 0.0035409927368164062, "step": 2651} +{"info/global_step": 2652, "train_info/time_within_train_step": 2.674013614654541, "step": 2652} +{"train_info/time_between_train_steps": 0.003536701202392578, "step": 2652} +{"info/global_step": 2653, "train_info/time_within_train_step": 2.674095869064331, "step": 2653} +{"train_info/time_between_train_steps": 0.003615856170654297, "step": 2653} +{"info/global_step": 2654, "train_info/time_within_train_step": 2.6732213497161865, "step": 2654} +{"train_info/time_between_train_steps": 0.003532886505126953, "step": 2654} +{"info/global_step": 2655, "train_info/time_within_train_step": 2.838862657546997, "step": 2655} +{"train_info/time_between_train_steps": 0.0033800601959228516, "step": 2655} +{"info/global_step": 2656, "train_info/time_within_train_step": 2.6756432056427, "step": 2656} +{"train_info/time_between_train_steps": 0.003369569778442383, "step": 2656} +{"info/global_step": 2657, "train_info/time_within_train_step": 2.679539680480957, "step": 2657} +{"train_info/time_between_train_steps": 0.0034956932067871094, "step": 2657} +{"info/global_step": 2658, "train_info/time_within_train_step": 2.6755030155181885, "step": 2658} +{"train_info/time_between_train_steps": 0.0034503936767578125, "step": 2658} +{"info/global_step": 2659, "train_info/time_within_train_step": 2.6744918823242188, "step": 2659} +{"train_info/time_between_train_steps": 0.003602743148803711, "step": 2659} +{"info/global_step": 2660, "train_info/time_within_train_step": 2.673985481262207, "step": 2660} +{"train_info/time_between_train_steps": 0.0034704208374023438, "step": 2660} +{"info/global_step": 2661, "train_info/time_within_train_step": 2.6755788326263428, "step": 2661} +{"train_info/time_between_train_steps": 0.0036132335662841797, "step": 2661} +{"info/global_step": 2662, "train_info/time_within_train_step": 2.677898406982422, "step": 2662} +{"train_info/time_between_train_steps": 0.003638029098510742, "step": 2662} +{"info/global_step": 2663, "train_info/time_within_train_step": 2.6773831844329834, "step": 2663} +{"train_info/time_between_train_steps": 0.0037283897399902344, "step": 2663} +{"info/global_step": 2664, "train_info/time_within_train_step": 2.6755101680755615, "step": 2664} +{"train_info/time_between_train_steps": 0.003574848175048828, "step": 2664} +{"info/global_step": 2665, "train_info/time_within_train_step": 2.6761722564697266, "step": 2665} +{"train_info/time_between_train_steps": 0.003572225570678711, "step": 2665} +{"info/global_step": 2666, "train_info/time_within_train_step": 2.673788547515869, "step": 2666} +{"train_info/time_between_train_steps": 0.0034618377685546875, "step": 2666} +{"info/global_step": 2667, "train_info/time_within_train_step": 2.672536849975586, "step": 2667} +{"train_info/time_between_train_steps": 0.0035021305084228516, "step": 2667} +{"info/global_step": 2668, "train_info/time_within_train_step": 2.6728742122650146, "step": 2668} +{"train_info/time_between_train_steps": 0.0035691261291503906, "step": 2668} +{"info/global_step": 2669, "train_info/time_within_train_step": 2.993419647216797, "step": 2669} +{"train_info/time_between_train_steps": 0.003319978713989258, "step": 2669} +{"info/global_step": 2670, "train_info/time_within_train_step": 2.673675537109375, "step": 2670} +{"train_info/time_between_train_steps": 0.003317594528198242, "step": 2670} +{"info/global_step": 2671, "train_info/time_within_train_step": 2.672431468963623, "step": 2671} +{"train_info/time_between_train_steps": 0.003491640090942383, "step": 2671} +{"info/global_step": 2672, "train_info/time_within_train_step": 2.6714229583740234, "step": 2672} +{"train_info/time_between_train_steps": 0.0033559799194335938, "step": 2672} +{"info/global_step": 2673, "train_info/time_within_train_step": 2.6780824661254883, "step": 2673} +{"train_info/time_between_train_steps": 0.0035109519958496094, "step": 2673} +{"info/global_step": 2674, "train_info/time_within_train_step": 2.6725590229034424, "step": 2674} +{"train_info/time_between_train_steps": 0.0033349990844726562, "step": 2674} +{"info/global_step": 2675, "train_info/time_within_train_step": 2.6713006496429443, "step": 2675} +{"train_info/time_between_train_steps": 0.003299236297607422, "step": 2675} +{"info/global_step": 2676, "train_info/time_within_train_step": 2.6725032329559326, "step": 2676} +{"train_info/time_between_train_steps": 0.003320455551147461, "step": 2676} +{"info/global_step": 2677, "train_info/time_within_train_step": 2.671800136566162, "step": 2677} +{"train_info/time_between_train_steps": 0.006613254547119141, "step": 2677} +{"info/global_step": 2678, "train_info/time_within_train_step": 2.6727967262268066, "step": 2678} +{"train_info/time_between_train_steps": 0.006639242172241211, "step": 2678} +{"info/global_step": 2679, "train_info/time_within_train_step": 2.672818899154663, "step": 2679} +{"train_info/time_between_train_steps": 0.006651401519775391, "step": 2679} +{"info/global_step": 2680, "train_info/time_within_train_step": 2.6724581718444824, "step": 2680} +{"train_info/time_between_train_steps": 0.006593227386474609, "step": 2680} +{"info/global_step": 2681, "train_info/time_within_train_step": 2.672515630722046, "step": 2681} +{"train_info/time_between_train_steps": 0.00667572021484375, "step": 2681} +{"info/global_step": 2682, "train_info/time_within_train_step": 2.6728575229644775, "step": 2682} +{"train_info/time_between_train_steps": 0.006546735763549805, "step": 2682} +{"info/global_step": 2683, "train_info/time_within_train_step": 2.673027515411377, "step": 2683} +{"train_info/time_between_train_steps": 0.006590127944946289, "step": 2683} +{"info/global_step": 2684, "train_info/time_within_train_step": 2.6716833114624023, "step": 2684} +{"train_info/time_between_train_steps": 0.006595611572265625, "step": 2684} +{"info/global_step": 2685, "train_info/time_within_train_step": 2.67250394821167, "step": 2685} +{"train_info/time_between_train_steps": 0.006674051284790039, "step": 2685} +{"info/global_step": 2686, "train_info/time_within_train_step": 2.6727454662323, "step": 2686} +{"train_info/time_between_train_steps": 0.0033435821533203125, "step": 2686} +{"info/global_step": 2687, "train_info/time_within_train_step": 2.6740024089813232, "step": 2687} +{"train_info/time_between_train_steps": 0.0034797191619873047, "step": 2687} +{"info/global_step": 2688, "train_info/time_within_train_step": 2.6735169887542725, "step": 2688} +{"train_info/time_between_train_steps": 0.0033490657806396484, "step": 2688} +{"info/global_step": 2689, "train_info/time_within_train_step": 2.671706199645996, "step": 2689} +{"train_info/time_between_train_steps": 0.003470897674560547, "step": 2689} +{"info/global_step": 2690, "train_info/time_within_train_step": 2.6782803535461426, "step": 2690} +{"train_info/time_between_train_steps": 0.003614187240600586, "step": 2690} +{"info/global_step": 2691, "train_info/time_within_train_step": 2.673063039779663, "step": 2691} +{"train_info/time_between_train_steps": 0.003467082977294922, "step": 2691} +{"info/global_step": 2692, "train_info/time_within_train_step": 2.6730401515960693, "step": 2692} +{"train_info/time_between_train_steps": 0.0035457611083984375, "step": 2692} +{"info/global_step": 2693, "train_info/time_within_train_step": 2.672390937805176, "step": 2693} +{"train_info/time_between_train_steps": 0.003506898880004883, "step": 2693} +{"info/global_step": 2694, "train_info/time_within_train_step": 2.673560857772827, "step": 2694} +{"train_info/time_between_train_steps": 0.0034971237182617188, "step": 2694} +{"info/global_step": 2695, "train_info/time_within_train_step": 2.6728498935699463, "step": 2695} +{"train_info/time_between_train_steps": 0.003459453582763672, "step": 2695} +{"info/global_step": 2696, "train_info/time_within_train_step": 2.6736674308776855, "step": 2696} +{"train_info/time_between_train_steps": 0.0034432411193847656, "step": 2696} +{"info/global_step": 2697, "train_info/time_within_train_step": 2.6716370582580566, "step": 2697} +{"train_info/time_between_train_steps": 0.0034508705139160156, "step": 2697} +{"info/global_step": 2698, "train_info/time_within_train_step": 2.6732282638549805, "step": 2698} +{"train_info/time_between_train_steps": 0.003473997116088867, "step": 2698} +{"info/global_step": 2699, "train_info/time_within_train_step": 2.671057939529419, "step": 2699} +{"train_info/time_between_train_steps": 0.0034704208374023438, "step": 2699} +{"info/global_step": 2700, "train_info/time_within_train_step": 2.672283887863159, "step": 2700} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746210961, "_runtime": 7733}, "step": 2700} +{"logs": {"train/loss": 3.9075, "train/learning_rate": 6.666666666666666e-05, "train/epoch": 3.04, "_timestamp": 1746210961, "_runtime": 7733}, "step": 2700} +{"train_info/time_between_train_steps": 12.87118911743164, "step": 2700} +{"info/global_step": 2701, "train_info/time_within_train_step": 2.4929678440093994, "step": 2701} +{"train_info/time_between_train_steps": 0.0039691925048828125, "step": 2701} +{"info/global_step": 2702, "train_info/time_within_train_step": 2.4614689350128174, "step": 2702} +{"train_info/time_between_train_steps": 0.003966808319091797, "step": 2702} +{"info/global_step": 2703, "train_info/time_within_train_step": 2.5194060802459717, "step": 2703} +{"train_info/time_between_train_steps": 0.003477811813354492, "step": 2703} +{"info/global_step": 2704, "train_info/time_within_train_step": 2.670443534851074, "step": 2704} +{"train_info/time_between_train_steps": 0.003555774688720703, "step": 2704} +{"info/global_step": 2705, "train_info/time_within_train_step": 2.674022674560547, "step": 2705} +{"train_info/time_between_train_steps": 0.0038309097290039062, "step": 2705} +{"info/global_step": 2706, "train_info/time_within_train_step": 2.674555540084839, "step": 2706} +{"train_info/time_between_train_steps": 0.0035140514373779297, "step": 2706} +{"info/global_step": 2707, "train_info/time_within_train_step": 2.6734886169433594, "step": 2707} +{"train_info/time_between_train_steps": 0.0035049915313720703, "step": 2707} +{"info/global_step": 2708, "train_info/time_within_train_step": 2.6741862297058105, "step": 2708} +{"train_info/time_between_train_steps": 0.003623485565185547, "step": 2708} +{"info/global_step": 2709, "train_info/time_within_train_step": 2.675609827041626, "step": 2709} +{"train_info/time_between_train_steps": 0.0034689903259277344, "step": 2709} +{"info/global_step": 2710, "train_info/time_within_train_step": 2.6744465827941895, "step": 2710} +{"train_info/time_between_train_steps": 0.0034880638122558594, "step": 2710} +{"info/global_step": 2711, "train_info/time_within_train_step": 2.6760928630828857, "step": 2711} +{"train_info/time_between_train_steps": 0.0034570693969726562, "step": 2711} +{"info/global_step": 2712, "train_info/time_within_train_step": 2.676387071609497, "step": 2712} +{"train_info/time_between_train_steps": 0.003681659698486328, "step": 2712} +{"info/global_step": 2713, "train_info/time_within_train_step": 2.6752002239227295, "step": 2713} +{"train_info/time_between_train_steps": 0.003494739532470703, "step": 2713} +{"info/global_step": 2714, "train_info/time_within_train_step": 2.6759722232818604, "step": 2714} +{"train_info/time_between_train_steps": 0.003518342971801758, "step": 2714} +{"info/global_step": 2715, "train_info/time_within_train_step": 2.675107002258301, "step": 2715} +{"train_info/time_between_train_steps": 0.003564119338989258, "step": 2715} +{"info/global_step": 2716, "train_info/time_within_train_step": 2.6751201152801514, "step": 2716} +{"train_info/time_between_train_steps": 0.00697779655456543, "step": 2716} +{"info/global_step": 2717, "train_info/time_within_train_step": 2.6749207973480225, "step": 2717} +{"train_info/time_between_train_steps": 0.21589326858520508, "step": 2717} +{"info/global_step": 2718, "train_info/time_within_train_step": 2.693588972091675, "step": 2718} +{"train_info/time_between_train_steps": 0.00341796875, "step": 2718} +{"info/global_step": 2719, "train_info/time_within_train_step": 2.67549729347229, "step": 2719} +{"train_info/time_between_train_steps": 0.0034034252166748047, "step": 2719} +{"info/global_step": 2720, "train_info/time_within_train_step": 2.675032377243042, "step": 2720} +{"train_info/time_between_train_steps": 0.003394603729248047, "step": 2720} +{"info/global_step": 2721, "train_info/time_within_train_step": 2.674302339553833, "step": 2721} +{"train_info/time_between_train_steps": 0.0033278465270996094, "step": 2721} +{"info/global_step": 2722, "train_info/time_within_train_step": 2.6752142906188965, "step": 2722} +{"train_info/time_between_train_steps": 0.003386259078979492, "step": 2722} +{"info/global_step": 2723, "train_info/time_within_train_step": 2.6739962100982666, "step": 2723} +{"train_info/time_between_train_steps": 0.0035212039947509766, "step": 2723} +{"info/global_step": 2724, "train_info/time_within_train_step": 2.6745409965515137, "step": 2724} +{"train_info/time_between_train_steps": 0.0033686161041259766, "step": 2724} +{"info/global_step": 2725, "train_info/time_within_train_step": 2.6744885444641113, "step": 2725} +{"train_info/time_between_train_steps": 0.003379344940185547, "step": 2725} +{"info/global_step": 2726, "train_info/time_within_train_step": 2.6749513149261475, "step": 2726} +{"train_info/time_between_train_steps": 0.0034036636352539062, "step": 2726} +{"info/global_step": 2727, "train_info/time_within_train_step": 2.674334764480591, "step": 2727} +{"train_info/time_between_train_steps": 0.0033817291259765625, "step": 2727} +{"info/global_step": 2728, "train_info/time_within_train_step": 2.6744801998138428, "step": 2728} +{"train_info/time_between_train_steps": 0.003359079360961914, "step": 2728} +{"info/global_step": 2729, "train_info/time_within_train_step": 2.6739983558654785, "step": 2729} +{"train_info/time_between_train_steps": 0.0033881664276123047, "step": 2729} +{"info/global_step": 2730, "train_info/time_within_train_step": 2.6741390228271484, "step": 2730} +{"train_info/time_between_train_steps": 0.0035886764526367188, "step": 2730} +{"info/global_step": 2731, "train_info/time_within_train_step": 2.6740312576293945, "step": 2731} +{"train_info/time_between_train_steps": 0.0036361217498779297, "step": 2731} +{"info/global_step": 2732, "train_info/time_within_train_step": 2.675128221511841, "step": 2732} +{"train_info/time_between_train_steps": 0.003529071807861328, "step": 2732} +{"info/global_step": 2733, "train_info/time_within_train_step": 2.6734378337860107, "step": 2733} +{"train_info/time_between_train_steps": 0.0036220550537109375, "step": 2733} +{"info/global_step": 2734, "train_info/time_within_train_step": 3.0035758018493652, "step": 2734} +{"train_info/time_between_train_steps": 0.003282785415649414, "step": 2734} +{"info/global_step": 2735, "train_info/time_within_train_step": 2.6740314960479736, "step": 2735} +{"train_info/time_between_train_steps": 0.003404378890991211, "step": 2735} +{"info/global_step": 2736, "train_info/time_within_train_step": 2.674121379852295, "step": 2736} +{"train_info/time_between_train_steps": 0.0037758350372314453, "step": 2736} +{"info/global_step": 2737, "train_info/time_within_train_step": 2.6773903369903564, "step": 2737} +{"train_info/time_between_train_steps": 0.0033426284790039062, "step": 2737} +{"info/global_step": 2738, "train_info/time_within_train_step": 2.6737728118896484, "step": 2738} +{"train_info/time_between_train_steps": 0.0032873153686523438, "step": 2738} +{"info/global_step": 2739, "train_info/time_within_train_step": 2.6737120151519775, "step": 2739} +{"train_info/time_between_train_steps": 0.003262042999267578, "step": 2739} +{"info/global_step": 2740, "train_info/time_within_train_step": 2.6752727031707764, "step": 2740} +{"train_info/time_between_train_steps": 0.0033059120178222656, "step": 2740} +{"info/global_step": 2741, "train_info/time_within_train_step": 2.674527645111084, "step": 2741} +{"train_info/time_between_train_steps": 0.0033960342407226562, "step": 2741} +{"info/global_step": 2742, "train_info/time_within_train_step": 2.6749765872955322, "step": 2742} +{"train_info/time_between_train_steps": 0.0033905506134033203, "step": 2742} +{"info/global_step": 2743, "train_info/time_within_train_step": 2.674582004547119, "step": 2743} +{"train_info/time_between_train_steps": 0.003326416015625, "step": 2743} +{"info/global_step": 2744, "train_info/time_within_train_step": 2.6740314960479736, "step": 2744} +{"train_info/time_between_train_steps": 0.003337860107421875, "step": 2744} +{"info/global_step": 2745, "train_info/time_within_train_step": 2.6746270656585693, "step": 2745} +{"train_info/time_between_train_steps": 0.0033071041107177734, "step": 2745} +{"info/global_step": 2746, "train_info/time_within_train_step": 2.674398422241211, "step": 2746} +{"train_info/time_between_train_steps": 0.0033559799194335938, "step": 2746} +{"info/global_step": 2747, "train_info/time_within_train_step": 2.6748552322387695, "step": 2747} +{"train_info/time_between_train_steps": 0.0034699440002441406, "step": 2747} +{"info/global_step": 2748, "train_info/time_within_train_step": 2.675527811050415, "step": 2748} +{"train_info/time_between_train_steps": 0.003367900848388672, "step": 2748} +{"info/global_step": 2749, "train_info/time_within_train_step": 2.674278736114502, "step": 2749} +{"train_info/time_between_train_steps": 0.003473043441772461, "step": 2749} +{"info/global_step": 2750, "train_info/time_within_train_step": 3.251624584197998, "step": 2750} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746211110, "_runtime": 7882}, "step": 2750} +{"logs": {"train/loss": 3.9042, "train/learning_rate": 5.5555555555555545e-05, "train/epoch": 3.05, "_timestamp": 1746211110, "_runtime": 7882}, "step": 2750} +{"train_info/time_between_train_steps": 0.02387690544128418, "step": 2750} +{"info/global_step": 2751, "train_info/time_within_train_step": 2.674778461456299, "step": 2751} +{"train_info/time_between_train_steps": 0.003354787826538086, "step": 2751} +{"info/global_step": 2752, "train_info/time_within_train_step": 2.678969383239746, "step": 2752} +{"train_info/time_between_train_steps": 0.0033295154571533203, "step": 2752} +{"info/global_step": 2753, "train_info/time_within_train_step": 2.6757984161376953, "step": 2753} +{"train_info/time_between_train_steps": 0.0033915042877197266, "step": 2753} +{"info/global_step": 2754, "train_info/time_within_train_step": 2.674525737762451, "step": 2754} +{"train_info/time_between_train_steps": 0.0032830238342285156, "step": 2754} +{"info/global_step": 2755, "train_info/time_within_train_step": 2.674636125564575, "step": 2755} +{"train_info/time_between_train_steps": 0.0034122467041015625, "step": 2755} +{"info/global_step": 2756, "train_info/time_within_train_step": 2.6736037731170654, "step": 2756} +{"train_info/time_between_train_steps": 0.0033762454986572266, "step": 2756} +{"info/global_step": 2757, "train_info/time_within_train_step": 2.6735031604766846, "step": 2757} +{"train_info/time_between_train_steps": 0.0035440921783447266, "step": 2757} +{"info/global_step": 2758, "train_info/time_within_train_step": 2.674912691116333, "step": 2758} +{"train_info/time_between_train_steps": 0.0038318634033203125, "step": 2758} +{"info/global_step": 2759, "train_info/time_within_train_step": 2.675346612930298, "step": 2759} +{"train_info/time_between_train_steps": 0.003498554229736328, "step": 2759} +{"info/global_step": 2760, "train_info/time_within_train_step": 2.674945592880249, "step": 2760} +{"train_info/time_between_train_steps": 0.003674745559692383, "step": 2760} +{"info/global_step": 2761, "train_info/time_within_train_step": 2.6747477054595947, "step": 2761} +{"train_info/time_between_train_steps": 0.003503084182739258, "step": 2761} +{"info/global_step": 2762, "train_info/time_within_train_step": 2.673832416534424, "step": 2762} +{"train_info/time_between_train_steps": 0.0035724639892578125, "step": 2762} +{"info/global_step": 2763, "train_info/time_within_train_step": 2.6750636100769043, "step": 2763} +{"train_info/time_between_train_steps": 0.003461599349975586, "step": 2763} +{"info/global_step": 2764, "train_info/time_within_train_step": 2.6737184524536133, "step": 2764} +{"train_info/time_between_train_steps": 0.003542184829711914, "step": 2764} +{"info/global_step": 2765, "train_info/time_within_train_step": 2.6743218898773193, "step": 2765} +{"train_info/time_between_train_steps": 0.0034286975860595703, "step": 2765} +{"info/global_step": 2766, "train_info/time_within_train_step": 2.6739652156829834, "step": 2766} +{"train_info/time_between_train_steps": 0.0034711360931396484, "step": 2766} +{"info/global_step": 2767, "train_info/time_within_train_step": 2.7230496406555176, "step": 2767} +{"train_info/time_between_train_steps": 0.003506898880004883, "step": 2767} +{"info/global_step": 2768, "train_info/time_within_train_step": 2.6713712215423584, "step": 2768} +{"train_info/time_between_train_steps": 0.0034589767456054688, "step": 2768} +{"info/global_step": 2769, "train_info/time_within_train_step": 2.6730501651763916, "step": 2769} +{"train_info/time_between_train_steps": 0.003522157669067383, "step": 2769} +{"info/global_step": 2770, "train_info/time_within_train_step": 2.672323703765869, "step": 2770} +{"train_info/time_between_train_steps": 0.003521442413330078, "step": 2770} +{"info/global_step": 2771, "train_info/time_within_train_step": 2.6727824211120605, "step": 2771} +{"train_info/time_between_train_steps": 0.003466367721557617, "step": 2771} +{"info/global_step": 2772, "train_info/time_within_train_step": 2.6741867065429688, "step": 2772} +{"train_info/time_between_train_steps": 0.006456851959228516, "step": 2772} +{"info/global_step": 2773, "train_info/time_within_train_step": 2.6751866340637207, "step": 2773} +{"train_info/time_between_train_steps": 0.0034444332122802734, "step": 2773} +{"info/global_step": 2774, "train_info/time_within_train_step": 2.6732797622680664, "step": 2774} +{"train_info/time_between_train_steps": 0.0035834312438964844, "step": 2774} +{"info/global_step": 2775, "train_info/time_within_train_step": 2.6735849380493164, "step": 2775} +{"train_info/time_between_train_steps": 0.0035860538482666016, "step": 2775} +{"info/global_step": 2776, "train_info/time_within_train_step": 2.6738967895507812, "step": 2776} +{"train_info/time_between_train_steps": 0.0035941600799560547, "step": 2776} +{"info/global_step": 2777, "train_info/time_within_train_step": 2.6730611324310303, "step": 2777} +{"train_info/time_between_train_steps": 0.0035734176635742188, "step": 2777} +{"info/global_step": 2778, "train_info/time_within_train_step": 2.67435884475708, "step": 2778} +{"train_info/time_between_train_steps": 0.003495931625366211, "step": 2778} +{"info/global_step": 2779, "train_info/time_within_train_step": 2.67411732673645, "step": 2779} +{"train_info/time_between_train_steps": 0.003531932830810547, "step": 2779} +{"info/global_step": 2780, "train_info/time_within_train_step": 2.831434726715088, "step": 2780} +{"train_info/time_between_train_steps": 0.0032968521118164062, "step": 2780} +{"info/global_step": 2781, "train_info/time_within_train_step": 2.672534465789795, "step": 2781} +{"train_info/time_between_train_steps": 0.0033156871795654297, "step": 2781} +{"info/global_step": 2782, "train_info/time_within_train_step": 2.6747474670410156, "step": 2782} +{"train_info/time_between_train_steps": 0.0034923553466796875, "step": 2782} +{"info/global_step": 2783, "train_info/time_within_train_step": 2.6728951930999756, "step": 2783} +{"train_info/time_between_train_steps": 0.0034461021423339844, "step": 2783} +{"info/global_step": 2784, "train_info/time_within_train_step": 2.672414541244507, "step": 2784} +{"train_info/time_between_train_steps": 0.0034406185150146484, "step": 2784} +{"info/global_step": 2785, "train_info/time_within_train_step": 2.6735682487487793, "step": 2785} +{"train_info/time_between_train_steps": 0.003491640090942383, "step": 2785} +{"info/global_step": 2786, "train_info/time_within_train_step": 2.6735949516296387, "step": 2786} +{"train_info/time_between_train_steps": 0.0034792423248291016, "step": 2786} +{"info/global_step": 2787, "train_info/time_within_train_step": 2.6800811290740967, "step": 2787} +{"train_info/time_between_train_steps": 0.0035436153411865234, "step": 2787} +{"info/global_step": 2788, "train_info/time_within_train_step": 3.00087571144104, "step": 2788} +{"train_info/time_between_train_steps": 0.003323078155517578, "step": 2788} +{"info/global_step": 2789, "train_info/time_within_train_step": 2.675536870956421, "step": 2789} +{"train_info/time_between_train_steps": 0.003348112106323242, "step": 2789} +{"info/global_step": 2790, "train_info/time_within_train_step": 2.673691749572754, "step": 2790} +{"train_info/time_between_train_steps": 0.003353595733642578, "step": 2790} +{"info/global_step": 2791, "train_info/time_within_train_step": 2.6739084720611572, "step": 2791} +{"train_info/time_between_train_steps": 0.003311634063720703, "step": 2791} +{"info/global_step": 2792, "train_info/time_within_train_step": 2.674556016921997, "step": 2792} +{"train_info/time_between_train_steps": 0.003331422805786133, "step": 2792} +{"info/global_step": 2793, "train_info/time_within_train_step": 2.675489664077759, "step": 2793} +{"train_info/time_between_train_steps": 0.00342559814453125, "step": 2793} +{"info/global_step": 2794, "train_info/time_within_train_step": 2.672917366027832, "step": 2794} +{"train_info/time_between_train_steps": 0.003290414810180664, "step": 2794} +{"info/global_step": 2795, "train_info/time_within_train_step": 2.6749520301818848, "step": 2795} +{"train_info/time_between_train_steps": 0.0033173561096191406, "step": 2795} +{"info/global_step": 2796, "train_info/time_within_train_step": 2.67398738861084, "step": 2796} +{"train_info/time_between_train_steps": 0.003298044204711914, "step": 2796} +{"info/global_step": 2797, "train_info/time_within_train_step": 2.673332929611206, "step": 2797} +{"train_info/time_between_train_steps": 0.003324747085571289, "step": 2797} +{"info/global_step": 2798, "train_info/time_within_train_step": 2.673433303833008, "step": 2798} +{"train_info/time_between_train_steps": 0.0033071041107177734, "step": 2798} +{"info/global_step": 2799, "train_info/time_within_train_step": 2.6723296642303467, "step": 2799} +{"train_info/time_between_train_steps": 0.0033142566680908203, "step": 2799} +{"info/global_step": 2800, "train_info/time_within_train_step": 2.6717753410339355, "step": 2800} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746211245, "_runtime": 8017}, "step": 2800} +{"logs": {"train/loss": 3.8868, "train/learning_rate": 4.444444444444444e-05, "train/epoch": 3.07, "_timestamp": 1746211245, "_runtime": 8017}, "step": 2800} +{"train_info/time_between_train_steps": 13.455726146697998, "step": 2800} +{"info/global_step": 2801, "train_info/time_within_train_step": 2.475414991378784, "step": 2801} +{"train_info/time_between_train_steps": 0.0035486221313476562, "step": 2801} +{"info/global_step": 2802, "train_info/time_within_train_step": 2.459937334060669, "step": 2802} +{"train_info/time_between_train_steps": 0.0032994747161865234, "step": 2802} +{"info/global_step": 2803, "train_info/time_within_train_step": 2.467282772064209, "step": 2803} +{"train_info/time_between_train_steps": 0.0033500194549560547, "step": 2803} +{"info/global_step": 2804, "train_info/time_within_train_step": 2.6424169540405273, "step": 2804} +{"train_info/time_between_train_steps": 0.00386810302734375, "step": 2804} +{"info/global_step": 2805, "train_info/time_within_train_step": 2.6722142696380615, "step": 2805} +{"train_info/time_between_train_steps": 0.003294706344604492, "step": 2805} +{"info/global_step": 2806, "train_info/time_within_train_step": 2.673942804336548, "step": 2806} +{"train_info/time_between_train_steps": 0.0033829212188720703, "step": 2806} +{"info/global_step": 2807, "train_info/time_within_train_step": 2.6737635135650635, "step": 2807} +{"train_info/time_between_train_steps": 0.00330352783203125, "step": 2807} +{"info/global_step": 2808, "train_info/time_within_train_step": 2.6747398376464844, "step": 2808} +{"train_info/time_between_train_steps": 0.0032873153686523438, "step": 2808} +{"info/global_step": 2809, "train_info/time_within_train_step": 2.6761913299560547, "step": 2809} +{"train_info/time_between_train_steps": 0.003373861312866211, "step": 2809} +{"info/global_step": 2810, "train_info/time_within_train_step": 2.6756844520568848, "step": 2810} +{"train_info/time_between_train_steps": 0.0033159255981445312, "step": 2810} +{"info/global_step": 2811, "train_info/time_within_train_step": 2.676156520843506, "step": 2811} +{"train_info/time_between_train_steps": 0.0032958984375, "step": 2811} +{"info/global_step": 2812, "train_info/time_within_train_step": 2.676577091217041, "step": 2812} +{"train_info/time_between_train_steps": 0.003376483917236328, "step": 2812} +{"info/global_step": 2813, "train_info/time_within_train_step": 2.677070379257202, "step": 2813} +{"train_info/time_between_train_steps": 0.003337860107421875, "step": 2813} +{"info/global_step": 2814, "train_info/time_within_train_step": 2.67771577835083, "step": 2814} +{"train_info/time_between_train_steps": 0.0034067630767822266, "step": 2814} +{"info/global_step": 2815, "train_info/time_within_train_step": 2.677934169769287, "step": 2815} +{"train_info/time_between_train_steps": 0.0033092498779296875, "step": 2815} +{"info/global_step": 2816, "train_info/time_within_train_step": 2.6767241954803467, "step": 2816} +{"train_info/time_between_train_steps": 0.0033655166625976562, "step": 2816} +{"info/global_step": 2817, "train_info/time_within_train_step": 2.6759374141693115, "step": 2817} +{"train_info/time_between_train_steps": 0.003309011459350586, "step": 2817} +{"info/global_step": 2818, "train_info/time_within_train_step": 2.6750235557556152, "step": 2818} +{"train_info/time_between_train_steps": 0.003289937973022461, "step": 2818} +{"info/global_step": 2819, "train_info/time_within_train_step": 2.6753365993499756, "step": 2819} +{"train_info/time_between_train_steps": 0.003293752670288086, "step": 2819} +{"info/global_step": 2820, "train_info/time_within_train_step": 2.6751859188079834, "step": 2820} +{"train_info/time_between_train_steps": 0.00328826904296875, "step": 2820} +{"info/global_step": 2821, "train_info/time_within_train_step": 2.67461895942688, "step": 2821} +{"train_info/time_between_train_steps": 0.0033550262451171875, "step": 2821} +{"info/global_step": 2822, "train_info/time_within_train_step": 2.6754250526428223, "step": 2822} +{"train_info/time_between_train_steps": 0.0033249855041503906, "step": 2822} +{"info/global_step": 2823, "train_info/time_within_train_step": 2.673578977584839, "step": 2823} +{"train_info/time_between_train_steps": 0.0033330917358398438, "step": 2823} +{"info/global_step": 2824, "train_info/time_within_train_step": 2.6749351024627686, "step": 2824} +{"train_info/time_between_train_steps": 0.0033283233642578125, "step": 2824} +{"info/global_step": 2825, "train_info/time_within_train_step": 2.674445390701294, "step": 2825} +{"train_info/time_between_train_steps": 0.003291606903076172, "step": 2825} +{"info/global_step": 2826, "train_info/time_within_train_step": 2.675069808959961, "step": 2826} +{"train_info/time_between_train_steps": 0.003299236297607422, "step": 2826} +{"info/global_step": 2827, "train_info/time_within_train_step": 2.676715135574341, "step": 2827} +{"train_info/time_between_train_steps": 0.0033125877380371094, "step": 2827} +{"info/global_step": 2828, "train_info/time_within_train_step": 2.674657106399536, "step": 2828} +{"train_info/time_between_train_steps": 0.0032989978790283203, "step": 2828} +{"info/global_step": 2829, "train_info/time_within_train_step": 2.6744425296783447, "step": 2829} +{"train_info/time_between_train_steps": 0.0032770633697509766, "step": 2829} +{"info/global_step": 2830, "train_info/time_within_train_step": 2.9103214740753174, "step": 2830} +{"train_info/time_between_train_steps": 0.003308534622192383, "step": 2830} +{"info/global_step": 2831, "train_info/time_within_train_step": 2.6722939014434814, "step": 2831} +{"train_info/time_between_train_steps": 0.0032968521118164062, "step": 2831} +{"info/global_step": 2832, "train_info/time_within_train_step": 2.673095703125, "step": 2832} +{"train_info/time_between_train_steps": 0.0032775402069091797, "step": 2832} +{"info/global_step": 2833, "train_info/time_within_train_step": 2.6753525733947754, "step": 2833} +{"train_info/time_between_train_steps": 0.003411531448364258, "step": 2833} +{"info/global_step": 2834, "train_info/time_within_train_step": 2.6732349395751953, "step": 2834} +{"train_info/time_between_train_steps": 0.003294229507446289, "step": 2834} +{"info/global_step": 2835, "train_info/time_within_train_step": 2.67378306388855, "step": 2835} +{"train_info/time_between_train_steps": 0.0033440589904785156, "step": 2835} +{"info/global_step": 2836, "train_info/time_within_train_step": 2.6726770401000977, "step": 2836} +{"train_info/time_between_train_steps": 0.003266572952270508, "step": 2836} +{"info/global_step": 2837, "train_info/time_within_train_step": 2.674532651901245, "step": 2837} +{"train_info/time_between_train_steps": 0.0033054351806640625, "step": 2837} +{"info/global_step": 2838, "train_info/time_within_train_step": 2.6737732887268066, "step": 2838} +{"train_info/time_between_train_steps": 0.0032892227172851562, "step": 2838} +{"info/global_step": 2839, "train_info/time_within_train_step": 2.674455404281616, "step": 2839} +{"train_info/time_between_train_steps": 0.0039365291595458984, "step": 2839} +{"info/global_step": 2840, "train_info/time_within_train_step": 2.674895763397217, "step": 2840} +{"train_info/time_between_train_steps": 0.0033164024353027344, "step": 2840} +{"info/global_step": 2841, "train_info/time_within_train_step": 2.674738645553589, "step": 2841} +{"train_info/time_between_train_steps": 0.003309965133666992, "step": 2841} +{"info/global_step": 2842, "train_info/time_within_train_step": 2.6734209060668945, "step": 2842} +{"train_info/time_between_train_steps": 0.12875914573669434, "step": 2842} +{"info/global_step": 2843, "train_info/time_within_train_step": 2.674870252609253, "step": 2843} +{"train_info/time_between_train_steps": 0.0033216476440429688, "step": 2843} +{"info/global_step": 2844, "train_info/time_within_train_step": 2.673433303833008, "step": 2844} +{"train_info/time_between_train_steps": 0.0038747787475585938, "step": 2844} +{"info/global_step": 2845, "train_info/time_within_train_step": 2.674550771713257, "step": 2845} +{"train_info/time_between_train_steps": 0.0032906532287597656, "step": 2845} +{"info/global_step": 2846, "train_info/time_within_train_step": 2.672471046447754, "step": 2846} +{"train_info/time_between_train_steps": 0.0032787322998046875, "step": 2846} +{"info/global_step": 2847, "train_info/time_within_train_step": 2.673945903778076, "step": 2847} +{"train_info/time_between_train_steps": 0.003276348114013672, "step": 2847} +{"info/global_step": 2848, "train_info/time_within_train_step": 2.7111763954162598, "step": 2848} +{"train_info/time_between_train_steps": 0.0036873817443847656, "step": 2848} +{"info/global_step": 2849, "train_info/time_within_train_step": 2.6741719245910645, "step": 2849} +{"train_info/time_between_train_steps": 0.0032825469970703125, "step": 2849} +{"info/global_step": 2850, "train_info/time_within_train_step": 2.6748850345611572, "step": 2850} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746211393, "_runtime": 8165}, "step": 2850} +{"logs": {"train/loss": 3.8735, "train/learning_rate": 3.333333333333333e-05, "train/epoch": 3.09, "_timestamp": 1746211393, "_runtime": 8165}, "step": 2850} +{"train_info/time_between_train_steps": 0.024411916732788086, "step": 2850} +{"info/global_step": 2851, "train_info/time_within_train_step": 2.6743199825286865, "step": 2851} +{"train_info/time_between_train_steps": 0.003262042999267578, "step": 2851} +{"info/global_step": 2852, "train_info/time_within_train_step": 2.67386794090271, "step": 2852} +{"train_info/time_between_train_steps": 0.003248929977416992, "step": 2852} +{"info/global_step": 2853, "train_info/time_within_train_step": 2.675198793411255, "step": 2853} +{"train_info/time_between_train_steps": 0.0034303665161132812, "step": 2853} +{"info/global_step": 2854, "train_info/time_within_train_step": 2.675262928009033, "step": 2854} +{"train_info/time_between_train_steps": 0.0033037662506103516, "step": 2854} +{"info/global_step": 2855, "train_info/time_within_train_step": 2.675299644470215, "step": 2855} +{"train_info/time_between_train_steps": 0.003271818161010742, "step": 2855} +{"info/global_step": 2856, "train_info/time_within_train_step": 2.6737794876098633, "step": 2856} +{"train_info/time_between_train_steps": 0.0033333301544189453, "step": 2856} +{"info/global_step": 2857, "train_info/time_within_train_step": 2.6741974353790283, "step": 2857} +{"train_info/time_between_train_steps": 0.0032625198364257812, "step": 2857} +{"info/global_step": 2858, "train_info/time_within_train_step": 2.6731672286987305, "step": 2858} +{"train_info/time_between_train_steps": 0.0032639503479003906, "step": 2858} +{"info/global_step": 2859, "train_info/time_within_train_step": 2.673030376434326, "step": 2859} +{"train_info/time_between_train_steps": 0.003305196762084961, "step": 2859} +{"info/global_step": 2860, "train_info/time_within_train_step": 2.6727523803710938, "step": 2860} +{"train_info/time_between_train_steps": 0.0032536983489990234, "step": 2860} +{"info/global_step": 2861, "train_info/time_within_train_step": 2.6724915504455566, "step": 2861} +{"train_info/time_between_train_steps": 0.0032711029052734375, "step": 2861} +{"info/global_step": 2862, "train_info/time_within_train_step": 2.6723053455352783, "step": 2862} +{"train_info/time_between_train_steps": 0.0032494068145751953, "step": 2862} +{"info/global_step": 2863, "train_info/time_within_train_step": 2.6720218658447266, "step": 2863} +{"train_info/time_between_train_steps": 0.0032906532287597656, "step": 2863} +{"info/global_step": 2864, "train_info/time_within_train_step": 2.6722002029418945, "step": 2864} +{"train_info/time_between_train_steps": 0.003308534622192383, "step": 2864} +{"info/global_step": 2865, "train_info/time_within_train_step": 2.6778147220611572, "step": 2865} +{"train_info/time_between_train_steps": 0.003272533416748047, "step": 2865} +{"info/global_step": 2866, "train_info/time_within_train_step": 2.6730997562408447, "step": 2866} +{"train_info/time_between_train_steps": 0.003282308578491211, "step": 2866} +{"info/global_step": 2867, "train_info/time_within_train_step": 2.6733176708221436, "step": 2867} +{"train_info/time_between_train_steps": 0.0033779144287109375, "step": 2867} +{"info/global_step": 2868, "train_info/time_within_train_step": 2.6737680435180664, "step": 2868} +{"train_info/time_between_train_steps": 0.003384828567504883, "step": 2868} +{"info/global_step": 2869, "train_info/time_within_train_step": 2.6742563247680664, "step": 2869} +{"train_info/time_between_train_steps": 0.0033011436462402344, "step": 2869} +{"info/global_step": 2870, "train_info/time_within_train_step": 2.673921585083008, "step": 2870} +{"train_info/time_between_train_steps": 0.003259420394897461, "step": 2870} +{"info/global_step": 2871, "train_info/time_within_train_step": 2.6736843585968018, "step": 2871} +{"train_info/time_between_train_steps": 0.0032737255096435547, "step": 2871} +{"info/global_step": 2872, "train_info/time_within_train_step": 2.6732826232910156, "step": 2872} +{"train_info/time_between_train_steps": 0.0033011436462402344, "step": 2872} +{"info/global_step": 2873, "train_info/time_within_train_step": 2.6714789867401123, "step": 2873} +{"train_info/time_between_train_steps": 0.0032644271850585938, "step": 2873} +{"info/global_step": 2874, "train_info/time_within_train_step": 2.6710500717163086, "step": 2874} +{"train_info/time_between_train_steps": 0.003299236297607422, "step": 2874} +{"info/global_step": 2875, "train_info/time_within_train_step": 2.672835111618042, "step": 2875} +{"train_info/time_between_train_steps": 0.0033164024353027344, "step": 2875} +{"info/global_step": 2876, "train_info/time_within_train_step": 2.673452377319336, "step": 2876} +{"train_info/time_between_train_steps": 0.003281116485595703, "step": 2876} +{"info/global_step": 2877, "train_info/time_within_train_step": 2.672661304473877, "step": 2877} +{"train_info/time_between_train_steps": 0.0033812522888183594, "step": 2877} +{"info/global_step": 2878, "train_info/time_within_train_step": 2.6746270656585693, "step": 2878} +{"train_info/time_between_train_steps": 0.0032470226287841797, "step": 2878} +{"info/global_step": 2879, "train_info/time_within_train_step": 2.673452138900757, "step": 2879} +{"train_info/time_between_train_steps": 0.0032656192779541016, "step": 2879} +{"info/global_step": 2880, "train_info/time_within_train_step": 2.672236204147339, "step": 2880} +{"train_info/time_between_train_steps": 0.003254413604736328, "step": 2880} +{"info/global_step": 2881, "train_info/time_within_train_step": 2.6739583015441895, "step": 2881} +{"train_info/time_between_train_steps": 0.003262042999267578, "step": 2881} +{"info/global_step": 2882, "train_info/time_within_train_step": 2.6745681762695312, "step": 2882} +{"train_info/time_between_train_steps": 0.0032851696014404297, "step": 2882} +{"info/global_step": 2883, "train_info/time_within_train_step": 2.6743054389953613, "step": 2883} +{"train_info/time_between_train_steps": 0.0032689571380615234, "step": 2883} +{"info/global_step": 2884, "train_info/time_within_train_step": 2.6731114387512207, "step": 2884} +{"train_info/time_between_train_steps": 0.00327301025390625, "step": 2884} +{"info/global_step": 2885, "train_info/time_within_train_step": 2.6737072467803955, "step": 2885} +{"train_info/time_between_train_steps": 0.003333568572998047, "step": 2885} +{"info/global_step": 2886, "train_info/time_within_train_step": 2.673020839691162, "step": 2886} +{"train_info/time_between_train_steps": 0.003271818161010742, "step": 2886} +{"info/global_step": 2887, "train_info/time_within_train_step": 2.672820568084717, "step": 2887} +{"train_info/time_between_train_steps": 0.0032677650451660156, "step": 2887} +{"info/global_step": 2888, "train_info/time_within_train_step": 2.6728482246398926, "step": 2888} +{"train_info/time_between_train_steps": 0.0032951831817626953, "step": 2888} +{"info/global_step": 2889, "train_info/time_within_train_step": 2.673778533935547, "step": 2889} +{"train_info/time_between_train_steps": 0.0032372474670410156, "step": 2889} +{"info/global_step": 2890, "train_info/time_within_train_step": 2.6729373931884766, "step": 2890} +{"train_info/time_between_train_steps": 0.003298521041870117, "step": 2890} +{"info/global_step": 2891, "train_info/time_within_train_step": 2.6738405227661133, "step": 2891} +{"train_info/time_between_train_steps": 0.0032851696014404297, "step": 2891} +{"info/global_step": 2892, "train_info/time_within_train_step": 2.673382043838501, "step": 2892} +{"train_info/time_between_train_steps": 0.0033316612243652344, "step": 2892} +{"info/global_step": 2893, "train_info/time_within_train_step": 2.6745615005493164, "step": 2893} +{"train_info/time_between_train_steps": 0.003261566162109375, "step": 2893} +{"info/global_step": 2894, "train_info/time_within_train_step": 2.674304962158203, "step": 2894} +{"train_info/time_between_train_steps": 0.0032837390899658203, "step": 2894} +{"info/global_step": 2895, "train_info/time_within_train_step": 2.6731104850769043, "step": 2895} +{"train_info/time_between_train_steps": 0.0033075809478759766, "step": 2895} +{"info/global_step": 2896, "train_info/time_within_train_step": 2.67547607421875, "step": 2896} +{"train_info/time_between_train_steps": 0.003237485885620117, "step": 2896} +{"info/global_step": 2897, "train_info/time_within_train_step": 2.6746766567230225, "step": 2897} +{"train_info/time_between_train_steps": 0.0033092498779296875, "step": 2897} +{"info/global_step": 2898, "train_info/time_within_train_step": 2.67495059967041, "step": 2898} +{"train_info/time_between_train_steps": 0.003256082534790039, "step": 2898} +{"info/global_step": 2899, "train_info/time_within_train_step": 2.676544666290283, "step": 2899} +{"train_info/time_between_train_steps": 0.003268718719482422, "step": 2899} +{"info/global_step": 2900, "train_info/time_within_train_step": 2.6738481521606445, "step": 2900} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746211528, "_runtime": 8300}, "step": 2900} +{"logs": {"train/loss": 3.8702, "train/learning_rate": 2.222222222222222e-05, "train/epoch": 3.1, "_timestamp": 1746211528, "_runtime": 8300}, "step": 2900} +{"train_info/time_between_train_steps": 12.86264157295227, "step": 2900} +{"info/global_step": 2901, "train_info/time_within_train_step": 2.469951868057251, "step": 2901} +{"train_info/time_between_train_steps": 0.0032927989959716797, "step": 2901} +{"info/global_step": 2902, "train_info/time_within_train_step": 2.462634563446045, "step": 2902} +{"train_info/time_between_train_steps": 0.0032956600189208984, "step": 2902} +{"info/global_step": 2903, "train_info/time_within_train_step": 2.5067787170410156, "step": 2903} +{"train_info/time_between_train_steps": 0.0033032894134521484, "step": 2903} +{"info/global_step": 2904, "train_info/time_within_train_step": 2.669952392578125, "step": 2904} +{"train_info/time_between_train_steps": 0.0033104419708251953, "step": 2904} +{"info/global_step": 2905, "train_info/time_within_train_step": 2.7988147735595703, "step": 2905} +{"train_info/time_between_train_steps": 0.0032720565795898438, "step": 2905} +{"info/global_step": 2906, "train_info/time_within_train_step": 2.6728663444519043, "step": 2906} +{"train_info/time_between_train_steps": 0.0033059120178222656, "step": 2906} +{"info/global_step": 2907, "train_info/time_within_train_step": 2.6744139194488525, "step": 2907} +{"train_info/time_between_train_steps": 0.0032646656036376953, "step": 2907} +{"info/global_step": 2908, "train_info/time_within_train_step": 2.67410945892334, "step": 2908} +{"train_info/time_between_train_steps": 0.0032472610473632812, "step": 2908} +{"info/global_step": 2909, "train_info/time_within_train_step": 2.6746981143951416, "step": 2909} +{"train_info/time_between_train_steps": 0.0032927989959716797, "step": 2909} +{"info/global_step": 2910, "train_info/time_within_train_step": 2.9203317165374756, "step": 2910} +{"train_info/time_between_train_steps": 0.003299236297607422, "step": 2910} +{"info/global_step": 2911, "train_info/time_within_train_step": 2.674119234085083, "step": 2911} +{"train_info/time_between_train_steps": 0.003242969512939453, "step": 2911} +{"info/global_step": 2912, "train_info/time_within_train_step": 2.6763906478881836, "step": 2912} +{"train_info/time_between_train_steps": 0.0033104419708251953, "step": 2912} +{"info/global_step": 2913, "train_info/time_within_train_step": 2.675236463546753, "step": 2913} +{"train_info/time_between_train_steps": 0.0034818649291992188, "step": 2913} +{"info/global_step": 2914, "train_info/time_within_train_step": 2.674809694290161, "step": 2914} +{"train_info/time_between_train_steps": 0.003298521041870117, "step": 2914} +{"info/global_step": 2915, "train_info/time_within_train_step": 2.676862955093384, "step": 2915} +{"train_info/time_between_train_steps": 0.0033111572265625, "step": 2915} +{"info/global_step": 2916, "train_info/time_within_train_step": 2.6763224601745605, "step": 2916} +{"train_info/time_between_train_steps": 0.003280162811279297, "step": 2916} +{"info/global_step": 2917, "train_info/time_within_train_step": 2.675705671310425, "step": 2917} +{"train_info/time_between_train_steps": 0.003271341323852539, "step": 2917} +{"info/global_step": 2918, "train_info/time_within_train_step": 2.6766841411590576, "step": 2918} +{"train_info/time_between_train_steps": 0.003298521041870117, "step": 2918} +{"info/global_step": 2919, "train_info/time_within_train_step": 2.6768665313720703, "step": 2919} +{"train_info/time_between_train_steps": 0.0033321380615234375, "step": 2919} +{"info/global_step": 2920, "train_info/time_within_train_step": 2.6760330200195312, "step": 2920} +{"train_info/time_between_train_steps": 0.0032787322998046875, "step": 2920} +{"info/global_step": 2921, "train_info/time_within_train_step": 2.6753547191619873, "step": 2921} +{"train_info/time_between_train_steps": 0.0033369064331054688, "step": 2921} +{"info/global_step": 2922, "train_info/time_within_train_step": 2.6748085021972656, "step": 2922} +{"train_info/time_between_train_steps": 0.0032067298889160156, "step": 2922} +{"info/global_step": 2923, "train_info/time_within_train_step": 2.6733739376068115, "step": 2923} +{"train_info/time_between_train_steps": 0.003297567367553711, "step": 2923} +{"info/global_step": 2924, "train_info/time_within_train_step": 2.6725246906280518, "step": 2924} +{"train_info/time_between_train_steps": 0.003276348114013672, "step": 2924} +{"info/global_step": 2925, "train_info/time_within_train_step": 2.6737048625946045, "step": 2925} +{"train_info/time_between_train_steps": 0.0032410621643066406, "step": 2925} +{"info/global_step": 2926, "train_info/time_within_train_step": 2.673428535461426, "step": 2926} +{"train_info/time_between_train_steps": 0.0032939910888671875, "step": 2926} +{"info/global_step": 2927, "train_info/time_within_train_step": 2.6723735332489014, "step": 2927} +{"train_info/time_between_train_steps": 0.003227710723876953, "step": 2927} +{"info/global_step": 2928, "train_info/time_within_train_step": 2.672102212905884, "step": 2928} +{"train_info/time_between_train_steps": 0.006630659103393555, "step": 2928} +{"info/global_step": 2929, "train_info/time_within_train_step": 2.6749329566955566, "step": 2929} +{"train_info/time_between_train_steps": 0.006627321243286133, "step": 2929} +{"info/global_step": 2930, "train_info/time_within_train_step": 2.674862861633301, "step": 2930} +{"train_info/time_between_train_steps": 0.006714582443237305, "step": 2930} +{"info/global_step": 2931, "train_info/time_within_train_step": 2.674778699874878, "step": 2931} +{"train_info/time_between_train_steps": 0.006662607192993164, "step": 2931} +{"info/global_step": 2932, "train_info/time_within_train_step": 2.675288200378418, "step": 2932} +{"train_info/time_between_train_steps": 0.006838321685791016, "step": 2932} +{"info/global_step": 2933, "train_info/time_within_train_step": 2.674196243286133, "step": 2933} +{"train_info/time_between_train_steps": 0.006676912307739258, "step": 2933} +{"info/global_step": 2934, "train_info/time_within_train_step": 2.67401123046875, "step": 2934} +{"train_info/time_between_train_steps": 0.0050313472747802734, "step": 2934} +{"info/global_step": 2935, "train_info/time_within_train_step": 2.6749465465545654, "step": 2935} +{"train_info/time_between_train_steps": 0.0032966136932373047, "step": 2935} +{"info/global_step": 2936, "train_info/time_within_train_step": 2.674363374710083, "step": 2936} +{"train_info/time_between_train_steps": 0.0032553672790527344, "step": 2936} +{"info/global_step": 2937, "train_info/time_within_train_step": 2.674668550491333, "step": 2937} +{"train_info/time_between_train_steps": 0.0032711029052734375, "step": 2937} +{"info/global_step": 2938, "train_info/time_within_train_step": 2.6743552684783936, "step": 2938} +{"train_info/time_between_train_steps": 0.0033044815063476562, "step": 2938} +{"info/global_step": 2939, "train_info/time_within_train_step": 2.6744801998138428, "step": 2939} +{"train_info/time_between_train_steps": 0.003311634063720703, "step": 2939} +{"info/global_step": 2940, "train_info/time_within_train_step": 2.674630641937256, "step": 2940} +{"train_info/time_between_train_steps": 0.003264904022216797, "step": 2940} +{"info/global_step": 2941, "train_info/time_within_train_step": 2.6735482215881348, "step": 2941} +{"train_info/time_between_train_steps": 0.0032806396484375, "step": 2941} +{"info/global_step": 2942, "train_info/time_within_train_step": 2.6737327575683594, "step": 2942} +{"train_info/time_between_train_steps": 0.006656646728515625, "step": 2942} +{"info/global_step": 2943, "train_info/time_within_train_step": 2.6744883060455322, "step": 2943} +{"train_info/time_between_train_steps": 0.0033125877380371094, "step": 2943} +{"info/global_step": 2944, "train_info/time_within_train_step": 2.677509307861328, "step": 2944} +{"train_info/time_between_train_steps": 0.003293752670288086, "step": 2944} +{"info/global_step": 2945, "train_info/time_within_train_step": 2.676260232925415, "step": 2945} +{"train_info/time_between_train_steps": 0.003285646438598633, "step": 2945} +{"info/global_step": 2946, "train_info/time_within_train_step": 2.6737890243530273, "step": 2946} +{"train_info/time_between_train_steps": 0.0032880306243896484, "step": 2946} +{"info/global_step": 2947, "train_info/time_within_train_step": 2.6731503009796143, "step": 2947} +{"train_info/time_between_train_steps": 0.0032851696014404297, "step": 2947} +{"info/global_step": 2948, "train_info/time_within_train_step": 2.6744120121002197, "step": 2948} +{"train_info/time_between_train_steps": 0.003238201141357422, "step": 2948} +{"info/global_step": 2949, "train_info/time_within_train_step": 2.9271421432495117, "step": 2949} +{"train_info/time_between_train_steps": 0.00330352783203125, "step": 2949} +{"info/global_step": 2950, "train_info/time_within_train_step": 2.6737253665924072, "step": 2950} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746211676, "_runtime": 8448}, "step": 2950} +{"logs": {"train/loss": 3.8562, "train/learning_rate": 1.111111111111111e-05, "train/epoch": 3.12, "_timestamp": 1746211676, "_runtime": 8448}, "step": 2950} +{"train_info/time_between_train_steps": 0.0240631103515625, "step": 2950} +{"info/global_step": 2951, "train_info/time_within_train_step": 2.672407865524292, "step": 2951} +{"train_info/time_between_train_steps": 0.0033104419708251953, "step": 2951} +{"info/global_step": 2952, "train_info/time_within_train_step": 2.6729068756103516, "step": 2952} +{"train_info/time_between_train_steps": 0.00666356086730957, "step": 2952} +{"info/global_step": 2953, "train_info/time_within_train_step": 2.672938108444214, "step": 2953} +{"train_info/time_between_train_steps": 0.006668806076049805, "step": 2953} +{"info/global_step": 2954, "train_info/time_within_train_step": 2.6725687980651855, "step": 2954} +{"train_info/time_between_train_steps": 0.0033197402954101562, "step": 2954} +{"info/global_step": 2955, "train_info/time_within_train_step": 2.709916591644287, "step": 2955} +{"train_info/time_between_train_steps": 0.0033211708068847656, "step": 2955} +{"info/global_step": 2956, "train_info/time_within_train_step": 2.673344612121582, "step": 2956} +{"train_info/time_between_train_steps": 0.0035076141357421875, "step": 2956} +{"info/global_step": 2957, "train_info/time_within_train_step": 2.6744368076324463, "step": 2957} +{"train_info/time_between_train_steps": 0.0033152103424072266, "step": 2957} +{"info/global_step": 2958, "train_info/time_within_train_step": 2.6734633445739746, "step": 2958} +{"train_info/time_between_train_steps": 0.003254413604736328, "step": 2958} +{"info/global_step": 2959, "train_info/time_within_train_step": 2.673030376434326, "step": 2959} +{"train_info/time_between_train_steps": 0.0032677650451660156, "step": 2959} +{"info/global_step": 2960, "train_info/time_within_train_step": 2.6735923290252686, "step": 2960} +{"train_info/time_between_train_steps": 0.003281831741333008, "step": 2960} +{"info/global_step": 2961, "train_info/time_within_train_step": 2.673970937728882, "step": 2961} +{"train_info/time_between_train_steps": 0.003242969512939453, "step": 2961} +{"info/global_step": 2962, "train_info/time_within_train_step": 2.6736879348754883, "step": 2962} +{"train_info/time_between_train_steps": 0.00360107421875, "step": 2962} +{"info/global_step": 2963, "train_info/time_within_train_step": 2.671766519546509, "step": 2963} +{"train_info/time_between_train_steps": 0.0032167434692382812, "step": 2963} +{"info/global_step": 2964, "train_info/time_within_train_step": 2.6744015216827393, "step": 2964} +{"train_info/time_between_train_steps": 0.0032987594604492188, "step": 2964} +{"info/global_step": 2965, "train_info/time_within_train_step": 2.672804117202759, "step": 2965} +{"train_info/time_between_train_steps": 0.0033829212188720703, "step": 2965} +{"info/global_step": 2966, "train_info/time_within_train_step": 2.674408435821533, "step": 2966} +{"train_info/time_between_train_steps": 0.003274679183959961, "step": 2966} +{"info/global_step": 2967, "train_info/time_within_train_step": 2.672597885131836, "step": 2967} +{"train_info/time_between_train_steps": 0.1378796100616455, "step": 2967} +{"info/global_step": 2968, "train_info/time_within_train_step": 2.6715950965881348, "step": 2968} +{"train_info/time_between_train_steps": 0.0033066272735595703, "step": 2968} +{"info/global_step": 2969, "train_info/time_within_train_step": 2.672774076461792, "step": 2969} +{"train_info/time_between_train_steps": 0.00334930419921875, "step": 2969} +{"info/global_step": 2970, "train_info/time_within_train_step": 2.6731839179992676, "step": 2970} +{"train_info/time_between_train_steps": 0.0033791065216064453, "step": 2970} +{"info/global_step": 2971, "train_info/time_within_train_step": 2.673473596572876, "step": 2971} +{"train_info/time_between_train_steps": 0.0032854080200195312, "step": 2971} +{"info/global_step": 2972, "train_info/time_within_train_step": 2.6730213165283203, "step": 2972} +{"train_info/time_between_train_steps": 0.003292560577392578, "step": 2972} +{"info/global_step": 2973, "train_info/time_within_train_step": 2.673793315887451, "step": 2973} +{"train_info/time_between_train_steps": 0.0033206939697265625, "step": 2973} +{"info/global_step": 2974, "train_info/time_within_train_step": 2.6740007400512695, "step": 2974} +{"train_info/time_between_train_steps": 0.003316640853881836, "step": 2974} +{"info/global_step": 2975, "train_info/time_within_train_step": 2.6738672256469727, "step": 2975} +{"train_info/time_between_train_steps": 0.0039479732513427734, "step": 2975} +{"info/global_step": 2976, "train_info/time_within_train_step": 2.673654794692993, "step": 2976} +{"train_info/time_between_train_steps": 0.003297567367553711, "step": 2976} +{"info/global_step": 2977, "train_info/time_within_train_step": 2.672657012939453, "step": 2977} +{"train_info/time_between_train_steps": 0.006722450256347656, "step": 2977} +{"info/global_step": 2978, "train_info/time_within_train_step": 2.6728098392486572, "step": 2978} +{"train_info/time_between_train_steps": 0.0032944679260253906, "step": 2978} +{"info/global_step": 2979, "train_info/time_within_train_step": 2.671910524368286, "step": 2979} +{"train_info/time_between_train_steps": 0.003301382064819336, "step": 2979} +{"info/global_step": 2980, "train_info/time_within_train_step": 2.6710433959960938, "step": 2980} +{"train_info/time_between_train_steps": 0.00327301025390625, "step": 2980} +{"info/global_step": 2981, "train_info/time_within_train_step": 2.671895742416382, "step": 2981} +{"train_info/time_between_train_steps": 0.00663304328918457, "step": 2981} +{"info/global_step": 2982, "train_info/time_within_train_step": 2.6709811687469482, "step": 2982} +{"train_info/time_between_train_steps": 0.0066416263580322266, "step": 2982} +{"info/global_step": 2983, "train_info/time_within_train_step": 2.671318769454956, "step": 2983} +{"train_info/time_between_train_steps": 0.0032663345336914062, "step": 2983} +{"info/global_step": 2984, "train_info/time_within_train_step": 2.674368381500244, "step": 2984} +{"train_info/time_between_train_steps": 0.003305196762084961, "step": 2984} +{"info/global_step": 2985, "train_info/time_within_train_step": 2.672945976257324, "step": 2985} +{"train_info/time_between_train_steps": 0.0032830238342285156, "step": 2985} +{"info/global_step": 2986, "train_info/time_within_train_step": 2.6725594997406006, "step": 2986} +{"train_info/time_between_train_steps": 0.0032503604888916016, "step": 2986} +{"info/global_step": 2987, "train_info/time_within_train_step": 2.6733450889587402, "step": 2987} +{"train_info/time_between_train_steps": 0.003297567367553711, "step": 2987} +{"info/global_step": 2988, "train_info/time_within_train_step": 2.672912359237671, "step": 2988} +{"train_info/time_between_train_steps": 0.003325939178466797, "step": 2988} +{"info/global_step": 2989, "train_info/time_within_train_step": 2.930034637451172, "step": 2989} +{"train_info/time_between_train_steps": 0.003369569778442383, "step": 2989} +{"info/global_step": 2990, "train_info/time_within_train_step": 2.673647165298462, "step": 2990} +{"train_info/time_between_train_steps": 0.003334522247314453, "step": 2990} +{"info/global_step": 2991, "train_info/time_within_train_step": 2.6737053394317627, "step": 2991} +{"train_info/time_between_train_steps": 0.0033197402954101562, "step": 2991} +{"info/global_step": 2992, "train_info/time_within_train_step": 2.6756818294525146, "step": 2992} +{"train_info/time_between_train_steps": 0.0032961368560791016, "step": 2992} +{"info/global_step": 2993, "train_info/time_within_train_step": 2.674839735031128, "step": 2993} +{"train_info/time_between_train_steps": 0.0032978057861328125, "step": 2993} +{"info/global_step": 2994, "train_info/time_within_train_step": 2.6723556518554688, "step": 2994} +{"train_info/time_between_train_steps": 0.003328084945678711, "step": 2994} +{"info/global_step": 2995, "train_info/time_within_train_step": 2.6739797592163086, "step": 2995} +{"train_info/time_between_train_steps": 0.006636381149291992, "step": 2995} +{"info/global_step": 2996, "train_info/time_within_train_step": 2.6732475757598877, "step": 2996} +{"train_info/time_between_train_steps": 0.006673574447631836, "step": 2996} +{"info/global_step": 2997, "train_info/time_within_train_step": 2.6735188961029053, "step": 2997} +{"train_info/time_between_train_steps": 0.0033397674560546875, "step": 2997} +{"info/global_step": 2998, "train_info/time_within_train_step": 2.6724114418029785, "step": 2998} +{"train_info/time_between_train_steps": 0.0033111572265625, "step": 2998} +{"info/global_step": 2999, "train_info/time_within_train_step": 2.674823045730591, "step": 2999} +{"train_info/time_between_train_steps": 0.003274679183959961, "step": 2999} +{"info/global_step": 3000, "train_info/time_within_train_step": 3.2423219680786133, "step": 3000} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746211812, "_runtime": 8584}, "step": 3000} +{"logs": {"train/loss": 3.8499, "train/learning_rate": 0.0, "train/epoch": 3.14, "_timestamp": 1746211812, "_runtime": 8584}, "step": 3000} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746211817, "_runtime": 8589}, "step": 3000} +{"logs": {"eval/loss": 4.346645832061768, "eval/runtime": 5.5742, "eval/samples_per_second": 36.239, "eval/steps_per_second": 1.256, "train/epoch": 3.14, "_timestamp": 1746211817, "_runtime": 8589}, "step": 3000} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746211817, "_runtime": 8589}, "step": 3000} +{"logs": {"eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_loss": 4.346645832061768, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_ppl": 77.21902249563382, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_runtime": 5.5742, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_samples_per_second": 36.239, "train/epoch": 3.14, "_timestamp": 1746211817, "_runtime": 8589}, "step": 3000} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746211830, "_runtime": 8602}, "step": 3000} +{"logs": {"train/train_runtime": 8603.7053, "train/train_samples_per_second": 22.316, "train/train_steps_per_second": 0.349, "train/total_flos": 2.5088738328576e+16, "train/train_loss": 4.561715702692668, "train/epoch": 3.14, "_timestamp": 1746211830, "_runtime": 8602}, "step": 3000} +{"train_info": {"train_info/memory_allocated": 1681.771484375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746211840, "_runtime": 8612}, "step": 3000} +{"logs": {"eval/loss": 4.346645832061768, "eval/runtime": 5.1251, "eval/samples_per_second": 39.414, "eval/steps_per_second": 1.366, "train/epoch": 3.14, "_timestamp": 1746211840, "_runtime": 8612}, "step": 3000} +{"train_info": {"train_info/memory_allocated": 1681.771484375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746211840, "_runtime": 8612}, "step": 3000} +{"logs": {"eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_loss": 4.346645832061768, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_ppl": 77.21902249563382, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_runtime": 5.1251, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_samples_per_second": 39.414, "train/epoch": 3.14, "_timestamp": 1746211840, "_runtime": 8612}, "step": 3000}